diff --git "a/wandb/run-20220317_164114-2vzd8l55/files/wandb-summary.json" "b/wandb/run-20220317_164114-2vzd8l55/files/wandb-summary.json" --- "a/wandb/run-20220317_164114-2vzd8l55/files/wandb-summary.json" +++ "b/wandb/run-20220317_164114-2vzd8l55/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.4205, "train/learning_rate": 9.11104513064133e-05, "train/epoch": 2.8, "train/global_step": 2500, "_runtime": 16487, "_timestamp": 1647551761, "_step": 2500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 17.0, 53.0, 89.0, 171.0, 221.0, 186.0, 140.0, 77.0, 31.0, 12.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.7315673828125, -103.61234283447266, -101.49312591552734, -99.3739013671875, -97.25468444824219, -95.13545989990234, -93.01624298095703, -90.89701843261719, -88.77780151367188, -86.65857696533203, -84.53936004638672, -82.42013549804688, -80.30091857910156, -78.18169403076172, -76.0624771118164, -73.94325256347656, -71.82403564453125, -69.7048110961914, -67.5855941772461, -65.46636962890625, -63.34715270996094, -61.22793197631836, -59.10871124267578, -56.98948669433594, -54.870262145996094, -52.751041412353516, -50.63182067871094, -48.51259994506836, -46.39337921142578, -44.2741584777832, -42.154937744140625, -40.03571319580078, -37.9164924621582, -35.797271728515625, -33.67805099487305, -31.55883026123047, -29.43960952758789, -27.320388793945312, -25.2011661529541, -23.081945419311523, -20.962724685668945, -18.843503952026367, -16.72428321838379, -14.605061531066895, -12.485840797424316, -10.366620063781738, -8.247398376464844, -6.128177642822266, -4.0089569091796875, -1.8897359371185303, 0.22948503494262695, 2.3487062454223633, 4.467926979064941, 6.5871477127075195, 8.706369400024414, 10.825590133666992, 12.94481086730957, 15.064031600952148, 17.183252334594727, 19.302474975585938, 21.421695709228516, 23.540916442871094, 25.660137176513672, 27.77935791015625, 29.898578643798828]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 7.0, 15.0, 13.0, 6.0, 8.0, 14.0, 12.0, 16.0, 21.0, 28.0, 37.0, 26.0, 40.0, 31.0, 44.0, 43.0, 52.0, 41.0, 42.0, 53.0, 44.0, 37.0, 37.0, 48.0, 38.0, 30.0, 29.0, 26.0, 19.0, 18.0, 23.0, 16.0, 19.0, 7.0, 7.0, 10.0, 8.0, 6.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.37346649169922, -50.87981414794922, -49.38616180419922, -47.89250946044922, -46.39885711669922, -44.90520477294922, -43.41155242919922, -41.91790008544922, -40.42424774169922, -38.93059539794922, -37.43694305419922, -35.94329071044922, -34.44963836669922, -32.95598602294922, -31.46233558654785, -29.96868324279785, -28.475032806396484, -26.981380462646484, -25.487728118896484, -23.994075775146484, -22.500423431396484, -21.006771087646484, -19.513120651245117, -18.019468307495117, -16.525815963745117, -15.032163619995117, -13.538511276245117, -12.044859886169434, -10.551207542419434, -9.057555198669434, -7.56390380859375, -6.07025146484375, -4.576595306396484, -3.0829432010650635, -1.5892910957336426, -0.09563922882080078, 1.3980131149291992, 2.891665458679199, 4.385316848754883, 5.878969192504883, 7.372621536254883, 8.866273880004883, 10.359926223754883, 11.853577613830566, 13.347229957580566, 14.840882301330566, 16.33453369140625, 17.82818603515625, 19.32183837890625, 20.81549072265625, 22.30914306640625, 23.80279541015625, 25.29644775390625, 26.79010009765625, 28.283750534057617, 29.777402877807617, 31.271055221557617, 32.764705657958984, 34.258358001708984, 35.752010345458984, 37.245662689208984, 38.739315032958984, 40.232967376708984, 41.726619720458984, 43.220272064208984]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 4.0, 8.0, 10.0, 10.0, 8.0, 16.0, 12.0, 15.0, 13.0, 12.0, 18.0, 22.0, 28.0, 23.0, 38.0, 37.0, 49.0, 40.0, 31.0, 35.0, 51.0, 35.0, 50.0, 29.0, 48.0, 47.0, 42.0, 41.0, 23.0, 31.0, 18.0, 16.0, 24.0, 12.0, 12.0, 8.0, 15.0, 15.0, 13.0, 5.0, 12.0, 7.0, 3.0, 6.0, 0.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0859375, -2.02142333984375, -1.9569091796875, -1.89239501953125, -1.827880859375, -1.76336669921875, -1.6988525390625, -1.63433837890625, -1.56982421875, -1.50531005859375, -1.4407958984375, -1.37628173828125, -1.311767578125, -1.24725341796875, -1.1827392578125, -1.11822509765625, -1.0537109375, -0.98919677734375, -0.9246826171875, -0.86016845703125, -0.795654296875, -0.73114013671875, -0.6666259765625, -0.60211181640625, -0.53759765625, -0.47308349609375, -0.4085693359375, -0.34405517578125, -0.279541015625, -0.21502685546875, -0.1505126953125, -0.08599853515625, -0.021484375, 0.04302978515625, 0.1075439453125, 0.17205810546875, 0.236572265625, 0.30108642578125, 0.3656005859375, 0.43011474609375, 0.49462890625, 0.55914306640625, 0.6236572265625, 0.68817138671875, 0.752685546875, 0.81719970703125, 0.8817138671875, 0.94622802734375, 1.0107421875, 1.07525634765625, 1.1397705078125, 1.20428466796875, 1.268798828125, 1.33331298828125, 1.3978271484375, 1.46234130859375, 1.52685546875, 1.59136962890625, 1.6558837890625, 1.72039794921875, 1.784912109375, 1.84942626953125, 1.9139404296875, 1.97845458984375, 2.04296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 12.0, 9.0, 13.0, 20.0, 30.0, 43.0, 53.0, 60.0, 87.0, 167.0, 227.0, 405.0, 706.0, 1319.0, 2874.0, 6862.0, 21120.0, 93226.0, 674037.0, 2707966.0, 571230.0, 83031.0, 19230.0, 6198.0, 2497.0, 1184.0, 611.0, 373.0, 225.0, 137.0, 83.0, 54.0, 67.0, 32.0, 29.0, 18.0, 17.0, 9.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09375, -6.82568359375, -6.5576171875, -6.28955078125, -6.021484375, -5.75341796875, -5.4853515625, -5.21728515625, -4.94921875, -4.68115234375, -4.4130859375, -4.14501953125, -3.876953125, -3.60888671875, -3.3408203125, -3.07275390625, -2.8046875, -2.53662109375, -2.2685546875, -2.00048828125, -1.732421875, -1.46435546875, -1.1962890625, -0.92822265625, -0.66015625, -0.39208984375, -0.1240234375, 0.14404296875, 0.412109375, 0.68017578125, 0.9482421875, 1.21630859375, 1.484375, 1.75244140625, 2.0205078125, 2.28857421875, 2.556640625, 2.82470703125, 3.0927734375, 3.36083984375, 3.62890625, 3.89697265625, 4.1650390625, 4.43310546875, 4.701171875, 4.96923828125, 5.2373046875, 5.50537109375, 5.7734375, 6.04150390625, 6.3095703125, 6.57763671875, 6.845703125, 7.11376953125, 7.3818359375, 7.64990234375, 7.91796875, 8.18603515625, 8.4541015625, 8.72216796875, 8.990234375, 9.25830078125, 9.5263671875, 9.79443359375, 10.0625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 8.0, 8.0, 14.0, 18.0, 54.0, 62.0, 117.0, 192.0, 326.0, 512.0, 715.0, 675.0, 500.0, 341.0, 213.0, 124.0, 90.0, 45.0, 26.0, 19.0, 11.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.875, -12.4302978515625, -11.985595703125, -11.5408935546875, -11.09619140625, -10.6514892578125, -10.206787109375, -9.7620849609375, -9.3173828125, -8.8726806640625, -8.427978515625, -7.9832763671875, -7.53857421875, -7.0938720703125, -6.649169921875, -6.2044677734375, -5.759765625, -5.3150634765625, -4.870361328125, -4.4256591796875, -3.98095703125, -3.5362548828125, -3.091552734375, -2.6468505859375, -2.2021484375, -1.7574462890625, -1.312744140625, -0.8680419921875, -0.42333984375, 0.0213623046875, 0.466064453125, 0.9107666015625, 1.35546875, 1.8001708984375, 2.244873046875, 2.6895751953125, 3.13427734375, 3.5789794921875, 4.023681640625, 4.4683837890625, 4.9130859375, 5.3577880859375, 5.802490234375, 6.2471923828125, 6.69189453125, 7.1365966796875, 7.581298828125, 8.0260009765625, 8.470703125, 8.9154052734375, 9.360107421875, 9.8048095703125, 10.24951171875, 10.6942138671875, 11.138916015625, 11.5836181640625, 12.0283203125, 12.4730224609375, 12.917724609375, 13.3624267578125, 13.80712890625, 14.2518310546875, 14.696533203125, 15.1412353515625, 15.5859375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 5.0, 20.0, 41.0, 54.0, 125.0, 221.0, 451.0, 917.0, 2143.0, 8867.0, 750794.0, 3399096.0, 25982.0, 3152.0, 1250.0, 547.0, 285.0, 143.0, 68.0, 46.0, 27.0, 10.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.28125, -37.0126953125, -35.744140625, -34.4755859375, -33.20703125, -31.9384765625, -30.669921875, -29.4013671875, -28.1328125, -26.8642578125, -25.595703125, -24.3271484375, -23.05859375, -21.7900390625, -20.521484375, -19.2529296875, -17.984375, -16.7158203125, -15.447265625, -14.1787109375, -12.91015625, -11.6416015625, -10.373046875, -9.1044921875, -7.8359375, -6.5673828125, -5.298828125, -4.0302734375, -2.76171875, -1.4931640625, -0.224609375, 1.0439453125, 2.3125, 3.5810546875, 4.849609375, 6.1181640625, 7.38671875, 8.6552734375, 9.923828125, 11.1923828125, 12.4609375, 13.7294921875, 14.998046875, 16.2666015625, 17.53515625, 18.8037109375, 20.072265625, 21.3408203125, 22.609375, 23.8779296875, 25.146484375, 26.4150390625, 27.68359375, 28.9521484375, 30.220703125, 31.4892578125, 32.7578125, 34.0263671875, 35.294921875, 36.5634765625, 37.83203125, 39.1005859375, 40.369140625, 41.6376953125, 42.90625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 129.0, 528.0, 312.0, 41.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-275.53656005859375, -270.3975524902344, -265.2585754394531, -260.11956787109375, -254.98056030273438, -249.84156799316406, -244.70257568359375, -239.56356811523438, -234.42457580566406, -229.28558349609375, -224.14657592773438, -219.00758361816406, -213.8685760498047, -208.72958374023438, -203.590576171875, -198.4515838623047, -193.31259155273438, -188.17359924316406, -183.0345916748047, -177.89559936523438, -172.756591796875, -167.6175994873047, -162.47860717773438, -157.339599609375, -152.20059204101562, -147.0615997314453, -141.92259216308594, -136.78359985351562, -131.64459228515625, -126.50559997558594, -121.3666000366211, -116.22760009765625, -111.08860778808594, -105.9496078491211, -100.81060791015625, -95.67161560058594, -90.5326156616211, -85.39361572265625, -80.2546157836914, -75.11561584472656, -69.97662353515625, -64.8376235961914, -59.69862747192383, -54.559627532958984, -49.420631408691406, -44.28163146972656, -39.14263153076172, -34.00363540649414, -28.86463165283203, -23.72563362121582, -18.58663558959961, -13.447635650634766, -8.308637619018555, -3.1696395874023438, 1.9693603515625, 7.108356475830078, 12.247356414794922, 17.386354446411133, 22.525352478027344, 27.664352416992188, 32.80335235595703, 37.94234848022461, 43.08134841918945, 48.22034454345703, 53.359344482421875]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 8.0, 8.0, 7.0, 10.0, 12.0, 14.0, 15.0, 20.0, 19.0, 22.0, 27.0, 44.0, 30.0, 40.0, 45.0, 39.0, 41.0, 49.0, 54.0, 52.0, 44.0, 51.0, 54.0, 40.0, 43.0, 28.0, 24.0, 41.0, 26.0, 21.0, 22.0, 15.0, 13.0, 6.0, 1.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-50.03572463989258, -48.73379135131836, -47.431861877441406, -46.12992858886719, -44.82799530029297, -43.52606201171875, -42.22412872314453, -40.92219924926758, -39.62026596069336, -38.31833267211914, -37.01640319824219, -35.71446990966797, -34.41253662109375, -33.11060333251953, -31.808671951293945, -30.50674057006836, -29.20480728149414, -27.902873992919922, -26.600942611694336, -25.29901123046875, -23.99707794189453, -22.695144653320312, -21.393213272094727, -20.09128189086914, -18.789348602294922, -17.487415313720703, -16.185483932495117, -14.883551597595215, -13.581619262695312, -12.27968692779541, -10.977754592895508, -9.675822257995605, -8.373893737792969, -7.071961402893066, -5.770029067993164, -4.468096733093262, -3.1661643981933594, -1.864232063293457, -0.5622997283935547, 0.7396326065063477, 2.04156494140625, 3.3434972763061523, 4.645429611206055, 5.947361946105957, 7.249294281005859, 8.551226615905762, 9.853158950805664, 11.155091285705566, 12.457023620605469, 13.758955955505371, 15.060888290405273, 16.36281967163086, 17.664752960205078, 18.966686248779297, 20.268617630004883, 21.57054901123047, 22.872482299804688, 24.174415588378906, 25.476346969604492, 26.778278350830078, 28.080211639404297, 29.382144927978516, 30.6840763092041, 31.986007690429688, 33.287940979003906]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 9.0, 8.0, 15.0, 15.0, 23.0, 25.0, 22.0, 27.0, 22.0, 25.0, 33.0, 38.0, 49.0, 48.0, 48.0, 65.0, 45.0, 52.0, 37.0, 45.0, 54.0, 21.0, 38.0, 32.0, 34.0, 25.0, 21.0, 26.0, 22.0, 14.0, 7.0, 7.0, 10.0, 2.0, 11.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.494140625, -2.41485595703125, -2.3355712890625, -2.25628662109375, -2.177001953125, -2.09771728515625, -2.0184326171875, -1.93914794921875, -1.85986328125, -1.78057861328125, -1.7012939453125, -1.62200927734375, -1.542724609375, -1.46343994140625, -1.3841552734375, -1.30487060546875, -1.2255859375, -1.14630126953125, -1.0670166015625, -0.98773193359375, -0.908447265625, -0.82916259765625, -0.7498779296875, -0.67059326171875, -0.59130859375, -0.51202392578125, -0.4327392578125, -0.35345458984375, -0.274169921875, -0.19488525390625, -0.1156005859375, -0.03631591796875, 0.04296875, 0.12225341796875, 0.2015380859375, 0.28082275390625, 0.360107421875, 0.43939208984375, 0.5186767578125, 0.59796142578125, 0.67724609375, 0.75653076171875, 0.8358154296875, 0.91510009765625, 0.994384765625, 1.07366943359375, 1.1529541015625, 1.23223876953125, 1.3115234375, 1.39080810546875, 1.4700927734375, 1.54937744140625, 1.628662109375, 1.70794677734375, 1.7872314453125, 1.86651611328125, 1.94580078125, 2.02508544921875, 2.1043701171875, 2.18365478515625, 2.262939453125, 2.34222412109375, 2.4215087890625, 2.50079345703125, 2.580078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 11.0, 12.0, 24.0, 24.0, 41.0, 73.0, 145.0, 225.0, 381.0, 748.0, 1518.0, 2830.0, 5896.0, 12414.0, 26106.0, 55584.0, 111675.0, 196342.0, 252858.0, 184523.0, 101379.0, 49924.0, 23764.0, 11245.0, 5379.0, 2613.0, 1285.0, 647.0, 340.0, 197.0, 139.0, 74.0, 59.0, 25.0, 17.0, 10.0, 7.0, 6.0, 6.0, 7.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.31640625, -1.2792510986328125, -1.242095947265625, -1.2049407958984375, -1.16778564453125, -1.1306304931640625, -1.093475341796875, -1.0563201904296875, -1.0191650390625, -0.9820098876953125, -0.944854736328125, -0.9076995849609375, -0.87054443359375, -0.8333892822265625, -0.796234130859375, -0.7590789794921875, -0.721923828125, -0.6847686767578125, -0.647613525390625, -0.6104583740234375, -0.57330322265625, -0.5361480712890625, -0.498992919921875, -0.4618377685546875, -0.4246826171875, -0.3875274658203125, -0.350372314453125, -0.3132171630859375, -0.27606201171875, -0.2389068603515625, -0.201751708984375, -0.1645965576171875, -0.12744140625, -0.0902862548828125, -0.053131103515625, -0.0159759521484375, 0.02117919921875, 0.0583343505859375, 0.095489501953125, 0.1326446533203125, 0.1697998046875, 0.2069549560546875, 0.244110107421875, 0.2812652587890625, 0.31842041015625, 0.3555755615234375, 0.392730712890625, 0.4298858642578125, 0.467041015625, 0.5041961669921875, 0.541351318359375, 0.5785064697265625, 0.61566162109375, 0.6528167724609375, 0.689971923828125, 0.7271270751953125, 0.7642822265625, 0.8014373779296875, 0.838592529296875, 0.8757476806640625, 0.91290283203125, 0.9500579833984375, 0.987213134765625, 1.0243682861328125, 1.0615234375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 8.0, 5.0, 10.0, 17.0, 13.0, 9.0, 16.0, 10.0, 24.0, 15.0, 27.0, 23.0, 32.0, 27.0, 28.0, 34.0, 25.0, 38.0, 46.0, 39.0, 24.0, 1051.0, 42.0, 42.0, 36.0, 21.0, 40.0, 35.0, 27.0, 36.0, 29.0, 20.0, 26.0, 22.0, 20.0, 16.0, 11.0, 12.0, 11.0, 11.0, 8.0, 6.0, 8.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-1.7939453125, -1.7387542724609375, -1.683563232421875, -1.6283721923828125, -1.57318115234375, -1.5179901123046875, -1.462799072265625, -1.4076080322265625, -1.3524169921875, -1.2972259521484375, -1.242034912109375, -1.1868438720703125, -1.13165283203125, -1.0764617919921875, -1.021270751953125, -0.9660797119140625, -0.910888671875, -0.8556976318359375, -0.800506591796875, -0.7453155517578125, -0.69012451171875, -0.6349334716796875, -0.579742431640625, -0.5245513916015625, -0.4693603515625, -0.4141693115234375, -0.358978271484375, -0.3037872314453125, -0.24859619140625, -0.1934051513671875, -0.138214111328125, -0.0830230712890625, -0.02783203125, 0.0273590087890625, 0.082550048828125, 0.1377410888671875, 0.19293212890625, 0.2481231689453125, 0.303314208984375, 0.3585052490234375, 0.4136962890625, 0.4688873291015625, 0.524078369140625, 0.5792694091796875, 0.63446044921875, 0.6896514892578125, 0.744842529296875, 0.8000335693359375, 0.855224609375, 0.9104156494140625, 0.965606689453125, 1.0207977294921875, 1.07598876953125, 1.1311798095703125, 1.186370849609375, 1.2415618896484375, 1.2967529296875, 1.3519439697265625, 1.407135009765625, 1.4623260498046875, 1.51751708984375, 1.5727081298828125, 1.627899169921875, 1.6830902099609375, 1.73828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 6.0, 5.0, 7.0, 10.0, 6.0, 6.0, 13.0, 11.0, 16.0, 19.0, 18.0, 36.0, 72.0, 136.0, 299.0, 807.0, 2231.0, 7031.0, 23283.0, 148922.0, 1875400.0, 26809.0, 7777.0, 2593.0, 874.0, 340.0, 137.0, 79.0, 48.0, 26.0, 18.0, 21.0, 9.0, 14.0, 9.0, 9.0, 6.0, 8.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.50128173828125, -2.4088134765625, -2.31634521484375, -2.223876953125, -2.13140869140625, -2.0389404296875, -1.94647216796875, -1.85400390625, -1.76153564453125, -1.6690673828125, -1.57659912109375, -1.484130859375, -1.39166259765625, -1.2991943359375, -1.20672607421875, -1.1142578125, -1.02178955078125, -0.9293212890625, -0.83685302734375, -0.744384765625, -0.65191650390625, -0.5594482421875, -0.46697998046875, -0.37451171875, -0.28204345703125, -0.1895751953125, -0.09710693359375, -0.004638671875, 0.08782958984375, 0.1802978515625, 0.27276611328125, 0.365234375, 0.45770263671875, 0.5501708984375, 0.64263916015625, 0.735107421875, 0.82757568359375, 0.9200439453125, 1.01251220703125, 1.10498046875, 1.19744873046875, 1.2899169921875, 1.38238525390625, 1.474853515625, 1.56732177734375, 1.6597900390625, 1.75225830078125, 1.8447265625, 1.93719482421875, 2.0296630859375, 2.12213134765625, 2.214599609375, 2.30706787109375, 2.3995361328125, 2.49200439453125, 2.58447265625, 2.67694091796875, 2.7694091796875, 2.86187744140625, 2.954345703125, 3.04681396484375, 3.1392822265625, 3.23175048828125, 3.32421875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 11.0, 7.0, 6.0, 11.0, 15.0, 26.0, 27.0, 25.0, 20.0, 29.0, 39.0, 82.0, 90.0, 124.0, 115.0, 100.0, 53.0, 34.0, 32.0, 20.0, 22.0, 14.0, 13.0, 13.0, 10.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.040252685546875, -0.03908681869506836, -0.03792095184326172, -0.03675508499145508, -0.03558921813964844, -0.0344233512878418, -0.033257484436035156, -0.032091617584228516, -0.030925750732421875, -0.029759883880615234, -0.028594017028808594, -0.027428150177001953, -0.026262283325195312, -0.025096416473388672, -0.02393054962158203, -0.02276468276977539, -0.02159881591796875, -0.02043294906616211, -0.01926708221435547, -0.018101215362548828, -0.016935348510742188, -0.015769481658935547, -0.014603614807128906, -0.013437747955322266, -0.012271881103515625, -0.011106014251708984, -0.009940147399902344, -0.008774280548095703, -0.0076084136962890625, -0.006442546844482422, -0.005276679992675781, -0.004110813140869141, -0.0029449462890625, -0.0017790794372558594, -0.0006132125854492188, 0.0005526542663574219, 0.0017185211181640625, 0.002884387969970703, 0.004050254821777344, 0.005216121673583984, 0.006381988525390625, 0.007547855377197266, 0.008713722229003906, 0.009879589080810547, 0.011045455932617188, 0.012211322784423828, 0.013377189636230469, 0.01454305648803711, 0.01570892333984375, 0.01687479019165039, 0.01804065704345703, 0.019206523895263672, 0.020372390747070312, 0.021538257598876953, 0.022704124450683594, 0.023869991302490234, 0.025035858154296875, 0.026201725006103516, 0.027367591857910156, 0.028533458709716797, 0.029699325561523438, 0.030865192413330078, 0.03203105926513672, 0.03319692611694336, 0.03436279296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 4.0, 10.0, 12.0, 16.0, 13.0, 18.0, 21.0, 38.0, 32.0, 46.0, 61.0, 81.0, 87.0, 100.0, 144.0, 269.0, 617.0, 61134.0, 983169.0, 1479.0, 375.0, 195.0, 142.0, 79.0, 64.0, 69.0, 60.0, 32.0, 32.0, 33.0, 23.0, 18.0, 14.0, 15.0, 8.0, 4.0, 1.0, 3.0, 7.0, 4.0, 4.0, 0.0, 0.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6689834594726562, -0.6475372314453125, -0.6260910034179688, -0.604644775390625, -0.5831985473632812, -0.5617523193359375, -0.5403060913085938, -0.51885986328125, -0.49741363525390625, -0.4759674072265625, -0.45452117919921875, -0.433074951171875, -0.41162872314453125, -0.3901824951171875, -0.36873626708984375, -0.3472900390625, -0.32584381103515625, -0.3043975830078125, -0.28295135498046875, -0.261505126953125, -0.24005889892578125, -0.2186126708984375, -0.19716644287109375, -0.17572021484375, -0.15427398681640625, -0.1328277587890625, -0.11138153076171875, -0.089935302734375, -0.06848907470703125, -0.0470428466796875, -0.02559661865234375, -0.004150390625, 0.01729583740234375, 0.0387420654296875, 0.06018829345703125, 0.081634521484375, 0.10308074951171875, 0.1245269775390625, 0.14597320556640625, 0.16741943359375, 0.18886566162109375, 0.2103118896484375, 0.23175811767578125, 0.253204345703125, 0.27465057373046875, 0.2960968017578125, 0.31754302978515625, 0.3389892578125, 0.36043548583984375, 0.3818817138671875, 0.40332794189453125, 0.424774169921875, 0.44622039794921875, 0.4676666259765625, 0.48911285400390625, 0.51055908203125, 0.5320053100585938, 0.5534515380859375, 0.5748977661132812, 0.596343994140625, 0.6177902221679688, 0.6392364501953125, 0.6606826782226562, 0.68212890625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 18.0, 748.0, 244.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1040395200252533, -0.06843385100364685, -0.03282817453145981, 0.002777501940727234, 0.03838317096233368, 0.07398883998394012, 0.10959452390670776, 0.1452001929283142, 0.18080586194992065, 0.2164115309715271, 0.25201719999313354, 0.28762286901474, 0.32322853803634644, 0.3588342070579529, 0.3944399058818817, 0.43004557490348816, 0.4656512439250946, 0.5012569427490234, 0.5368626117706299, 0.5724682807922363, 0.6080739498138428, 0.6436796188354492, 0.6792852878570557, 0.7148909568786621, 0.7504966259002686, 0.786102294921875, 0.8217079639434814, 0.8573136329650879, 0.8929193019866943, 0.9285249710083008, 0.9641306400299072, 0.9997363090515137, 1.0353420972824097, 1.0709477663040161, 1.1065534353256226, 1.142159104347229, 1.1777647733688354, 1.213370442390442, 1.2489761114120483, 1.2845817804336548, 1.3201874494552612, 1.3557931184768677, 1.3913987874984741, 1.4270044565200806, 1.462610125541687, 1.4982157945632935, 1.5338214635849, 1.5694271326065063, 1.6050329208374023, 1.6406385898590088, 1.6762442588806152, 1.7118499279022217, 1.7474555969238281, 1.7830612659454346, 1.818666934967041, 1.8542726039886475, 1.889878273010254, 1.9254839420318604, 1.9610896110534668, 1.9966952800750732, 2.0323009490966797, 2.067906618118286, 2.1035122871398926, 2.139117956161499, 2.1747236251831055]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 6.0, 7.0, 17.0, 16.0, 14.0, 17.0, 13.0, 13.0, 16.0, 28.0, 32.0, 32.0, 35.0, 39.0, 30.0, 45.0, 52.0, 48.0, 48.0, 51.0, 48.0, 48.0, 39.0, 35.0, 34.0, 29.0, 31.0, 27.0, 31.0, 20.0, 25.0, 13.0, 10.0, 10.0, 8.0, 3.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.13377106189727783, -0.1297144591808319, -0.12565787136554718, -0.12160126864910126, -0.11754467338323593, -0.1134880781173706, -0.10943147540092468, -0.10537488013505936, -0.10131828486919403, -0.0972616896033287, -0.09320509433746338, -0.08914849162101746, -0.08509189635515213, -0.0810353010892868, -0.07697869837284088, -0.07292210310697556, -0.06886550784111023, -0.0648089125752449, -0.06075231358408928, -0.056695714592933655, -0.05263911932706833, -0.048582524061203, -0.04452592507004738, -0.040469326078891754, -0.03641273081302643, -0.0323561355471611, -0.028299536556005478, -0.024242939427495003, -0.020186342298984528, -0.016129745170474052, -0.012073148041963577, -0.008016550913453102, -0.003959953784942627, 9.66433435678482e-05, 0.004153240472078323, 0.008209837600588799, 0.012266434729099274, 0.01632303185760975, 0.020379628986120224, 0.0244362261146307, 0.028492823243141174, 0.0325494185090065, 0.036606017500162125, 0.04066261649131775, 0.044719211757183075, 0.0487758070230484, 0.052832406014204025, 0.05688900500535965, 0.060945600271224976, 0.0650021955370903, 0.06905879080295563, 0.07311539351940155, 0.07717198878526688, 0.0812285840511322, 0.08528518676757812, 0.08934178203344345, 0.09339837729930878, 0.0974549725651741, 0.10151156783103943, 0.10556817054748535, 0.10962476581335068, 0.113681361079216, 0.11773796379566193, 0.12179455906152725, 0.12585115432739258]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 11.0, 10.0, 12.0, 12.0, 17.0, 21.0, 28.0, 32.0, 41.0, 42.0, 43.0, 30.0, 44.0, 40.0, 52.0, 54.0, 48.0, 36.0, 43.0, 40.0, 36.0, 33.0, 38.0, 36.0, 28.0, 21.0, 25.0, 22.0, 15.0, 13.0, 14.0, 9.0, 13.0, 6.0, 1.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.322265625, -2.24542236328125, -2.1685791015625, -2.09173583984375, -2.014892578125, -1.93804931640625, -1.8612060546875, -1.78436279296875, -1.70751953125, -1.63067626953125, -1.5538330078125, -1.47698974609375, -1.400146484375, -1.32330322265625, -1.2464599609375, -1.16961669921875, -1.0927734375, -1.01593017578125, -0.9390869140625, -0.86224365234375, -0.785400390625, -0.70855712890625, -0.6317138671875, -0.55487060546875, -0.47802734375, -0.40118408203125, -0.3243408203125, -0.24749755859375, -0.170654296875, -0.09381103515625, -0.0169677734375, 0.05987548828125, 0.13671875, 0.21356201171875, 0.2904052734375, 0.36724853515625, 0.444091796875, 0.52093505859375, 0.5977783203125, 0.67462158203125, 0.75146484375, 0.82830810546875, 0.9051513671875, 0.98199462890625, 1.058837890625, 1.13568115234375, 1.2125244140625, 1.28936767578125, 1.3662109375, 1.44305419921875, 1.5198974609375, 1.59674072265625, 1.673583984375, 1.75042724609375, 1.8272705078125, 1.90411376953125, 1.98095703125, 2.05780029296875, 2.1346435546875, 2.21148681640625, 2.288330078125, 2.36517333984375, 2.4420166015625, 2.51885986328125, 2.595703125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 14.0, 16.0, 24.0, 39.0, 51.0, 56.0, 94.0, 128.0, 152.0, 237.0, 311.0, 441.0, 668.0, 929.0, 1570.0, 2645.0, 4992.0, 10165.0, 21983.0, 51630.0, 130860.0, 296754.0, 297263.0, 131362.0, 51822.0, 21774.0, 9994.0, 5025.0, 2807.0, 1599.0, 937.0, 585.0, 436.0, 312.0, 240.0, 167.0, 122.0, 94.0, 65.0, 52.0, 36.0, 22.0, 11.0, 23.0, 8.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.734375, -5.56060791015625, -5.3868408203125, -5.21307373046875, -5.039306640625, -4.86553955078125, -4.6917724609375, -4.51800537109375, -4.34423828125, -4.17047119140625, -3.9967041015625, -3.82293701171875, -3.649169921875, -3.47540283203125, -3.3016357421875, -3.12786865234375, -2.9541015625, -2.78033447265625, -2.6065673828125, -2.43280029296875, -2.259033203125, -2.08526611328125, -1.9114990234375, -1.73773193359375, -1.56396484375, -1.39019775390625, -1.2164306640625, -1.04266357421875, -0.868896484375, -0.69512939453125, -0.5213623046875, -0.34759521484375, -0.173828125, -6.103515625e-05, 0.1737060546875, 0.34747314453125, 0.521240234375, 0.69500732421875, 0.8687744140625, 1.04254150390625, 1.21630859375, 1.39007568359375, 1.5638427734375, 1.73760986328125, 1.911376953125, 2.08514404296875, 2.2589111328125, 2.43267822265625, 2.6064453125, 2.78021240234375, 2.9539794921875, 3.12774658203125, 3.301513671875, 3.47528076171875, 3.6490478515625, 3.82281494140625, 3.99658203125, 4.17034912109375, 4.3441162109375, 4.51788330078125, 4.691650390625, 4.86541748046875, 5.0391845703125, 5.21295166015625, 5.38671875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 8.0, 13.0, 4.0, 2.0, 8.0, 11.0, 13.0, 20.0, 15.0, 30.0, 23.0, 39.0, 43.0, 41.0, 49.0, 65.0, 99.0, 184.0, 1337.0, 303.0, 210.0, 97.0, 69.0, 62.0, 36.0, 44.0, 24.0, 34.0, 32.0, 21.0, 23.0, 21.0, 17.0, 11.0, 12.0, 4.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.9447021484375, -7.670654296875, -7.3966064453125, -7.12255859375, -6.8485107421875, -6.574462890625, -6.3004150390625, -6.0263671875, -5.7523193359375, -5.478271484375, -5.2042236328125, -4.93017578125, -4.6561279296875, -4.382080078125, -4.1080322265625, -3.833984375, -3.5599365234375, -3.285888671875, -3.0118408203125, -2.73779296875, -2.4637451171875, -2.189697265625, -1.9156494140625, -1.6416015625, -1.3675537109375, -1.093505859375, -0.8194580078125, -0.54541015625, -0.2713623046875, 0.002685546875, 0.2767333984375, 0.55078125, 0.8248291015625, 1.098876953125, 1.3729248046875, 1.64697265625, 1.9210205078125, 2.195068359375, 2.4691162109375, 2.7431640625, 3.0172119140625, 3.291259765625, 3.5653076171875, 3.83935546875, 4.1134033203125, 4.387451171875, 4.6614990234375, 4.935546875, 5.2095947265625, 5.483642578125, 5.7576904296875, 6.03173828125, 6.3057861328125, 6.579833984375, 6.8538818359375, 7.1279296875, 7.4019775390625, 7.676025390625, 7.9500732421875, 8.22412109375, 8.4981689453125, 8.772216796875, 9.0462646484375, 9.3203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 1.0, 6.0, 7.0, 5.0, 18.0, 15.0, 18.0, 10.0, 30.0, 13.0, 31.0, 33.0, 32.0, 48.0, 69.0, 115.0, 324.0, 1291.0, 53627.0, 3056978.0, 31190.0, 1127.0, 265.0, 106.0, 72.0, 48.0, 44.0, 28.0, 23.0, 20.0, 15.0, 22.0, 6.0, 17.0, 5.0, 3.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.640625, -29.634521484375, -28.62841796875, -27.622314453125, -26.6162109375, -25.610107421875, -24.60400390625, -23.597900390625, -22.591796875, -21.585693359375, -20.57958984375, -19.573486328125, -18.5673828125, -17.561279296875, -16.55517578125, -15.549072265625, -14.54296875, -13.536865234375, -12.53076171875, -11.524658203125, -10.5185546875, -9.512451171875, -8.50634765625, -7.500244140625, -6.494140625, -5.488037109375, -4.48193359375, -3.475830078125, -2.4697265625, -1.463623046875, -0.45751953125, 0.548583984375, 1.5546875, 2.560791015625, 3.56689453125, 4.572998046875, 5.5791015625, 6.585205078125, 7.59130859375, 8.597412109375, 9.603515625, 10.609619140625, 11.61572265625, 12.621826171875, 13.6279296875, 14.634033203125, 15.64013671875, 16.646240234375, 17.65234375, 18.658447265625, 19.66455078125, 20.670654296875, 21.6767578125, 22.682861328125, 23.68896484375, 24.695068359375, 25.701171875, 26.707275390625, 27.71337890625, 28.719482421875, 29.7255859375, 30.731689453125, 31.73779296875, 32.743896484375, 33.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 406.0, 579.0, 20.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.13119506835938, -107.31159973144531, -103.49199676513672, -99.67240142822266, -95.85279846191406, -92.033203125, -88.21360778808594, -84.39401245117188, -80.57440948486328, -76.75481414794922, -72.93521118164062, -69.11561584472656, -65.2960205078125, -61.476417541503906, -57.656822204589844, -53.837223052978516, -50.01762390136719, -46.19802474975586, -42.37842559814453, -38.55883026123047, -34.73923110961914, -30.919631958007812, -27.100034713745117, -23.280437469482422, -19.460838317871094, -15.641240119934082, -11.82164192199707, -8.002043724060059, -4.182445526123047, -0.36284637451171875, 3.4567508697509766, 7.276348114013672, 11.095947265625, 14.915545463562012, 18.735143661499023, 22.55474090576172, 26.374340057373047, 30.193939208984375, 34.01353454589844, 37.833133697509766, 41.652732849121094, 45.47233200073242, 49.29193115234375, 53.11152648925781, 56.93112564086914, 60.75072479248047, 64.57032012939453, 68.38992309570312, 72.20951843261719, 76.02911376953125, 79.84871673583984, 83.6683120727539, 87.4879150390625, 91.30751037597656, 95.12710571289062, 98.94670104980469, 102.76630401611328, 106.58589935302734, 110.40550231933594, 114.22509765625, 118.04469299316406, 121.86429595947266, 125.68389129638672, 129.5034942626953, 133.32308959960938]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 5.0, 14.0, 4.0, 16.0, 6.0, 8.0, 19.0, 19.0, 17.0, 15.0, 41.0, 27.0, 33.0, 40.0, 49.0, 40.0, 43.0, 56.0, 44.0, 41.0, 33.0, 53.0, 27.0, 38.0, 36.0, 37.0, 33.0, 36.0, 30.0, 22.0, 15.0, 19.0, 18.0, 10.0, 12.0, 9.0, 1.0, 6.0, 9.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-25.39031982421875, -24.521846771240234, -23.65337371826172, -22.784900665283203, -21.916427612304688, -21.047954559326172, -20.179481506347656, -19.31100845336914, -18.442535400390625, -17.57406234741211, -16.705589294433594, -15.837116241455078, -14.968643188476562, -14.100170135498047, -13.231697082519531, -12.363224029541016, -11.494750022888184, -10.626276969909668, -9.757803916931152, -8.889330863952637, -8.020857810974121, -7.152384281158447, -6.283911228179932, -5.415438175201416, -4.5469651222229, -3.6784920692443848, -2.810019016265869, -1.9415457248687744, -1.0730726718902588, -0.20459938049316406, 0.6638736724853516, 1.5323467254638672, 2.400819778442383, 3.2692928314208984, 4.137765884399414, 5.00623893737793, 5.874711990356445, 6.743185520172119, 7.611658573150635, 8.480131149291992, 9.348604202270508, 10.217077255249023, 11.085550308227539, 11.954023361206055, 12.82249641418457, 13.690969467163086, 14.559442520141602, 15.427915573120117, 16.296390533447266, 17.16486358642578, 18.033336639404297, 18.901809692382812, 19.770282745361328, 20.638755798339844, 21.50722885131836, 22.375701904296875, 23.24417495727539, 24.112648010253906, 24.981121063232422, 25.849594116210938, 26.718067169189453, 27.58654022216797, 28.455013275146484, 29.323486328125, 30.191959381103516]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 9.0, 4.0, 6.0, 10.0, 17.0, 10.0, 32.0, 23.0, 24.0, 36.0, 26.0, 38.0, 32.0, 47.0, 50.0, 55.0, 50.0, 49.0, 44.0, 50.0, 42.0, 38.0, 37.0, 43.0, 29.0, 29.0, 21.0, 20.0, 15.0, 22.0, 11.0, 18.0, 12.0, 14.0, 11.0, 3.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.939453125, -2.855377197265625, -2.77130126953125, -2.687225341796875, -2.6031494140625, -2.519073486328125, -2.43499755859375, -2.350921630859375, -2.266845703125, -2.182769775390625, -2.09869384765625, -2.014617919921875, -1.9305419921875, -1.846466064453125, -1.76239013671875, -1.678314208984375, -1.59423828125, -1.510162353515625, -1.42608642578125, -1.342010498046875, -1.2579345703125, -1.173858642578125, -1.08978271484375, -1.005706787109375, -0.921630859375, -0.837554931640625, -0.75347900390625, -0.669403076171875, -0.5853271484375, -0.501251220703125, -0.41717529296875, -0.333099365234375, -0.2490234375, -0.164947509765625, -0.08087158203125, 0.003204345703125, 0.0872802734375, 0.171356201171875, 0.25543212890625, 0.339508056640625, 0.423583984375, 0.507659912109375, 0.59173583984375, 0.675811767578125, 0.7598876953125, 0.843963623046875, 0.92803955078125, 1.012115478515625, 1.09619140625, 1.180267333984375, 1.26434326171875, 1.348419189453125, 1.4324951171875, 1.516571044921875, 1.60064697265625, 1.684722900390625, 1.768798828125, 1.852874755859375, 1.93695068359375, 2.021026611328125, 2.1051025390625, 2.189178466796875, 2.27325439453125, 2.357330322265625, 2.44140625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 8.0, 9.0, 13.0, 20.0, 24.0, 41.0, 45.0, 62.0, 104.0, 178.0, 263.0, 456.0, 986.0, 2072.0, 6504.0, 29583.0, 243375.0, 2894721.0, 922179.0, 75639.0, 12283.0, 3081.0, 1180.0, 551.0, 306.0, 164.0, 97.0, 85.0, 64.0, 41.0, 30.0, 33.0, 22.0, 15.0, 12.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.296875, -12.8907470703125, -12.484619140625, -12.0784912109375, -11.67236328125, -11.2662353515625, -10.860107421875, -10.4539794921875, -10.0478515625, -9.6417236328125, -9.235595703125, -8.8294677734375, -8.42333984375, -8.0172119140625, -7.611083984375, -7.2049560546875, -6.798828125, -6.3927001953125, -5.986572265625, -5.5804443359375, -5.17431640625, -4.7681884765625, -4.362060546875, -3.9559326171875, -3.5498046875, -3.1436767578125, -2.737548828125, -2.3314208984375, -1.92529296875, -1.5191650390625, -1.113037109375, -0.7069091796875, -0.30078125, 0.1053466796875, 0.511474609375, 0.9176025390625, 1.32373046875, 1.7298583984375, 2.135986328125, 2.5421142578125, 2.9482421875, 3.3543701171875, 3.760498046875, 4.1666259765625, 4.57275390625, 4.9788818359375, 5.385009765625, 5.7911376953125, 6.197265625, 6.6033935546875, 7.009521484375, 7.4156494140625, 7.82177734375, 8.2279052734375, 8.634033203125, 9.0401611328125, 9.4462890625, 9.8524169921875, 10.258544921875, 10.6646728515625, 11.07080078125, 11.4769287109375, 11.883056640625, 12.2891845703125, 12.6953125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 22.0, 38.0, 50.0, 125.0, 225.0, 400.0, 637.0, 922.0, 710.0, 430.0, 220.0, 118.0, 82.0, 37.0, 18.0, 19.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.1890869140625, -9.667236328125, -9.1453857421875, -8.62353515625, -8.1016845703125, -7.579833984375, -7.0579833984375, -6.5361328125, -6.0142822265625, -5.492431640625, -4.9705810546875, -4.44873046875, -3.9268798828125, -3.405029296875, -2.8831787109375, -2.361328125, -1.8394775390625, -1.317626953125, -0.7957763671875, -0.27392578125, 0.2479248046875, 0.769775390625, 1.2916259765625, 1.8134765625, 2.3353271484375, 2.857177734375, 3.3790283203125, 3.90087890625, 4.4227294921875, 4.944580078125, 5.4664306640625, 5.98828125, 6.5101318359375, 7.031982421875, 7.5538330078125, 8.07568359375, 8.5975341796875, 9.119384765625, 9.6412353515625, 10.1630859375, 10.6849365234375, 11.206787109375, 11.7286376953125, 12.25048828125, 12.7723388671875, 13.294189453125, 13.8160400390625, 14.337890625, 14.8597412109375, 15.381591796875, 15.9034423828125, 16.42529296875, 16.9471435546875, 17.468994140625, 17.9908447265625, 18.5126953125, 19.0345458984375, 19.556396484375, 20.0782470703125, 20.60009765625, 21.1219482421875, 21.643798828125, 22.1656494140625, 22.6875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 11.0, 20.0, 35.0, 53.0, 123.0, 267.0, 653.0, 2213.0, 17942.0, 499240.0, 3461081.0, 200686.0, 9408.0, 1616.0, 493.0, 216.0, 104.0, 59.0, 25.0, 21.0, 7.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.734375, -23.796630859375, -22.85888671875, -21.921142578125, -20.9833984375, -20.045654296875, -19.10791015625, -18.170166015625, -17.232421875, -16.294677734375, -15.35693359375, -14.419189453125, -13.4814453125, -12.543701171875, -11.60595703125, -10.668212890625, -9.73046875, -8.792724609375, -7.85498046875, -6.917236328125, -5.9794921875, -5.041748046875, -4.10400390625, -3.166259765625, -2.228515625, -1.290771484375, -0.35302734375, 0.584716796875, 1.5224609375, 2.460205078125, 3.39794921875, 4.335693359375, 5.2734375, 6.211181640625, 7.14892578125, 8.086669921875, 9.0244140625, 9.962158203125, 10.89990234375, 11.837646484375, 12.775390625, 13.713134765625, 14.65087890625, 15.588623046875, 16.5263671875, 17.464111328125, 18.40185546875, 19.339599609375, 20.27734375, 21.215087890625, 22.15283203125, 23.090576171875, 24.0283203125, 24.966064453125, 25.90380859375, 26.841552734375, 27.779296875, 28.717041015625, 29.65478515625, 30.592529296875, 31.5302734375, 32.468017578125, 33.40576171875, 34.343505859375, 35.28125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 12.0, 34.0, 65.0, 106.0, 153.0, 148.0, 177.0, 131.0, 78.0, 57.0, 21.0, 11.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.57192611694336, -59.79988098144531, -58.027835845947266, -56.25579071044922, -54.48374557495117, -52.711700439453125, -50.93965530395508, -49.16761016845703, -47.395565032958984, -45.62351989746094, -43.85147476196289, -42.079429626464844, -40.3073844909668, -38.53533935546875, -36.7632942199707, -34.991249084472656, -33.219207763671875, -31.447162628173828, -29.67511749267578, -27.903072357177734, -26.131027221679688, -24.35898208618164, -22.586936950683594, -20.814891815185547, -19.0428466796875, -17.270801544189453, -15.498756408691406, -13.72671127319336, -11.954666137695312, -10.182621955871582, -8.410576820373535, -6.638531684875488, -4.866485595703125, -3.094440460205078, -1.3223955631256104, 0.4496493339538574, 2.2216944694519043, 3.993739128112793, 5.76578426361084, 7.537829399108887, 9.309874534606934, 11.08191967010498, 12.853964805603027, 14.626008987426758, 16.398054122924805, 18.17009925842285, 19.9421443939209, 21.714189529418945, 23.486234664916992, 25.25827980041504, 27.030324935913086, 28.802370071411133, 30.57441520690918, 32.346458435058594, 34.11850357055664, 35.89054870605469, 37.662593841552734, 39.43463897705078, 41.20668411254883, 42.978729248046875, 44.75077438354492, 46.52281951904297, 48.294864654541016, 50.06690979003906, 51.83895492553711]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 10.0, 4.0, 11.0, 12.0, 15.0, 13.0, 19.0, 21.0, 22.0, 21.0, 22.0, 21.0, 31.0, 24.0, 24.0, 27.0, 41.0, 42.0, 45.0, 40.0, 33.0, 38.0, 30.0, 32.0, 31.0, 31.0, 32.0, 29.0, 40.0, 29.0, 20.0, 28.0, 29.0, 15.0, 19.0, 12.0, 18.0, 15.0, 8.0, 8.0, 5.0, 10.0, 1.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0], "bins": [-26.838348388671875, -25.9903564453125, -25.142364501953125, -24.29437255859375, -23.446380615234375, -22.598388671875, -21.750394821166992, -20.902402877807617, -20.054410934448242, -19.206418991088867, -18.358427047729492, -17.510435104370117, -16.66244125366211, -15.81445026397705, -14.96645736694336, -14.118465423583984, -13.27047348022461, -12.422481536865234, -11.57448959350586, -10.726496696472168, -9.878504753112793, -9.030512809753418, -8.182519912719727, -7.334527969360352, -6.486536026000977, -5.638544082641602, -4.790551662445068, -3.9425594806671143, -3.09456729888916, -2.246575355529785, -1.398582935333252, -0.5505905151367188, 0.29740333557128906, 1.1453955173492432, 1.9933876991271973, 2.8413798809051514, 3.6893720626831055, 4.5373640060424805, 5.385356426239014, 6.233348846435547, 7.081340789794922, 7.929332733154297, 8.777324676513672, 9.625317573547363, 10.473309516906738, 11.321301460266113, 12.169294357299805, 13.01728630065918, 13.865278244018555, 14.71327018737793, 15.561262130737305, 16.40925407409668, 17.257247924804688, 18.105239868164062, 18.953231811523438, 19.801223754882812, 20.649215698242188, 21.497207641601562, 22.345199584960938, 23.193191528320312, 24.041183471679688, 24.889175415039062, 25.73716926574707, 26.585161209106445, 27.43315315246582]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 12.0, 8.0, 17.0, 19.0, 23.0, 22.0, 37.0, 32.0, 34.0, 39.0, 43.0, 45.0, 45.0, 59.0, 48.0, 60.0, 39.0, 63.0, 48.0, 30.0, 38.0, 37.0, 31.0, 16.0, 25.0, 18.0, 18.0, 14.0, 16.0, 10.0, 14.0, 6.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.08203125, -2.9913330078125, -2.900634765625, -2.8099365234375, -2.71923828125, -2.6285400390625, -2.537841796875, -2.4471435546875, -2.3564453125, -2.2657470703125, -2.175048828125, -2.0843505859375, -1.99365234375, -1.9029541015625, -1.812255859375, -1.7215576171875, -1.630859375, -1.5401611328125, -1.449462890625, -1.3587646484375, -1.26806640625, -1.1773681640625, -1.086669921875, -0.9959716796875, -0.9052734375, -0.8145751953125, -0.723876953125, -0.6331787109375, -0.54248046875, -0.4517822265625, -0.361083984375, -0.2703857421875, -0.1796875, -0.0889892578125, 0.001708984375, 0.0924072265625, 0.18310546875, 0.2738037109375, 0.364501953125, 0.4552001953125, 0.5458984375, 0.6365966796875, 0.727294921875, 0.8179931640625, 0.90869140625, 0.9993896484375, 1.090087890625, 1.1807861328125, 1.271484375, 1.3621826171875, 1.452880859375, 1.5435791015625, 1.63427734375, 1.7249755859375, 1.815673828125, 1.9063720703125, 1.9970703125, 2.0877685546875, 2.178466796875, 2.2691650390625, 2.35986328125, 2.4505615234375, 2.541259765625, 2.6319580078125, 2.72265625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 11.0, 13.0, 13.0, 40.0, 58.0, 90.0, 127.0, 231.0, 350.0, 561.0, 921.0, 1626.0, 2754.0, 4618.0, 7834.0, 13221.0, 22373.0, 36527.0, 57910.0, 86938.0, 120520.0, 149206.0, 154040.0, 127332.0, 94758.0, 63758.0, 41041.0, 24976.0, 14945.0, 8874.0, 5212.0, 3038.0, 1816.0, 1147.0, 657.0, 356.0, 268.0, 152.0, 101.0, 60.0, 25.0, 22.0, 13.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5830078125, -0.56591796875, -0.548828125, -0.53173828125, -0.5146484375, -0.49755859375, -0.48046875, -0.46337890625, -0.4462890625, -0.42919921875, -0.412109375, -0.39501953125, -0.3779296875, -0.36083984375, -0.34375, -0.32666015625, -0.3095703125, -0.29248046875, -0.275390625, -0.25830078125, -0.2412109375, -0.22412109375, -0.20703125, -0.18994140625, -0.1728515625, -0.15576171875, -0.138671875, -0.12158203125, -0.1044921875, -0.08740234375, -0.0703125, -0.05322265625, -0.0361328125, -0.01904296875, -0.001953125, 0.01513671875, 0.0322265625, 0.04931640625, 0.06640625, 0.08349609375, 0.1005859375, 0.11767578125, 0.134765625, 0.15185546875, 0.1689453125, 0.18603515625, 0.203125, 0.22021484375, 0.2373046875, 0.25439453125, 0.271484375, 0.28857421875, 0.3056640625, 0.32275390625, 0.33984375, 0.35693359375, 0.3740234375, 0.39111328125, 0.408203125, 0.42529296875, 0.4423828125, 0.45947265625, 0.4765625, 0.49365234375, 0.5107421875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 11.0, 10.0, 6.0, 18.0, 19.0, 14.0, 22.0, 24.0, 23.0, 32.0, 31.0, 35.0, 40.0, 53.0, 47.0, 42.0, 50.0, 1078.0, 42.0, 37.0, 54.0, 29.0, 43.0, 50.0, 32.0, 32.0, 24.0, 16.0, 22.0, 19.0, 17.0, 9.0, 9.0, 6.0, 11.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.546142578125, -2.47314453125, -2.400146484375, -2.3271484375, -2.254150390625, -2.18115234375, -2.108154296875, -2.03515625, -1.962158203125, -1.88916015625, -1.816162109375, -1.7431640625, -1.670166015625, -1.59716796875, -1.524169921875, -1.451171875, -1.378173828125, -1.30517578125, -1.232177734375, -1.1591796875, -1.086181640625, -1.01318359375, -0.940185546875, -0.8671875, -0.794189453125, -0.72119140625, -0.648193359375, -0.5751953125, -0.502197265625, -0.42919921875, -0.356201171875, -0.283203125, -0.210205078125, -0.13720703125, -0.064208984375, 0.0087890625, 0.081787109375, 0.15478515625, 0.227783203125, 0.30078125, 0.373779296875, 0.44677734375, 0.519775390625, 0.5927734375, 0.665771484375, 0.73876953125, 0.811767578125, 0.884765625, 0.957763671875, 1.03076171875, 1.103759765625, 1.1767578125, 1.249755859375, 1.32275390625, 1.395751953125, 1.46875, 1.541748046875, 1.61474609375, 1.687744140625, 1.7607421875, 1.833740234375, 1.90673828125, 1.979736328125, 2.052734375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 9.0, 10.0, 15.0, 20.0, 43.0, 45.0, 61.0, 93.0, 169.0, 266.0, 500.0, 832.0, 1686.0, 2966.0, 5802.0, 10955.0, 21335.0, 43526.0, 1878422.0, 69545.0, 29522.0, 14866.0, 7596.0, 3996.0, 2185.0, 1091.0, 624.0, 359.0, 198.0, 127.0, 79.0, 51.0, 33.0, 24.0, 16.0, 12.0, 8.0, 3.0, 8.0, 6.0, 3.0, 2.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.16796875, -1.1333465576171875, -1.098724365234375, -1.0641021728515625, -1.02947998046875, -0.9948577880859375, -0.960235595703125, -0.9256134033203125, -0.8909912109375, -0.8563690185546875, -0.821746826171875, -0.7871246337890625, -0.75250244140625, -0.7178802490234375, -0.683258056640625, -0.6486358642578125, -0.614013671875, -0.5793914794921875, -0.544769287109375, -0.5101470947265625, -0.47552490234375, -0.4409027099609375, -0.406280517578125, -0.3716583251953125, -0.3370361328125, -0.3024139404296875, -0.267791748046875, -0.2331695556640625, -0.19854736328125, -0.1639251708984375, -0.129302978515625, -0.0946807861328125, -0.06005859375, -0.0254364013671875, 0.009185791015625, 0.0438079833984375, 0.07843017578125, 0.1130523681640625, 0.147674560546875, 0.1822967529296875, 0.2169189453125, 0.2515411376953125, 0.286163330078125, 0.3207855224609375, 0.35540771484375, 0.3900299072265625, 0.424652099609375, 0.4592742919921875, 0.493896484375, 0.5285186767578125, 0.563140869140625, 0.5977630615234375, 0.63238525390625, 0.6670074462890625, 0.701629638671875, 0.7362518310546875, 0.7708740234375, 0.8054962158203125, 0.840118408203125, 0.8747406005859375, 0.90936279296875, 0.9439849853515625, 0.978607177734375, 1.0132293701171875, 1.0478515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 15.0, 27.0, 28.0, 66.0, 102.0, 134.0, 172.0, 134.0, 95.0, 73.0, 42.0, 33.0, 16.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056182861328125, -0.054280757904052734, -0.05237865447998047, -0.0504765510559082, -0.04857444763183594, -0.04667234420776367, -0.044770240783691406, -0.04286813735961914, -0.040966033935546875, -0.03906393051147461, -0.037161827087402344, -0.03525972366333008, -0.03335762023925781, -0.03145551681518555, -0.02955341339111328, -0.027651309967041016, -0.02574920654296875, -0.023847103118896484, -0.02194499969482422, -0.020042896270751953, -0.018140792846679688, -0.016238689422607422, -0.014336585998535156, -0.01243448257446289, -0.010532379150390625, -0.00863027572631836, -0.006728172302246094, -0.004826068878173828, -0.0029239654541015625, -0.0010218620300292969, 0.0008802413940429688, 0.0027823448181152344, 0.0046844482421875, 0.006586551666259766, 0.008488655090332031, 0.010390758514404297, 0.012292861938476562, 0.014194965362548828, 0.016097068786621094, 0.01799917221069336, 0.019901275634765625, 0.02180337905883789, 0.023705482482910156, 0.025607585906982422, 0.027509689331054688, 0.029411792755126953, 0.03131389617919922, 0.033215999603271484, 0.03511810302734375, 0.037020206451416016, 0.03892230987548828, 0.04082441329956055, 0.04272651672363281, 0.04462862014770508, 0.046530723571777344, 0.04843282699584961, 0.050334930419921875, 0.05223703384399414, 0.054139137268066406, 0.05604124069213867, 0.05794334411621094, 0.0598454475402832, 0.06174755096435547, 0.06364965438842773, 0.0655517578125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 14.0, 12.0, 17.0, 22.0, 22.0, 27.0, 39.0, 98.0, 262.0, 996.0, 4693.0, 84993.0, 947903.0, 7348.0, 1379.0, 364.0, 121.0, 67.0, 30.0, 22.0, 15.0, 12.0, 13.0, 16.0, 11.0, 6.0, 7.0, 6.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2509765625, -1.209442138671875, -1.16790771484375, -1.126373291015625, -1.0848388671875, -1.043304443359375, -1.00177001953125, -0.960235595703125, -0.918701171875, -0.877166748046875, -0.83563232421875, -0.794097900390625, -0.7525634765625, -0.711029052734375, -0.66949462890625, -0.627960205078125, -0.58642578125, -0.544891357421875, -0.50335693359375, -0.461822509765625, -0.4202880859375, -0.378753662109375, -0.33721923828125, -0.295684814453125, -0.254150390625, -0.212615966796875, -0.17108154296875, -0.129547119140625, -0.0880126953125, -0.046478271484375, -0.00494384765625, 0.036590576171875, 0.078125, 0.119659423828125, 0.16119384765625, 0.202728271484375, 0.2442626953125, 0.285797119140625, 0.32733154296875, 0.368865966796875, 0.410400390625, 0.451934814453125, 0.49346923828125, 0.535003662109375, 0.5765380859375, 0.618072509765625, 0.65960693359375, 0.701141357421875, 0.74267578125, 0.784210205078125, 0.82574462890625, 0.867279052734375, 0.9088134765625, 0.950347900390625, 0.99188232421875, 1.033416748046875, 1.074951171875, 1.116485595703125, 1.15802001953125, 1.199554443359375, 1.2410888671875, 1.282623291015625, 1.32415771484375, 1.365692138671875, 1.4072265625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 11.0, 18.0, 22.0, 35.0, 64.0, 107.0, 229.0, 298.0, 114.0, 48.0, 24.0, 17.0, 3.0, 3.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.40678444504737854, -0.3973753750324249, -0.3879663050174713, -0.3785572350025177, -0.3691481649875641, -0.3597390651702881, -0.3503299951553345, -0.34092092514038086, -0.33151185512542725, -0.32210278511047363, -0.31269371509552, -0.3032846450805664, -0.2938755750656128, -0.2844665050506592, -0.27505743503570557, -0.26564833521842957, -0.25623929500579834, -0.24683022499084473, -0.2374211549758911, -0.2280120849609375, -0.2186030000448227, -0.20919393002986908, -0.19978486001491547, -0.19037577509880066, -0.18096670508384705, -0.17155763506889343, -0.16214856505393982, -0.1527394950389862, -0.1433304101228714, -0.13392134010791779, -0.12451227009296417, -0.11510319262742996, -0.10569410026073456, -0.09628503024578094, -0.08687595278024673, -0.07746688276529312, -0.06805780529975891, -0.0586487352848053, -0.049239665269851685, -0.039830587804317474, -0.03042151778936386, -0.02101244404911995, -0.011603372171521187, -0.0021943002939224243, 0.007214773446321487, 0.0166238471865654, 0.026032917201519012, 0.03544199466705322, 0.044851064682006836, 0.05426013842225075, 0.06366921216249466, 0.07307828217744827, 0.08248735964298248, 0.0918964296579361, 0.10130549967288971, 0.11071457713842392, 0.12012364715337753, 0.12953272461891174, 0.13894179463386536, 0.14835086464881897, 0.15775993466377258, 0.1671690046787262, 0.1765780746936798, 0.18598715960979462, 0.19539622962474823]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 1.0, 4.0, 4.0, 10.0, 6.0, 6.0, 14.0, 14.0, 15.0, 15.0, 24.0, 24.0, 34.0, 26.0, 37.0, 33.0, 40.0, 35.0, 41.0, 40.0, 34.0, 37.0, 36.0, 37.0, 41.0, 41.0, 40.0, 36.0, 41.0, 25.0, 26.0, 27.0, 26.0, 29.0, 17.0, 18.0, 12.0, 14.0, 10.0, 4.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.05008435249328613, -0.04862523078918457, -0.04716610908508301, -0.045706987380981445, -0.04424786567687988, -0.04278874397277832, -0.04132962226867676, -0.039870500564575195, -0.03841137886047363, -0.03695225715637207, -0.03549313545227051, -0.034034013748168945, -0.03257489204406738, -0.03111577033996582, -0.029656648635864258, -0.028197526931762695, -0.026738405227661133, -0.02527928352355957, -0.023820161819458008, -0.022361040115356445, -0.020901918411254883, -0.01944279670715332, -0.017983675003051758, -0.016524553298950195, -0.015065431594848633, -0.01360630989074707, -0.012147188186645508, -0.010688066482543945, -0.009228944778442383, -0.00776982307434082, -0.006310701370239258, -0.004851579666137695, -0.003392457962036133, -0.0019333362579345703, -0.0004742145538330078, 0.0009849071502685547, 0.002444028854370117, 0.0039031505584716797, 0.005362272262573242, 0.006821393966674805, 0.008280515670776367, 0.00973963737487793, 0.011198759078979492, 0.012657880783081055, 0.014117002487182617, 0.01557612419128418, 0.017035245895385742, 0.018494367599487305, 0.019953489303588867, 0.02141261100769043, 0.022871732711791992, 0.024330854415893555, 0.025789976119995117, 0.02724909782409668, 0.028708219528198242, 0.030167341232299805, 0.03162646293640137, 0.03308558464050293, 0.03454470634460449, 0.036003828048706055, 0.03746294975280762, 0.03892207145690918, 0.04038119316101074, 0.041840314865112305, 0.04329943656921387]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 3.0, 6.0, 4.0, 10.0, 10.0, 11.0, 22.0, 22.0, 26.0, 34.0, 41.0, 41.0, 42.0, 37.0, 54.0, 39.0, 46.0, 55.0, 54.0, 44.0, 41.0, 48.0, 36.0, 48.0, 42.0, 25.0, 20.0, 26.0, 29.0, 17.0, 10.0, 10.0, 8.0, 11.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.29296875, -3.200927734375, -3.10888671875, -3.016845703125, -2.9248046875, -2.832763671875, -2.74072265625, -2.648681640625, -2.556640625, -2.464599609375, -2.37255859375, -2.280517578125, -2.1884765625, -2.096435546875, -2.00439453125, -1.912353515625, -1.8203125, -1.728271484375, -1.63623046875, -1.544189453125, -1.4521484375, -1.360107421875, -1.26806640625, -1.176025390625, -1.083984375, -0.991943359375, -0.89990234375, -0.807861328125, -0.7158203125, -0.623779296875, -0.53173828125, -0.439697265625, -0.34765625, -0.255615234375, -0.16357421875, -0.071533203125, 0.0205078125, 0.112548828125, 0.20458984375, 0.296630859375, 0.388671875, 0.480712890625, 0.57275390625, 0.664794921875, 0.7568359375, 0.848876953125, 0.94091796875, 1.032958984375, 1.125, 1.217041015625, 1.30908203125, 1.401123046875, 1.4931640625, 1.585205078125, 1.67724609375, 1.769287109375, 1.861328125, 1.953369140625, 2.04541015625, 2.137451171875, 2.2294921875, 2.321533203125, 2.41357421875, 2.505615234375, 2.59765625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 9.0, 10.0, 13.0, 37.0, 42.0, 64.0, 114.0, 230.0, 351.0, 802.0, 1565.0, 3603.0, 8698.0, 23090.0, 62882.0, 164289.0, 316686.0, 271600.0, 120620.0, 45180.0, 16793.0, 6511.0, 2763.0, 1213.0, 587.0, 340.0, 185.0, 88.0, 55.0, 54.0, 25.0, 20.0, 11.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-4.33984375, -4.23089599609375, -4.1219482421875, -4.01300048828125, -3.904052734375, -3.79510498046875, -3.6861572265625, -3.57720947265625, -3.46826171875, -3.35931396484375, -3.2503662109375, -3.14141845703125, -3.032470703125, -2.92352294921875, -2.8145751953125, -2.70562744140625, -2.5966796875, -2.48773193359375, -2.3787841796875, -2.26983642578125, -2.160888671875, -2.05194091796875, -1.9429931640625, -1.83404541015625, -1.72509765625, -1.61614990234375, -1.5072021484375, -1.39825439453125, -1.289306640625, -1.18035888671875, -1.0714111328125, -0.96246337890625, -0.853515625, -0.74456787109375, -0.6356201171875, -0.52667236328125, -0.417724609375, -0.30877685546875, -0.1998291015625, -0.09088134765625, 0.01806640625, 0.12701416015625, 0.2359619140625, 0.34490966796875, 0.453857421875, 0.56280517578125, 0.6717529296875, 0.78070068359375, 0.8896484375, 0.99859619140625, 1.1075439453125, 1.21649169921875, 1.325439453125, 1.43438720703125, 1.5433349609375, 1.65228271484375, 1.76123046875, 1.87017822265625, 1.9791259765625, 2.08807373046875, 2.197021484375, 2.30596923828125, 2.4149169921875, 2.52386474609375, 2.6328125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 20.0, 11.0, 22.0, 22.0, 26.0, 27.0, 34.0, 36.0, 42.0, 60.0, 79.0, 136.0, 252.0, 1409.0, 251.0, 140.0, 81.0, 65.0, 44.0, 37.0, 30.0, 26.0, 42.0, 20.0, 24.0, 18.0, 19.0, 7.0, 5.0, 15.0, 6.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.8359375, -11.5023193359375, -11.168701171875, -10.8350830078125, -10.50146484375, -10.1678466796875, -9.834228515625, -9.5006103515625, -9.1669921875, -8.8333740234375, -8.499755859375, -8.1661376953125, -7.83251953125, -7.4989013671875, -7.165283203125, -6.8316650390625, -6.498046875, -6.1644287109375, -5.830810546875, -5.4971923828125, -5.16357421875, -4.8299560546875, -4.496337890625, -4.1627197265625, -3.8291015625, -3.4954833984375, -3.161865234375, -2.8282470703125, -2.49462890625, -2.1610107421875, -1.827392578125, -1.4937744140625, -1.16015625, -0.8265380859375, -0.492919921875, -0.1593017578125, 0.17431640625, 0.5079345703125, 0.841552734375, 1.1751708984375, 1.5087890625, 1.8424072265625, 2.176025390625, 2.5096435546875, 2.84326171875, 3.1768798828125, 3.510498046875, 3.8441162109375, 4.177734375, 4.5113525390625, 4.844970703125, 5.1785888671875, 5.51220703125, 5.8458251953125, 6.179443359375, 6.5130615234375, 6.8466796875, 7.1802978515625, 7.513916015625, 7.8475341796875, 8.18115234375, 8.5147705078125, 8.848388671875, 9.1820068359375, 9.515625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 5.0, 10.0, 12.0, 18.0, 22.0, 22.0, 20.0, 34.0, 41.0, 48.0, 74.0, 153.0, 316.0, 1059.0, 6620.0, 408252.0, 2696746.0, 29140.0, 2065.0, 488.0, 204.0, 94.0, 64.0, 41.0, 26.0, 20.0, 23.0, 18.0, 16.0, 12.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -17.927490234375, -17.29248046875, -16.657470703125, -16.0224609375, -15.387451171875, -14.75244140625, -14.117431640625, -13.482421875, -12.847412109375, -12.21240234375, -11.577392578125, -10.9423828125, -10.307373046875, -9.67236328125, -9.037353515625, -8.40234375, -7.767333984375, -7.13232421875, -6.497314453125, -5.8623046875, -5.227294921875, -4.59228515625, -3.957275390625, -3.322265625, -2.687255859375, -2.05224609375, -1.417236328125, -0.7822265625, -0.147216796875, 0.48779296875, 1.122802734375, 1.7578125, 2.392822265625, 3.02783203125, 3.662841796875, 4.2978515625, 4.932861328125, 5.56787109375, 6.202880859375, 6.837890625, 7.472900390625, 8.10791015625, 8.742919921875, 9.3779296875, 10.012939453125, 10.64794921875, 11.282958984375, 11.91796875, 12.552978515625, 13.18798828125, 13.822998046875, 14.4580078125, 15.093017578125, 15.72802734375, 16.363037109375, 16.998046875, 17.633056640625, 18.26806640625, 18.903076171875, 19.5380859375, 20.173095703125, 20.80810546875, 21.443115234375, 22.078125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [21.0, 264.0, 521.0, 195.0, 16.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.749096870422363, -3.421846628189087, -1.0945963859558105, 1.2326536178588867, 3.559904098510742, 5.887154579162598, 8.214404106140137, 10.541655540466309, 12.868905067443848, 15.196155548095703, 17.523405075073242, 19.85065460205078, 22.177906036376953, 24.505157470703125, 26.83240509033203, 29.159656524658203, 31.486907958984375, 33.81415939331055, 36.14140701293945, 38.468658447265625, 40.7959098815918, 43.12316131591797, 45.450408935546875, 47.77766036987305, 50.10490798950195, 52.432159423828125, 54.75940704345703, 57.0866584777832, 59.413909912109375, 61.74115753173828, 64.06840515136719, 66.39566040039062, 68.72290802001953, 71.05015563964844, 73.37741088867188, 75.70465850830078, 78.03190612792969, 80.35916137695312, 82.68640899658203, 85.01365661621094, 87.34091186523438, 89.66815948486328, 91.99541473388672, 94.32266235351562, 96.64990997314453, 98.97716522216797, 101.30441284179688, 103.63166809082031, 105.95890808105469, 108.2861557006836, 110.61341094970703, 112.94065856933594, 115.26790618896484, 117.59516143798828, 119.92240905761719, 122.24966430664062, 124.57691192626953, 126.90415954589844, 129.23141479492188, 131.55865478515625, 133.8859100341797, 136.21316528320312, 138.5404052734375, 140.86766052246094, 143.19491577148438]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 7.0, 3.0, 12.0, 16.0, 16.0, 21.0, 17.0, 18.0, 25.0, 27.0, 30.0, 27.0, 30.0, 27.0, 25.0, 32.0, 40.0, 44.0, 50.0, 26.0, 53.0, 37.0, 36.0, 42.0, 37.0, 30.0, 30.0, 21.0, 28.0, 17.0, 28.0, 22.0, 15.0, 13.0, 17.0, 11.0, 7.0, 15.0, 9.0, 5.0, 5.0, 10.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.189056396484375, -27.31736946105957, -26.445682525634766, -25.573993682861328, -24.702306747436523, -23.83061981201172, -22.958932876586914, -22.08724594116211, -21.215557098388672, -20.343870162963867, -19.472183227539062, -18.600494384765625, -17.72880744934082, -16.857120513916016, -15.985433578491211, -15.113746643066406, -14.242059707641602, -13.370372772216797, -12.498684883117676, -11.626997947692871, -10.75531005859375, -9.883623123168945, -9.01193618774414, -8.140249252319336, -7.268561363220215, -6.396873950958252, -5.525186538696289, -4.653499603271484, -3.7818121910095215, -2.9101247787475586, -2.038437843322754, -1.166750431060791, -0.2950630187988281, 0.5766242742538452, 1.4483115673065186, 2.3199987411499023, 3.1916861534118652, 4.063373565673828, 4.935060501098633, 5.806747913360596, 6.678435325622559, 7.5501227378845215, 8.421810150146484, 9.293497085571289, 10.165184020996094, 11.036871910095215, 11.90855884552002, 12.78024673461914, 13.651933670043945, 14.52362060546875, 15.395308494567871, 16.26699447631836, 17.138683319091797, 18.0103702545166, 18.882057189941406, 19.75374412536621, 20.625431060791016, 21.49711799621582, 22.368804931640625, 23.240493774414062, 24.112180709838867, 24.983867645263672, 25.855554580688477, 26.72724151611328, 27.59893035888672]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 1.0, 6.0, 8.0, 11.0, 3.0, 18.0, 18.0, 15.0, 23.0, 33.0, 32.0, 50.0, 36.0, 47.0, 44.0, 50.0, 55.0, 40.0, 51.0, 54.0, 53.0, 40.0, 31.0, 33.0, 43.0, 34.0, 22.0, 28.0, 21.0, 22.0, 18.0, 14.0, 8.0, 8.0, 11.0, 3.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.412109375, -3.317779541015625, -3.22344970703125, -3.129119873046875, -3.0347900390625, -2.940460205078125, -2.84613037109375, -2.751800537109375, -2.657470703125, -2.563140869140625, -2.46881103515625, -2.374481201171875, -2.2801513671875, -2.185821533203125, -2.09149169921875, -1.997161865234375, -1.90283203125, -1.808502197265625, -1.71417236328125, -1.619842529296875, -1.5255126953125, -1.431182861328125, -1.33685302734375, -1.242523193359375, -1.148193359375, -1.053863525390625, -0.95953369140625, -0.865203857421875, -0.7708740234375, -0.676544189453125, -0.58221435546875, -0.487884521484375, -0.3935546875, -0.299224853515625, -0.20489501953125, -0.110565185546875, -0.0162353515625, 0.078094482421875, 0.17242431640625, 0.266754150390625, 0.361083984375, 0.455413818359375, 0.54974365234375, 0.644073486328125, 0.7384033203125, 0.832733154296875, 0.92706298828125, 1.021392822265625, 1.11572265625, 1.210052490234375, 1.30438232421875, 1.398712158203125, 1.4930419921875, 1.587371826171875, 1.68170166015625, 1.776031494140625, 1.870361328125, 1.964691162109375, 2.05902099609375, 2.153350830078125, 2.2476806640625, 2.342010498046875, 2.43634033203125, 2.530670166015625, 2.625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 5.0, 5.0, 9.0, 6.0, 14.0, 16.0, 19.0, 30.0, 50.0, 71.0, 74.0, 159.0, 248.0, 494.0, 1332.0, 4532.0, 21376.0, 149057.0, 1923944.0, 1910575.0, 153022.0, 22152.0, 4579.0, 1320.0, 467.0, 232.0, 142.0, 81.0, 74.0, 53.0, 26.0, 36.0, 23.0, 18.0, 11.0, 14.0, 4.0, 7.0, 1.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.65625, -14.2601318359375, -13.864013671875, -13.4678955078125, -13.07177734375, -12.6756591796875, -12.279541015625, -11.8834228515625, -11.4873046875, -11.0911865234375, -10.695068359375, -10.2989501953125, -9.90283203125, -9.5067138671875, -9.110595703125, -8.7144775390625, -8.318359375, -7.9222412109375, -7.526123046875, -7.1300048828125, -6.73388671875, -6.3377685546875, -5.941650390625, -5.5455322265625, -5.1494140625, -4.7532958984375, -4.357177734375, -3.9610595703125, -3.56494140625, -3.1688232421875, -2.772705078125, -2.3765869140625, -1.98046875, -1.5843505859375, -1.188232421875, -0.7921142578125, -0.39599609375, 0.0001220703125, 0.396240234375, 0.7923583984375, 1.1884765625, 1.5845947265625, 1.980712890625, 2.3768310546875, 2.77294921875, 3.1690673828125, 3.565185546875, 3.9613037109375, 4.357421875, 4.7535400390625, 5.149658203125, 5.5457763671875, 5.94189453125, 6.3380126953125, 6.734130859375, 7.1302490234375, 7.5263671875, 7.9224853515625, 8.318603515625, 8.7147216796875, 9.11083984375, 9.5069580078125, 9.903076171875, 10.2991943359375, 10.6953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 10.0, 11.0, 11.0, 21.0, 29.0, 47.0, 48.0, 77.0, 130.0, 175.0, 242.0, 335.0, 454.0, 541.0, 524.0, 405.0, 305.0, 219.0, 151.0, 111.0, 75.0, 50.0, 39.0, 23.0, 16.0, 8.0, 12.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1640625, -12.8331298828125, -12.502197265625, -12.1712646484375, -11.84033203125, -11.5093994140625, -11.178466796875, -10.8475341796875, -10.5166015625, -10.1856689453125, -9.854736328125, -9.5238037109375, -9.19287109375, -8.8619384765625, -8.531005859375, -8.2000732421875, -7.869140625, -7.5382080078125, -7.207275390625, -6.8763427734375, -6.54541015625, -6.2144775390625, -5.883544921875, -5.5526123046875, -5.2216796875, -4.8907470703125, -4.559814453125, -4.2288818359375, -3.89794921875, -3.5670166015625, -3.236083984375, -2.9051513671875, -2.57421875, -2.2432861328125, -1.912353515625, -1.5814208984375, -1.25048828125, -0.9195556640625, -0.588623046875, -0.2576904296875, 0.0732421875, 0.4041748046875, 0.735107421875, 1.0660400390625, 1.39697265625, 1.7279052734375, 2.058837890625, 2.3897705078125, 2.720703125, 3.0516357421875, 3.382568359375, 3.7135009765625, 4.04443359375, 4.3753662109375, 4.706298828125, 5.0372314453125, 5.3681640625, 5.6990966796875, 6.030029296875, 6.3609619140625, 6.69189453125, 7.0228271484375, 7.353759765625, 7.6846923828125, 8.015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 6.0, 18.0, 20.0, 31.0, 32.0, 73.0, 108.0, 204.0, 385.0, 772.0, 2018.0, 6704.0, 30684.0, 168932.0, 1030171.0, 2335327.0, 509419.0, 86045.0, 16488.0, 4148.0, 1330.0, 607.0, 318.0, 168.0, 100.0, 62.0, 39.0, 26.0, 9.0, 13.0, 6.0, 5.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.765625, -16.290771484375, -15.81591796875, -15.341064453125, -14.8662109375, -14.391357421875, -13.91650390625, -13.441650390625, -12.966796875, -12.491943359375, -12.01708984375, -11.542236328125, -11.0673828125, -10.592529296875, -10.11767578125, -9.642822265625, -9.16796875, -8.693115234375, -8.21826171875, -7.743408203125, -7.2685546875, -6.793701171875, -6.31884765625, -5.843994140625, -5.369140625, -4.894287109375, -4.41943359375, -3.944580078125, -3.4697265625, -2.994873046875, -2.52001953125, -2.045166015625, -1.5703125, -1.095458984375, -0.62060546875, -0.145751953125, 0.3291015625, 0.803955078125, 1.27880859375, 1.753662109375, 2.228515625, 2.703369140625, 3.17822265625, 3.653076171875, 4.1279296875, 4.602783203125, 5.07763671875, 5.552490234375, 6.02734375, 6.502197265625, 6.97705078125, 7.451904296875, 7.9267578125, 8.401611328125, 8.87646484375, 9.351318359375, 9.826171875, 10.301025390625, 10.77587890625, 11.250732421875, 11.7255859375, 12.200439453125, 12.67529296875, 13.150146484375, 13.625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 12.0, 17.0, 23.0, 43.0, 43.0, 60.0, 91.0, 100.0, 103.0, 108.0, 87.0, 87.0, 72.0, 50.0, 28.0, 28.0, 18.0, 10.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.1439323425293, -54.86574172973633, -53.58755111694336, -52.309356689453125, -51.031166076660156, -49.75297546386719, -48.47478485107422, -47.19659423828125, -45.91840362548828, -44.64021301269531, -43.362022399902344, -42.08382797241211, -40.80563735961914, -39.52744674682617, -38.2492561340332, -36.971065521240234, -35.69287109375, -34.41468048095703, -33.13648986816406, -31.85829734802246, -30.58010482788086, -29.30191421508789, -28.023723602294922, -26.745532989501953, -25.46734046936035, -24.189149856567383, -22.91095733642578, -21.632766723632812, -20.354576110839844, -19.076383590698242, -17.798192977905273, -16.520000457763672, -15.241806030273438, -13.963614463806152, -12.685422897338867, -11.407232284545898, -10.129040718078613, -8.850849151611328, -7.572658061981201, -6.294466972351074, -5.016275405883789, -3.738084077835083, -2.459892749786377, -1.181701421737671, 0.09648990631103516, 1.3746814727783203, 2.6528725624084473, 3.931063652038574, 5.209255218505859, 6.4874467849731445, 7.7656378746032715, 9.043828964233398, 10.322020530700684, 11.600212097167969, 12.878402709960938, 14.156594276428223, 15.434785842895508, 16.712976455688477, 17.991168975830078, 19.269359588623047, 20.547550201416016, 21.825742721557617, 23.103933334350586, 24.382125854492188, 25.660316467285156]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 7.0, 5.0, 10.0, 13.0, 12.0, 17.0, 19.0, 23.0, 26.0, 24.0, 36.0, 30.0, 34.0, 28.0, 37.0, 39.0, 34.0, 37.0, 44.0, 41.0, 54.0, 43.0, 41.0, 43.0, 41.0, 26.0, 31.0, 46.0, 25.0, 23.0, 16.0, 22.0, 21.0, 15.0, 9.0, 7.0, 6.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.43029022216797, -27.487995147705078, -26.545698165893555, -25.603403091430664, -24.661108016967773, -23.71881103515625, -22.77651596069336, -21.83422088623047, -20.891925811767578, -19.949630737304688, -19.007333755493164, -18.065038681030273, -17.122743606567383, -16.18044662475586, -15.238151550292969, -14.295856475830078, -13.353559494018555, -12.411263465881348, -11.468968391418457, -10.52667236328125, -9.58437728881836, -8.642081260681152, -7.699785232543945, -6.7574896812438965, -5.815194129943848, -4.872898578643799, -3.930602788925171, -2.988306999206543, -2.046011447906494, -1.1037158966064453, -0.16141986846923828, 0.7808756828308105, 1.7231693267822266, 2.6654648780822754, 3.6077606678009033, 4.550056457519531, 5.49235200881958, 6.434647560119629, 7.376943588256836, 8.319238662719727, 9.261534690856934, 10.20383071899414, 11.146125793457031, 12.088421821594238, 13.030717849731445, 13.973012924194336, 14.915308952331543, 15.85760498046875, 16.79990005493164, 17.74219512939453, 18.684492111206055, 19.626787185668945, 20.569082260131836, 21.51137924194336, 22.45367431640625, 23.39596939086914, 24.33826446533203, 25.280559539794922, 26.222856521606445, 27.165151596069336, 28.107446670532227, 29.04974365234375, 29.99203872680664, 30.93433380126953, 31.876630783081055]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 6.0, 5.0, 13.0, 11.0, 22.0, 23.0, 31.0, 33.0, 34.0, 34.0, 33.0, 49.0, 51.0, 41.0, 53.0, 41.0, 58.0, 42.0, 48.0, 30.0, 47.0, 44.0, 36.0, 35.0, 22.0, 19.0, 21.0, 25.0, 20.0, 19.0, 13.0, 7.0, 8.0, 7.0, 0.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.59375, -3.494903564453125, -3.39605712890625, -3.297210693359375, -3.1983642578125, -3.099517822265625, -3.00067138671875, -2.901824951171875, -2.802978515625, -2.704132080078125, -2.60528564453125, -2.506439208984375, -2.4075927734375, -2.308746337890625, -2.20989990234375, -2.111053466796875, -2.01220703125, -1.913360595703125, -1.81451416015625, -1.715667724609375, -1.6168212890625, -1.517974853515625, -1.41912841796875, -1.320281982421875, -1.221435546875, -1.122589111328125, -1.02374267578125, -0.924896240234375, -0.8260498046875, -0.727203369140625, -0.62835693359375, -0.529510498046875, -0.4306640625, -0.331817626953125, -0.23297119140625, -0.134124755859375, -0.0352783203125, 0.063568115234375, 0.16241455078125, 0.261260986328125, 0.360107421875, 0.458953857421875, 0.55780029296875, 0.656646728515625, 0.7554931640625, 0.854339599609375, 0.95318603515625, 1.052032470703125, 1.15087890625, 1.249725341796875, 1.34857177734375, 1.447418212890625, 1.5462646484375, 1.645111083984375, 1.74395751953125, 1.842803955078125, 1.941650390625, 2.040496826171875, 2.13934326171875, 2.238189697265625, 2.3370361328125, 2.435882568359375, 2.53472900390625, 2.633575439453125, 2.732421875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 12.0, 13.0, 20.0, 39.0, 67.0, 101.0, 158.0, 258.0, 437.0, 630.0, 1029.0, 1747.0, 2817.0, 4572.0, 7217.0, 11609.0, 18415.0, 28582.0, 43380.0, 63445.0, 88331.0, 114243.0, 133777.0, 134701.0, 114560.0, 89682.0, 64851.0, 44235.0, 29193.0, 18949.0, 11985.0, 7502.0, 4505.0, 2830.0, 1785.0, 1100.0, 704.0, 390.0, 257.0, 160.0, 107.0, 55.0, 32.0, 27.0, 23.0, 9.0, 8.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.53564453125, -0.5203514099121094, -0.5050582885742188, -0.4897651672363281, -0.4744720458984375, -0.4591789245605469, -0.44388580322265625, -0.4285926818847656, -0.413299560546875, -0.3980064392089844, -0.38271331787109375, -0.3674201965332031, -0.3521270751953125, -0.3368339538574219, -0.32154083251953125, -0.3062477111816406, -0.29095458984375, -0.2756614685058594, -0.26036834716796875, -0.24507522583007812, -0.2297821044921875, -0.21448898315429688, -0.19919586181640625, -0.18390274047851562, -0.168609619140625, -0.15331649780273438, -0.13802337646484375, -0.12273025512695312, -0.1074371337890625, -0.09214401245117188, -0.07685089111328125, -0.061557769775390625, -0.0462646484375, -0.030971527099609375, -0.01567840576171875, -0.000385284423828125, 0.0149078369140625, 0.030200958251953125, 0.04549407958984375, 0.060787200927734375, 0.076080322265625, 0.09137344360351562, 0.10666656494140625, 0.12195968627929688, 0.1372528076171875, 0.15254592895507812, 0.16783905029296875, 0.18313217163085938, 0.19842529296875, 0.21371841430664062, 0.22901153564453125, 0.24430465698242188, 0.2595977783203125, 0.2748908996582031, 0.29018402099609375, 0.3054771423339844, 0.320770263671875, 0.3360633850097656, 0.35135650634765625, 0.3666496276855469, 0.3819427490234375, 0.3972358703613281, 0.41252899169921875, 0.4278221130371094, 0.443115234375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 5.0, 5.0, 7.0, 9.0, 8.0, 15.0, 12.0, 14.0, 12.0, 23.0, 19.0, 27.0, 36.0, 34.0, 34.0, 36.0, 37.0, 36.0, 31.0, 32.0, 48.0, 1069.0, 48.0, 45.0, 36.0, 30.0, 40.0, 38.0, 31.0, 22.0, 27.0, 24.0, 17.0, 28.0, 9.0, 9.0, 17.0, 9.0, 8.0, 9.0, 7.0, 9.0, 3.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.091796875, -2.02276611328125, -1.9537353515625, -1.88470458984375, -1.815673828125, -1.74664306640625, -1.6776123046875, -1.60858154296875, -1.53955078125, -1.47052001953125, -1.4014892578125, -1.33245849609375, -1.263427734375, -1.19439697265625, -1.1253662109375, -1.05633544921875, -0.9873046875, -0.91827392578125, -0.8492431640625, -0.78021240234375, -0.711181640625, -0.64215087890625, -0.5731201171875, -0.50408935546875, -0.43505859375, -0.36602783203125, -0.2969970703125, -0.22796630859375, -0.158935546875, -0.08990478515625, -0.0208740234375, 0.04815673828125, 0.1171875, 0.18621826171875, 0.2552490234375, 0.32427978515625, 0.393310546875, 0.46234130859375, 0.5313720703125, 0.60040283203125, 0.66943359375, 0.73846435546875, 0.8074951171875, 0.87652587890625, 0.945556640625, 1.01458740234375, 1.0836181640625, 1.15264892578125, 1.2216796875, 1.29071044921875, 1.3597412109375, 1.42877197265625, 1.497802734375, 1.56683349609375, 1.6358642578125, 1.70489501953125, 1.77392578125, 1.84295654296875, 1.9119873046875, 1.98101806640625, 2.050048828125, 2.11907958984375, 2.1881103515625, 2.25714111328125, 2.326171875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 9.0, 3.0, 8.0, 11.0, 17.0, 24.0, 32.0, 49.0, 84.0, 96.0, 180.0, 335.0, 588.0, 1029.0, 1850.0, 3362.0, 6340.0, 12035.0, 22793.0, 46946.0, 1883820.0, 59878.0, 26938.0, 14321.0, 7539.0, 3908.0, 2186.0, 1119.0, 684.0, 381.0, 211.0, 117.0, 82.0, 46.0, 45.0, 17.0, 17.0, 12.0, 2.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.091796875, -1.0583343505859375, -1.024871826171875, -0.9914093017578125, -0.95794677734375, -0.9244842529296875, -0.891021728515625, -0.8575592041015625, -0.8240966796875, -0.7906341552734375, -0.757171630859375, -0.7237091064453125, -0.69024658203125, -0.6567840576171875, -0.623321533203125, -0.5898590087890625, -0.556396484375, -0.5229339599609375, -0.489471435546875, -0.4560089111328125, -0.42254638671875, -0.3890838623046875, -0.355621337890625, -0.3221588134765625, -0.2886962890625, -0.2552337646484375, -0.221771240234375, -0.1883087158203125, -0.15484619140625, -0.1213836669921875, -0.087921142578125, -0.0544586181640625, -0.02099609375, 0.0124664306640625, 0.045928955078125, 0.0793914794921875, 0.11285400390625, 0.1463165283203125, 0.179779052734375, 0.2132415771484375, 0.2467041015625, 0.2801666259765625, 0.313629150390625, 0.3470916748046875, 0.38055419921875, 0.4140167236328125, 0.447479248046875, 0.4809417724609375, 0.514404296875, 0.5478668212890625, 0.581329345703125, 0.6147918701171875, 0.64825439453125, 0.6817169189453125, 0.715179443359375, 0.7486419677734375, 0.7821044921875, 0.8155670166015625, 0.849029541015625, 0.8824920654296875, 0.91595458984375, 0.9494171142578125, 0.982879638671875, 1.0163421630859375, 1.0498046875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 4.0, 8.0, 9.0, 11.0, 3.0, 18.0, 14.0, 23.0, 50.0, 81.0, 146.0, 210.0, 156.0, 77.0, 45.0, 22.0, 11.0, 16.0, 16.0, 11.0, 5.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0394287109375, -0.03821516036987305, -0.037001609802246094, -0.03578805923461914, -0.03457450866699219, -0.033360958099365234, -0.03214740753173828, -0.030933856964111328, -0.029720306396484375, -0.028506755828857422, -0.02729320526123047, -0.026079654693603516, -0.024866104125976562, -0.02365255355834961, -0.022439002990722656, -0.021225452423095703, -0.02001190185546875, -0.018798351287841797, -0.017584800720214844, -0.01637125015258789, -0.015157699584960938, -0.013944149017333984, -0.012730598449707031, -0.011517047882080078, -0.010303497314453125, -0.009089946746826172, -0.007876396179199219, -0.006662845611572266, -0.0054492950439453125, -0.004235744476318359, -0.0030221939086914062, -0.0018086433410644531, -0.0005950927734375, 0.0006184577941894531, 0.0018320083618164062, 0.0030455589294433594, 0.0042591094970703125, 0.005472660064697266, 0.006686210632324219, 0.007899761199951172, 0.009113311767578125, 0.010326862335205078, 0.011540412902832031, 0.012753963470458984, 0.013967514038085938, 0.01518106460571289, 0.016394615173339844, 0.017608165740966797, 0.01882171630859375, 0.020035266876220703, 0.021248817443847656, 0.02246236801147461, 0.023675918579101562, 0.024889469146728516, 0.02610301971435547, 0.027316570281982422, 0.028530120849609375, 0.029743671417236328, 0.03095722198486328, 0.032170772552490234, 0.03338432312011719, 0.03459787368774414, 0.035811424255371094, 0.03702497482299805, 0.038238525390625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 12.0, 11.0, 11.0, 11.0, 18.0, 24.0, 46.0, 58.0, 128.0, 184.0, 329.0, 832.0, 2068.0, 6131.0, 29041.0, 860093.0, 129980.0, 13154.0, 3704.0, 1421.0, 613.0, 280.0, 125.0, 62.0, 45.0, 37.0, 24.0, 23.0, 12.0, 11.0, 11.0, 8.0, 10.0, 6.0, 2.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0], "bins": [-0.88134765625, -0.8580169677734375, -0.834686279296875, -0.8113555908203125, -0.78802490234375, -0.7646942138671875, -0.741363525390625, -0.7180328369140625, -0.6947021484375, -0.6713714599609375, -0.648040771484375, -0.6247100830078125, -0.60137939453125, -0.5780487060546875, -0.554718017578125, -0.5313873291015625, -0.508056640625, -0.4847259521484375, -0.461395263671875, -0.4380645751953125, -0.41473388671875, -0.3914031982421875, -0.368072509765625, -0.3447418212890625, -0.3214111328125, -0.2980804443359375, -0.274749755859375, -0.2514190673828125, -0.22808837890625, -0.2047576904296875, -0.181427001953125, -0.1580963134765625, -0.134765625, -0.1114349365234375, -0.088104248046875, -0.0647735595703125, -0.04144287109375, -0.0181121826171875, 0.005218505859375, 0.0285491943359375, 0.0518798828125, 0.0752105712890625, 0.098541259765625, 0.1218719482421875, 0.14520263671875, 0.1685333251953125, 0.191864013671875, 0.2151947021484375, 0.238525390625, 0.2618560791015625, 0.285186767578125, 0.3085174560546875, 0.33184814453125, 0.3551788330078125, 0.378509521484375, 0.4018402099609375, 0.4251708984375, 0.4485015869140625, 0.471832275390625, 0.4951629638671875, 0.51849365234375, 0.5418243408203125, 0.565155029296875, 0.5884857177734375, 0.61181640625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 11.0, 16.0, 19.0, 44.0, 93.0, 202.0, 368.0, 134.0, 54.0, 24.0, 14.0, 9.0, 10.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9064396023750305, -0.8884613513946533, -0.8704831004142761, -0.8525048494338989, -0.8345265984535217, -0.8165483474731445, -0.7985700964927673, -0.7805918455123901, -0.7626135945320129, -0.7446353435516357, -0.7266570925712585, -0.7086788415908813, -0.6907005906105042, -0.672722339630127, -0.6547440886497498, -0.6367658376693726, -0.6187876462936401, -0.6008093953132629, -0.5828311443328857, -0.5648528933525085, -0.5468746423721313, -0.5288963913917542, -0.510918140411377, -0.49293988943099976, -0.47496163845062256, -0.45698338747024536, -0.43900513648986816, -0.42102688550949097, -0.40304863452911377, -0.3850703835487366, -0.3670921325683594, -0.3491138815879822, -0.33113566040992737, -0.31315740942955017, -0.295179158449173, -0.2772009074687958, -0.2592226564884186, -0.24124440550804138, -0.22326616942882538, -0.20528791844844818, -0.18730966746807098, -0.1693314164876938, -0.1513531655073166, -0.13337492942810059, -0.11539667099714279, -0.0974184200167656, -0.079440176486969, -0.0614619255065918, -0.0434836745262146, -0.02550542540848255, -0.0075271762907505035, 0.010451070964336395, 0.028429321944713593, 0.04640757292509079, 0.06438581645488739, 0.08236406743526459, 0.10034231841564178, 0.11832056939601898, 0.13629882037639618, 0.15427705645561218, 0.17225530743598938, 0.19023355841636658, 0.20821180939674377, 0.22619006037712097, 0.24416831135749817]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 6.0, 17.0, 10.0, 14.0, 14.0, 20.0, 25.0, 29.0, 30.0, 39.0, 40.0, 31.0, 38.0, 39.0, 39.0, 45.0, 38.0, 35.0, 46.0, 38.0, 39.0, 47.0, 32.0, 28.0, 31.0, 24.0, 33.0, 19.0, 21.0, 22.0, 15.0, 18.0, 15.0, 13.0, 5.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07152998447418213, -0.06935515254735947, -0.06718031316995621, -0.06500548124313354, -0.06283064186573029, -0.06065580993890762, -0.05848097801208496, -0.056306142359972, -0.05413130670785904, -0.05195647105574608, -0.04978163540363312, -0.047606803476810455, -0.045431967824697495, -0.043257132172584534, -0.04108230024576187, -0.03890746459364891, -0.03673262894153595, -0.03455779328942299, -0.03238295763731003, -0.030208125710487366, -0.028033290058374405, -0.025858454406261444, -0.023683620616793633, -0.02150878682732582, -0.01933395117521286, -0.0171591155230999, -0.014984281733632088, -0.012809447012841702, -0.010634612292051315, -0.008459777571260929, -0.006284942850470543, -0.004110108129680157, -0.0019352734088897705, 0.0002395613119006157, 0.002414396032691002, 0.004589230753481388, 0.006764065474271774, 0.00893890019506216, 0.011113734915852547, 0.013288569636642933, 0.015463404357433319, 0.01763824000954628, 0.01981307379901409, 0.021987907588481903, 0.024162743240594864, 0.026337578892707825, 0.028512412682175636, 0.030687246471643448, 0.03286208212375641, 0.03503691777586937, 0.03721175342798233, 0.03938658535480499, 0.041561421006917953, 0.043736256659030914, 0.04591108858585358, 0.04808592423796654, 0.0502607598900795, 0.05243559554219246, 0.05461043119430542, 0.05678526312112808, 0.05896009877324104, 0.061134934425354004, 0.06330976635217667, 0.06548460572957993, 0.06765943765640259]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 6.0, 3.0, 10.0, 13.0, 14.0, 17.0, 24.0, 27.0, 35.0, 32.0, 33.0, 38.0, 34.0, 38.0, 48.0, 46.0, 62.0, 50.0, 40.0, 39.0, 46.0, 40.0, 50.0, 49.0, 36.0, 26.0, 22.0, 22.0, 19.0, 12.0, 13.0, 11.0, 8.0, 8.0, 5.0, 5.0, 4.0, 5.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.289947509765625, -3.19122314453125, -3.092498779296875, -2.9937744140625, -2.895050048828125, -2.79632568359375, -2.697601318359375, -2.598876953125, -2.500152587890625, -2.40142822265625, -2.302703857421875, -2.2039794921875, -2.105255126953125, -2.00653076171875, -1.907806396484375, -1.80908203125, -1.710357666015625, -1.61163330078125, -1.512908935546875, -1.4141845703125, -1.315460205078125, -1.21673583984375, -1.118011474609375, -1.019287109375, -0.920562744140625, -0.82183837890625, -0.723114013671875, -0.6243896484375, -0.525665283203125, -0.42694091796875, -0.328216552734375, -0.2294921875, -0.130767822265625, -0.03204345703125, 0.066680908203125, 0.1654052734375, 0.264129638671875, 0.36285400390625, 0.461578369140625, 0.560302734375, 0.659027099609375, 0.75775146484375, 0.856475830078125, 0.9552001953125, 1.053924560546875, 1.15264892578125, 1.251373291015625, 1.35009765625, 1.448822021484375, 1.54754638671875, 1.646270751953125, 1.7449951171875, 1.843719482421875, 1.94244384765625, 2.041168212890625, 2.139892578125, 2.238616943359375, 2.33734130859375, 2.436065673828125, 2.5347900390625, 2.633514404296875, 2.73223876953125, 2.830963134765625, 2.9296875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 6.0, 15.0, 17.0, 30.0, 33.0, 46.0, 100.0, 130.0, 211.0, 299.0, 477.0, 718.0, 1228.0, 2061.0, 3354.0, 5687.0, 10164.0, 17961.0, 34071.0, 74011.0, 182765.0, 351084.0, 201373.0, 81238.0, 36641.0, 19182.0, 10329.0, 5986.0, 3598.0, 2212.0, 1312.0, 762.0, 490.0, 336.0, 221.0, 129.0, 103.0, 61.0, 44.0, 22.0, 11.0, 9.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.087890625, -2.98681640625, -2.8857421875, -2.78466796875, -2.68359375, -2.58251953125, -2.4814453125, -2.38037109375, -2.279296875, -2.17822265625, -2.0771484375, -1.97607421875, -1.875, -1.77392578125, -1.6728515625, -1.57177734375, -1.470703125, -1.36962890625, -1.2685546875, -1.16748046875, -1.06640625, -0.96533203125, -0.8642578125, -0.76318359375, -0.662109375, -0.56103515625, -0.4599609375, -0.35888671875, -0.2578125, -0.15673828125, -0.0556640625, 0.04541015625, 0.146484375, 0.24755859375, 0.3486328125, 0.44970703125, 0.55078125, 0.65185546875, 0.7529296875, 0.85400390625, 0.955078125, 1.05615234375, 1.1572265625, 1.25830078125, 1.359375, 1.46044921875, 1.5615234375, 1.66259765625, 1.763671875, 1.86474609375, 1.9658203125, 2.06689453125, 2.16796875, 2.26904296875, 2.3701171875, 2.47119140625, 2.572265625, 2.67333984375, 2.7744140625, 2.87548828125, 2.9765625, 3.07763671875, 3.1787109375, 3.27978515625, 3.380859375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 3.0, 12.0, 11.0, 11.0, 11.0, 14.0, 24.0, 16.0, 22.0, 22.0, 42.0, 34.0, 32.0, 42.0, 34.0, 70.0, 64.0, 112.0, 258.0, 1472.0, 198.0, 123.0, 53.0, 46.0, 32.0, 32.0, 27.0, 29.0, 28.0, 25.0, 19.0, 18.0, 13.0, 15.0, 10.0, 14.0, 10.0, 10.0, 9.0, 6.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -11.0167236328125, -10.705322265625, -10.3939208984375, -10.08251953125, -9.7711181640625, -9.459716796875, -9.1483154296875, -8.8369140625, -8.5255126953125, -8.214111328125, -7.9027099609375, -7.59130859375, -7.2799072265625, -6.968505859375, -6.6571044921875, -6.345703125, -6.0343017578125, -5.722900390625, -5.4114990234375, -5.10009765625, -4.7886962890625, -4.477294921875, -4.1658935546875, -3.8544921875, -3.5430908203125, -3.231689453125, -2.9202880859375, -2.60888671875, -2.2974853515625, -1.986083984375, -1.6746826171875, -1.36328125, -1.0518798828125, -0.740478515625, -0.4290771484375, -0.11767578125, 0.1937255859375, 0.505126953125, 0.8165283203125, 1.1279296875, 1.4393310546875, 1.750732421875, 2.0621337890625, 2.37353515625, 2.6849365234375, 2.996337890625, 3.3077392578125, 3.619140625, 3.9305419921875, 4.241943359375, 4.5533447265625, 4.86474609375, 5.1761474609375, 5.487548828125, 5.7989501953125, 6.1103515625, 6.4217529296875, 6.733154296875, 7.0445556640625, 7.35595703125, 7.6673583984375, 7.978759765625, 8.2901611328125, 8.6015625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 12.0, 15.0, 15.0, 15.0, 20.0, 23.0, 37.0, 46.0, 60.0, 113.0, 144.0, 269.0, 573.0, 1622.0, 7260.0, 71398.0, 2274829.0, 750787.0, 31834.0, 4282.0, 1148.0, 462.0, 241.0, 125.0, 77.0, 63.0, 47.0, 37.0, 23.0, 20.0, 16.0, 16.0, 14.0, 10.0, 6.0, 6.0, 4.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.03125, -12.563232421875, -12.09521484375, -11.627197265625, -11.1591796875, -10.691162109375, -10.22314453125, -9.755126953125, -9.287109375, -8.819091796875, -8.35107421875, -7.883056640625, -7.4150390625, -6.947021484375, -6.47900390625, -6.010986328125, -5.54296875, -5.074951171875, -4.60693359375, -4.138916015625, -3.6708984375, -3.202880859375, -2.73486328125, -2.266845703125, -1.798828125, -1.330810546875, -0.86279296875, -0.394775390625, 0.0732421875, 0.541259765625, 1.00927734375, 1.477294921875, 1.9453125, 2.413330078125, 2.88134765625, 3.349365234375, 3.8173828125, 4.285400390625, 4.75341796875, 5.221435546875, 5.689453125, 6.157470703125, 6.62548828125, 7.093505859375, 7.5615234375, 8.029541015625, 8.49755859375, 8.965576171875, 9.43359375, 9.901611328125, 10.36962890625, 10.837646484375, 11.3056640625, 11.773681640625, 12.24169921875, 12.709716796875, 13.177734375, 13.645751953125, 14.11376953125, 14.581787109375, 15.0498046875, 15.517822265625, 15.98583984375, 16.453857421875, 16.921875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 23.0, 164.0, 412.0, 311.0, 91.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.462188720703125, -44.22444152832031, -41.9866943359375, -39.74894714355469, -37.51119613647461, -35.2734489440918, -33.035701751708984, -30.797954559326172, -28.560205459594727, -26.322458267211914, -24.08470916748047, -21.846961975097656, -19.609214782714844, -17.3714656829834, -15.133718490600586, -12.895970344543457, -10.658222198486328, -8.4204740524292, -6.1827263832092285, -3.944978713989258, -1.707230567932129, 0.530517578125, 2.7682647705078125, 5.006012916564941, 7.24376106262207, 9.4815092086792, 11.719257354736328, 13.95700454711914, 16.194751739501953, 18.4325008392334, 20.67024803161621, 22.907997131347656, 25.14574432373047, 27.38349151611328, 29.621240615844727, 31.85898780822754, 34.096736907958984, 36.3344841003418, 38.57223129272461, 40.80997848510742, 43.0477294921875, 45.28547668457031, 47.523223876953125, 49.76097106933594, 51.998722076416016, 54.23646926879883, 56.47421646118164, 58.71196365356445, 60.949710845947266, 63.18745803833008, 65.42520904541016, 67.66295623779297, 69.90070343017578, 72.1384506225586, 74.3761978149414, 76.61394500732422, 78.85169219970703, 81.08943939208984, 83.32718658447266, 85.56493377685547, 87.80268096923828, 90.04043579101562, 92.27818298339844, 94.51593017578125, 96.75367736816406]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 9.0, 8.0, 5.0, 4.0, 9.0, 7.0, 13.0, 16.0, 11.0, 11.0, 17.0, 25.0, 27.0, 24.0, 33.0, 34.0, 33.0, 31.0, 27.0, 35.0, 43.0, 41.0, 43.0, 41.0, 51.0, 30.0, 31.0, 40.0, 39.0, 23.0, 25.0, 27.0, 24.0, 27.0, 24.0, 19.0, 14.0, 16.0, 12.0, 11.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-31.448070526123047, -30.444339752197266, -29.440610885620117, -28.43688201904297, -27.433151245117188, -26.429420471191406, -25.425691604614258, -24.42196273803711, -23.418231964111328, -22.414501190185547, -21.4107723236084, -20.40704345703125, -19.40331268310547, -18.399581909179688, -17.39585304260254, -16.39212417602539, -15.38839340209961, -14.384663581848145, -13.38093376159668, -12.377203941345215, -11.37347412109375, -10.369744300842285, -9.36601448059082, -8.362284660339355, -7.358554840087891, -6.354825019836426, -5.351095199584961, -4.347365379333496, -3.3436355590820312, -2.3399057388305664, -1.3361759185791016, -0.3324460983276367, 0.6712799072265625, 1.6750097274780273, 2.678739547729492, 3.682469367980957, 4.686199188232422, 5.689929008483887, 6.693658828735352, 7.697388648986816, 8.701118469238281, 9.704848289489746, 10.708578109741211, 11.712307929992676, 12.71603775024414, 13.719767570495605, 14.72349739074707, 15.727227210998535, 16.73095703125, 17.73468780517578, 18.73841667175293, 19.742145538330078, 20.74587631225586, 21.74960708618164, 22.75333595275879, 23.757064819335938, 24.76079559326172, 25.7645263671875, 26.76825523376465, 27.771984100341797, 28.775714874267578, 29.77944564819336, 30.783174514770508, 31.786903381347656, 32.79063415527344]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 10.0, 7.0, 19.0, 17.0, 24.0, 31.0, 26.0, 41.0, 30.0, 40.0, 37.0, 52.0, 50.0, 36.0, 44.0, 56.0, 52.0, 61.0, 47.0, 31.0, 44.0, 32.0, 36.0, 31.0, 28.0, 21.0, 21.0, 21.0, 15.0, 4.0, 2.0, 10.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.9644775390625, -3.854736328125, -3.7449951171875, -3.63525390625, -3.5255126953125, -3.415771484375, -3.3060302734375, -3.1962890625, -3.0865478515625, -2.976806640625, -2.8670654296875, -2.75732421875, -2.6475830078125, -2.537841796875, -2.4281005859375, -2.318359375, -2.2086181640625, -2.098876953125, -1.9891357421875, -1.87939453125, -1.7696533203125, -1.659912109375, -1.5501708984375, -1.4404296875, -1.3306884765625, -1.220947265625, -1.1112060546875, -1.00146484375, -0.8917236328125, -0.781982421875, -0.6722412109375, -0.5625, -0.4527587890625, -0.343017578125, -0.2332763671875, -0.12353515625, -0.0137939453125, 0.095947265625, 0.2056884765625, 0.3154296875, 0.4251708984375, 0.534912109375, 0.6446533203125, 0.75439453125, 0.8641357421875, 0.973876953125, 1.0836181640625, 1.193359375, 1.3031005859375, 1.412841796875, 1.5225830078125, 1.63232421875, 1.7420654296875, 1.851806640625, 1.9615478515625, 2.0712890625, 2.1810302734375, 2.290771484375, 2.4005126953125, 2.51025390625, 2.6199951171875, 2.729736328125, 2.8394775390625, 2.94921875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 9.0, 8.0, 19.0, 23.0, 31.0, 25.0, 51.0, 74.0, 96.0, 146.0, 241.0, 551.0, 1200.0, 3764.0, 15249.0, 76720.0, 571839.0, 2821094.0, 599490.0, 80822.0, 16039.0, 4179.0, 1337.0, 511.0, 260.0, 156.0, 87.0, 72.0, 52.0, 20.0, 20.0, 21.0, 22.0, 15.0, 10.0, 7.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.25, -11.905029296875, -11.56005859375, -11.215087890625, -10.8701171875, -10.525146484375, -10.18017578125, -9.835205078125, -9.490234375, -9.145263671875, -8.80029296875, -8.455322265625, -8.1103515625, -7.765380859375, -7.42041015625, -7.075439453125, -6.73046875, -6.385498046875, -6.04052734375, -5.695556640625, -5.3505859375, -5.005615234375, -4.66064453125, -4.315673828125, -3.970703125, -3.625732421875, -3.28076171875, -2.935791015625, -2.5908203125, -2.245849609375, -1.90087890625, -1.555908203125, -1.2109375, -0.865966796875, -0.52099609375, -0.176025390625, 0.1689453125, 0.513916015625, 0.85888671875, 1.203857421875, 1.548828125, 1.893798828125, 2.23876953125, 2.583740234375, 2.9287109375, 3.273681640625, 3.61865234375, 3.963623046875, 4.30859375, 4.653564453125, 4.99853515625, 5.343505859375, 5.6884765625, 6.033447265625, 6.37841796875, 6.723388671875, 7.068359375, 7.413330078125, 7.75830078125, 8.103271484375, 8.4482421875, 8.793212890625, 9.13818359375, 9.483154296875, 9.828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 8.0, 7.0, 5.0, 25.0, 29.0, 45.0, 58.0, 85.0, 112.0, 136.0, 187.0, 272.0, 399.0, 464.0, 499.0, 468.0, 363.0, 262.0, 178.0, 134.0, 109.0, 64.0, 38.0, 35.0, 25.0, 13.0, 11.0, 13.0, 4.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6484375, -9.3406982421875, -9.032958984375, -8.7252197265625, -8.41748046875, -8.1097412109375, -7.802001953125, -7.4942626953125, -7.1865234375, -6.8787841796875, -6.571044921875, -6.2633056640625, -5.95556640625, -5.6478271484375, -5.340087890625, -5.0323486328125, -4.724609375, -4.4168701171875, -4.109130859375, -3.8013916015625, -3.49365234375, -3.1859130859375, -2.878173828125, -2.5704345703125, -2.2626953125, -1.9549560546875, -1.647216796875, -1.3394775390625, -1.03173828125, -0.7239990234375, -0.416259765625, -0.1085205078125, 0.19921875, 0.5069580078125, 0.814697265625, 1.1224365234375, 1.43017578125, 1.7379150390625, 2.045654296875, 2.3533935546875, 2.6611328125, 2.9688720703125, 3.276611328125, 3.5843505859375, 3.89208984375, 4.1998291015625, 4.507568359375, 4.8153076171875, 5.123046875, 5.4307861328125, 5.738525390625, 6.0462646484375, 6.35400390625, 6.6617431640625, 6.969482421875, 7.2772216796875, 7.5849609375, 7.8927001953125, 8.200439453125, 8.5081787109375, 8.81591796875, 9.1236572265625, 9.431396484375, 9.7391357421875, 10.046875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 1.0, 8.0, 10.0, 13.0, 18.0, 34.0, 60.0, 76.0, 92.0, 198.0, 357.0, 726.0, 1754.0, 5577.0, 25723.0, 161767.0, 1160353.0, 2349340.0, 412512.0, 59588.0, 11013.0, 2858.0, 1023.0, 482.0, 255.0, 153.0, 85.0, 67.0, 44.0, 29.0, 22.0, 9.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.953125, -16.42724609375, -15.9013671875, -15.37548828125, -14.849609375, -14.32373046875, -13.7978515625, -13.27197265625, -12.74609375, -12.22021484375, -11.6943359375, -11.16845703125, -10.642578125, -10.11669921875, -9.5908203125, -9.06494140625, -8.5390625, -8.01318359375, -7.4873046875, -6.96142578125, -6.435546875, -5.90966796875, -5.3837890625, -4.85791015625, -4.33203125, -3.80615234375, -3.2802734375, -2.75439453125, -2.228515625, -1.70263671875, -1.1767578125, -0.65087890625, -0.125, 0.40087890625, 0.9267578125, 1.45263671875, 1.978515625, 2.50439453125, 3.0302734375, 3.55615234375, 4.08203125, 4.60791015625, 5.1337890625, 5.65966796875, 6.185546875, 6.71142578125, 7.2373046875, 7.76318359375, 8.2890625, 8.81494140625, 9.3408203125, 9.86669921875, 10.392578125, 10.91845703125, 11.4443359375, 11.97021484375, 12.49609375, 13.02197265625, 13.5478515625, 14.07373046875, 14.599609375, 15.12548828125, 15.6513671875, 16.17724609375, 16.703125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 9.0, 12.0, 19.0, 29.0, 64.0, 67.0, 96.0, 90.0, 121.0, 112.0, 104.0, 91.0, 68.0, 50.0, 26.0, 18.0, 19.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-83.0816879272461, -81.41362762451172, -79.74556732177734, -78.0775146484375, -76.40945434570312, -74.74139404296875, -73.07333374023438, -71.4052734375, -69.73721313476562, -68.06915283203125, -66.40109252929688, -64.7330322265625, -63.06497573852539, -61.39691925048828, -59.728858947753906, -58.06079864501953, -56.39274215698242, -54.72468185424805, -53.05662536621094, -51.38856506347656, -49.72050476074219, -48.05244445800781, -46.3843879699707, -44.71632766723633, -43.04827117919922, -41.380210876464844, -39.712154388427734, -38.04409408569336, -36.376033782958984, -34.707977294921875, -33.0399169921875, -31.371856689453125, -29.703792572021484, -28.035734176635742, -26.367673873901367, -24.699615478515625, -23.03155517578125, -21.363496780395508, -19.695438385009766, -18.02737808227539, -16.35931968688965, -14.69126033782959, -13.023200988769531, -11.355142593383789, -9.68708324432373, -8.019023895263672, -6.35096549987793, -4.682906150817871, -3.0148468017578125, -1.346787691116333, 0.3212714195251465, 1.9893302917480469, 3.6573896408081055, 5.325448989868164, 6.993507385253906, 8.661566734313965, 10.329626083374023, 11.997685432434082, 13.66574478149414, 15.333803176879883, 17.001861572265625, 18.669921875, 20.337980270385742, 22.006038665771484, 23.67409896850586]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 9.0, 7.0, 9.0, 8.0, 18.0, 23.0, 20.0, 24.0, 27.0, 31.0, 26.0, 34.0, 36.0, 44.0, 35.0, 40.0, 47.0, 46.0, 51.0, 38.0, 33.0, 40.0, 43.0, 47.0, 34.0, 33.0, 35.0, 17.0, 22.0, 19.0, 19.0, 15.0, 14.0, 13.0, 10.0, 6.0, 10.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.321483612060547, -29.324167251586914, -28.32684898376465, -27.329532623291016, -26.33221435546875, -25.334897994995117, -24.337581634521484, -23.34026336669922, -22.342945098876953, -21.34562873840332, -20.348310470581055, -19.350994110107422, -18.353675842285156, -17.356359481811523, -16.35904312133789, -15.361724853515625, -14.364408493041992, -13.367091178894043, -12.369773864746094, -11.372457504272461, -10.375139236450195, -9.377822875976562, -8.380505561828613, -7.383188247680664, -6.385870933532715, -5.388553619384766, -4.391236305236816, -3.3939194679260254, -2.396602153778076, -1.399284839630127, -0.40196800231933594, 0.5953493118286133, 1.5926666259765625, 2.5899839401245117, 3.587301015853882, 4.584618091583252, 5.581935405731201, 6.57925271987915, 7.576569557189941, 8.57388687133789, 9.57120418548584, 10.568521499633789, 11.565838813781738, 12.563156127929688, 13.56047248840332, 14.557790756225586, 15.555107116699219, 16.552425384521484, 17.549741744995117, 18.54705810546875, 19.544376373291016, 20.54169273376465, 21.539011001586914, 22.536327362060547, 23.533645629882812, 24.530961990356445, 25.528278350830078, 26.52559471130371, 27.522912979125977, 28.52022933959961, 29.517547607421875, 30.514863967895508, 31.51218032836914, 32.509498596191406, 33.50681686401367]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 5.0, 6.0, 4.0, 6.0, 18.0, 18.0, 17.0, 21.0, 23.0, 33.0, 39.0, 39.0, 41.0, 30.0, 54.0, 29.0, 40.0, 44.0, 60.0, 40.0, 50.0, 49.0, 39.0, 43.0, 34.0, 25.0, 26.0, 27.0, 25.0, 27.0, 23.0, 8.0, 12.0, 6.0, 8.0, 8.0, 8.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.607421875, -3.505462646484375, -3.40350341796875, -3.301544189453125, -3.1995849609375, -3.097625732421875, -2.99566650390625, -2.893707275390625, -2.791748046875, -2.689788818359375, -2.58782958984375, -2.485870361328125, -2.3839111328125, -2.281951904296875, -2.17999267578125, -2.078033447265625, -1.97607421875, -1.874114990234375, -1.77215576171875, -1.670196533203125, -1.5682373046875, -1.466278076171875, -1.36431884765625, -1.262359619140625, -1.160400390625, -1.058441162109375, -0.95648193359375, -0.854522705078125, -0.7525634765625, -0.650604248046875, -0.54864501953125, -0.446685791015625, -0.3447265625, -0.242767333984375, -0.14080810546875, -0.038848876953125, 0.0631103515625, 0.165069580078125, 0.26702880859375, 0.368988037109375, 0.470947265625, 0.572906494140625, 0.67486572265625, 0.776824951171875, 0.8787841796875, 0.980743408203125, 1.08270263671875, 1.184661865234375, 1.28662109375, 1.388580322265625, 1.49053955078125, 1.592498779296875, 1.6944580078125, 1.796417236328125, 1.89837646484375, 2.000335693359375, 2.102294921875, 2.204254150390625, 2.30621337890625, 2.408172607421875, 2.5101318359375, 2.612091064453125, 2.71405029296875, 2.816009521484375, 2.91796875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 10.0, 7.0, 16.0, 10.0, 28.0, 32.0, 67.0, 80.0, 160.0, 257.0, 451.0, 905.0, 1773.0, 3752.0, 7792.0, 17038.0, 35814.0, 72520.0, 133765.0, 201774.0, 220175.0, 164061.0, 95624.0, 48468.0, 23079.0, 10785.0, 5048.0, 2401.0, 1213.0, 621.0, 322.0, 184.0, 105.0, 83.0, 41.0, 39.0, 21.0, 10.0, 11.0, 5.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.921875, -0.891357421875, -0.86083984375, -0.830322265625, -0.7998046875, -0.769287109375, -0.73876953125, -0.708251953125, -0.677734375, -0.647216796875, -0.61669921875, -0.586181640625, -0.5556640625, -0.525146484375, -0.49462890625, -0.464111328125, -0.43359375, -0.403076171875, -0.37255859375, -0.342041015625, -0.3115234375, -0.281005859375, -0.25048828125, -0.219970703125, -0.189453125, -0.158935546875, -0.12841796875, -0.097900390625, -0.0673828125, -0.036865234375, -0.00634765625, 0.024169921875, 0.0546875, 0.085205078125, 0.11572265625, 0.146240234375, 0.1767578125, 0.207275390625, 0.23779296875, 0.268310546875, 0.298828125, 0.329345703125, 0.35986328125, 0.390380859375, 0.4208984375, 0.451416015625, 0.48193359375, 0.512451171875, 0.54296875, 0.573486328125, 0.60400390625, 0.634521484375, 0.6650390625, 0.695556640625, 0.72607421875, 0.756591796875, 0.787109375, 0.817626953125, 0.84814453125, 0.878662109375, 0.9091796875, 0.939697265625, 0.97021484375, 1.000732421875, 1.03125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 6.0, 7.0, 13.0, 20.0, 9.0, 17.0, 28.0, 28.0, 19.0, 21.0, 31.0, 41.0, 40.0, 37.0, 38.0, 51.0, 37.0, 44.0, 1073.0, 40.0, 39.0, 32.0, 36.0, 36.0, 35.0, 37.0, 25.0, 22.0, 21.0, 19.0, 25.0, 12.0, 22.0, 7.0, 12.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.669921875, -2.593902587890625, -2.51788330078125, -2.441864013671875, -2.3658447265625, -2.289825439453125, -2.21380615234375, -2.137786865234375, -2.061767578125, -1.985748291015625, -1.90972900390625, -1.833709716796875, -1.7576904296875, -1.681671142578125, -1.60565185546875, -1.529632568359375, -1.45361328125, -1.377593994140625, -1.30157470703125, -1.225555419921875, -1.1495361328125, -1.073516845703125, -0.99749755859375, -0.921478271484375, -0.845458984375, -0.769439697265625, -0.69342041015625, -0.617401123046875, -0.5413818359375, -0.465362548828125, -0.38934326171875, -0.313323974609375, -0.2373046875, -0.161285400390625, -0.08526611328125, -0.009246826171875, 0.0667724609375, 0.142791748046875, 0.21881103515625, 0.294830322265625, 0.370849609375, 0.446868896484375, 0.52288818359375, 0.598907470703125, 0.6749267578125, 0.750946044921875, 0.82696533203125, 0.902984619140625, 0.97900390625, 1.055023193359375, 1.13104248046875, 1.207061767578125, 1.2830810546875, 1.359100341796875, 1.43511962890625, 1.511138916015625, 1.587158203125, 1.663177490234375, 1.73919677734375, 1.815216064453125, 1.8912353515625, 1.967254638671875, 2.04327392578125, 2.119293212890625, 2.1953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 0.0, 8.0, 10.0, 11.0, 24.0, 27.0, 60.0, 91.0, 149.0, 308.0, 573.0, 1272.0, 3044.0, 7527.0, 19118.0, 51365.0, 1909771.0, 64596.0, 23297.0, 9230.0, 3709.0, 1515.0, 682.0, 325.0, 158.0, 85.0, 51.0, 37.0, 20.0, 19.0, 12.0, 10.0, 2.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9130859375, -1.8561553955078125, -1.799224853515625, -1.7422943115234375, -1.68536376953125, -1.6284332275390625, -1.571502685546875, -1.5145721435546875, -1.4576416015625, -1.4007110595703125, -1.343780517578125, -1.2868499755859375, -1.22991943359375, -1.1729888916015625, -1.116058349609375, -1.0591278076171875, -1.002197265625, -0.9452667236328125, -0.888336181640625, -0.8314056396484375, -0.77447509765625, -0.7175445556640625, -0.660614013671875, -0.6036834716796875, -0.5467529296875, -0.4898223876953125, -0.432891845703125, -0.3759613037109375, -0.31903076171875, -0.2621002197265625, -0.205169677734375, -0.1482391357421875, -0.09130859375, -0.0343780517578125, 0.022552490234375, 0.0794830322265625, 0.13641357421875, 0.1933441162109375, 0.250274658203125, 0.3072052001953125, 0.3641357421875, 0.4210662841796875, 0.477996826171875, 0.5349273681640625, 0.59185791015625, 0.6487884521484375, 0.705718994140625, 0.7626495361328125, 0.819580078125, 0.8765106201171875, 0.933441162109375, 0.9903717041015625, 1.04730224609375, 1.1042327880859375, 1.161163330078125, 1.2180938720703125, 1.2750244140625, 1.3319549560546875, 1.388885498046875, 1.4458160400390625, 1.50274658203125, 1.5596771240234375, 1.616607666015625, 1.6735382080078125, 1.73046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 4.0, 4.0, 10.0, 8.0, 16.0, 22.0, 38.0, 41.0, 61.0, 71.0, 130.0, 203.0, 132.0, 68.0, 61.0, 31.0, 18.0, 15.0, 11.0, 7.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11724853515625, -0.1138315200805664, -0.11041450500488281, -0.10699748992919922, -0.10358047485351562, -0.10016345977783203, -0.09674644470214844, -0.09332942962646484, -0.08991241455078125, -0.08649539947509766, -0.08307838439941406, -0.07966136932373047, -0.07624435424804688, -0.07282733917236328, -0.06941032409667969, -0.0659933090209961, -0.0625762939453125, -0.059159278869628906, -0.05574226379394531, -0.05232524871826172, -0.048908233642578125, -0.04549121856689453, -0.04207420349121094, -0.038657188415527344, -0.03524017333984375, -0.031823158264160156, -0.028406143188476562, -0.02498912811279297, -0.021572113037109375, -0.01815509796142578, -0.014738082885742188, -0.011321067810058594, -0.007904052734375, -0.004487037658691406, -0.0010700225830078125, 0.0023469924926757812, 0.005764007568359375, 0.009181022644042969, 0.012598037719726562, 0.016015052795410156, 0.01943206787109375, 0.022849082946777344, 0.026266098022460938, 0.02968311309814453, 0.033100128173828125, 0.03651714324951172, 0.03993415832519531, 0.043351173400878906, 0.0467681884765625, 0.050185203552246094, 0.05360221862792969, 0.05701923370361328, 0.060436248779296875, 0.06385326385498047, 0.06727027893066406, 0.07068729400634766, 0.07410430908203125, 0.07752132415771484, 0.08093833923339844, 0.08435535430908203, 0.08777236938476562, 0.09118938446044922, 0.09460639953613281, 0.0980234146118164, 0.1014404296875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 3.0, 10.0, 9.0, 14.0, 25.0, 41.0, 49.0, 83.0, 223.0, 706.0, 3011.0, 22614.0, 998113.0, 19644.0, 2926.0, 633.0, 186.0, 77.0, 52.0, 24.0, 18.0, 15.0, 19.0, 8.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.624267578125, -2.54345703125, -2.462646484375, -2.3818359375, -2.301025390625, -2.22021484375, -2.139404296875, -2.05859375, -1.977783203125, -1.89697265625, -1.816162109375, -1.7353515625, -1.654541015625, -1.57373046875, -1.492919921875, -1.412109375, -1.331298828125, -1.25048828125, -1.169677734375, -1.0888671875, -1.008056640625, -0.92724609375, -0.846435546875, -0.765625, -0.684814453125, -0.60400390625, -0.523193359375, -0.4423828125, -0.361572265625, -0.28076171875, -0.199951171875, -0.119140625, -0.038330078125, 0.04248046875, 0.123291015625, 0.2041015625, 0.284912109375, 0.36572265625, 0.446533203125, 0.52734375, 0.608154296875, 0.68896484375, 0.769775390625, 0.8505859375, 0.931396484375, 1.01220703125, 1.093017578125, 1.173828125, 1.254638671875, 1.33544921875, 1.416259765625, 1.4970703125, 1.577880859375, 1.65869140625, 1.739501953125, 1.8203125, 1.901123046875, 1.98193359375, 2.062744140625, 2.1435546875, 2.224365234375, 2.30517578125, 2.385986328125, 2.466796875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 6.0, 4.0, 12.0, 16.0, 16.0, 33.0, 41.0, 65.0, 128.0, 174.0, 197.0, 123.0, 66.0, 34.0, 22.0, 22.0, 12.0, 9.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.6788213849067688, -0.6634685397148132, -0.6481156945228577, -0.6327629089355469, -0.6174100637435913, -0.6020572185516357, -0.5867043733596802, -0.5713515281677246, -0.5559987425804138, -0.5406458973884583, -0.5252930521965027, -0.5099402666091919, -0.49458742141723633, -0.47923457622528076, -0.4638817310333252, -0.448528915643692, -0.43317607045173645, -0.4178232252597809, -0.4024704098701477, -0.38711756467819214, -0.37176474928855896, -0.3564119040966034, -0.3410590887069702, -0.32570624351501465, -0.3103533983230591, -0.2950005531311035, -0.27964773774147034, -0.26429489254951477, -0.2489420771598816, -0.23358923196792603, -0.21823640167713165, -0.20288357138633728, -0.1875307261943817, -0.17217789590358734, -0.15682506561279297, -0.1414722204208374, -0.12611940503120422, -0.11076656728982925, -0.09541372954845428, -0.08006089925765991, -0.06470806896686554, -0.04935523867607117, -0.034002404659986496, -0.018649570643901825, -0.0032967403531074524, 0.01205608993768692, 0.02740892767906189, 0.04276175796985626, 0.058114588260650635, 0.07346741855144501, 0.08882024884223938, 0.10417308658361435, 0.11952591687440872, 0.1348787546157837, 0.15023158490657806, 0.16558441519737244, 0.1809372454881668, 0.19629007577896118, 0.21164290606975555, 0.22699573636054993, 0.2423485815525055, 0.25770139694213867, 0.27305424213409424, 0.2884070873260498, 0.303759902715683]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 9.0, 10.0, 4.0, 15.0, 14.0, 14.0, 15.0, 16.0, 21.0, 28.0, 29.0, 34.0, 20.0, 27.0, 36.0, 26.0, 41.0, 30.0, 44.0, 36.0, 31.0, 34.0, 33.0, 33.0, 32.0, 27.0, 33.0, 26.0, 38.0, 35.0, 27.0, 22.0, 18.0, 15.0, 20.0, 16.0, 6.0, 5.0, 11.0, 6.0, 7.0, 5.0, 7.0, 7.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.06626802682876587, -0.06419019401073456, -0.06211236119270325, -0.060034532099962234, -0.05795669928193092, -0.05587886646389961, -0.0538010373711586, -0.05172320455312729, -0.04964537173509598, -0.04756753891706467, -0.045489706099033356, -0.04341187700629234, -0.04133404418826103, -0.03925621137022972, -0.03717838227748871, -0.0351005494594574, -0.033022716641426086, -0.030944883823394775, -0.028867052868008614, -0.026789221912622452, -0.02471138909459114, -0.02263355627655983, -0.020555725321173668, -0.018477894365787506, -0.016400061547756195, -0.014322229661047459, -0.012244397774338722, -0.010166565887629986, -0.00808873400092125, -0.006010902114212513, -0.0039330702275037766, -0.0018552383407950401, 0.0002225935459136963, 0.0023004254326224327, 0.004378257319331169, 0.0064560892060399055, 0.008533921092748642, 0.010611752979457378, 0.012689584866166115, 0.014767416752874851, 0.016845248639583588, 0.0189230814576149, 0.02100091241300106, 0.023078743368387222, 0.025156576186418533, 0.027234409004449844, 0.029312239959836006, 0.03139007091522217, 0.03346790373325348, 0.03554573655128479, 0.0376235693693161, 0.039701398462057114, 0.041779231280088425, 0.043857064098119736, 0.04593489319086075, 0.04801272600889206, 0.05009055882692337, 0.05216839164495468, 0.05424622446298599, 0.056324053555727005, 0.058401886373758316, 0.06047971919178963, 0.06255754828453064, 0.06463538110256195, 0.06671321392059326]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 7.0, 6.0, 21.0, 18.0, 14.0, 20.0, 33.0, 20.0, 34.0, 47.0, 24.0, 35.0, 44.0, 36.0, 41.0, 52.0, 46.0, 52.0, 50.0, 48.0, 47.0, 44.0, 38.0, 24.0, 27.0, 24.0, 23.0, 19.0, 14.0, 17.0, 10.0, 17.0, 10.0, 13.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.673828125, -3.570831298828125, -3.46783447265625, -3.364837646484375, -3.2618408203125, -3.158843994140625, -3.05584716796875, -2.952850341796875, -2.849853515625, -2.746856689453125, -2.64385986328125, -2.540863037109375, -2.4378662109375, -2.334869384765625, -2.23187255859375, -2.128875732421875, -2.02587890625, -1.922882080078125, -1.81988525390625, -1.716888427734375, -1.6138916015625, -1.510894775390625, -1.40789794921875, -1.304901123046875, -1.201904296875, -1.098907470703125, -0.99591064453125, -0.892913818359375, -0.7899169921875, -0.686920166015625, -0.58392333984375, -0.480926513671875, -0.3779296875, -0.274932861328125, -0.17193603515625, -0.068939208984375, 0.0340576171875, 0.137054443359375, 0.24005126953125, 0.343048095703125, 0.446044921875, 0.549041748046875, 0.65203857421875, 0.755035400390625, 0.8580322265625, 0.961029052734375, 1.06402587890625, 1.167022705078125, 1.27001953125, 1.373016357421875, 1.47601318359375, 1.579010009765625, 1.6820068359375, 1.785003662109375, 1.88800048828125, 1.990997314453125, 2.093994140625, 2.196990966796875, 2.29998779296875, 2.402984619140625, 2.5059814453125, 2.608978271484375, 2.71197509765625, 2.814971923828125, 2.91796875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 9.0, 10.0, 11.0, 10.0, 24.0, 25.0, 54.0, 89.0, 111.0, 216.0, 315.0, 531.0, 876.0, 1545.0, 2671.0, 4643.0, 8005.0, 13645.0, 24284.0, 42087.0, 75491.0, 139345.0, 234774.0, 218874.0, 124403.0, 67333.0, 37939.0, 21533.0, 12475.0, 7269.0, 4079.0, 2384.0, 1390.0, 783.0, 489.0, 292.0, 196.0, 96.0, 85.0, 47.0, 32.0, 18.0, 17.0, 11.0, 15.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.306640625, -2.234344482421875, -2.16204833984375, -2.089752197265625, -2.0174560546875, -1.945159912109375, -1.87286376953125, -1.800567626953125, -1.728271484375, -1.655975341796875, -1.58367919921875, -1.511383056640625, -1.4390869140625, -1.366790771484375, -1.29449462890625, -1.222198486328125, -1.14990234375, -1.077606201171875, -1.00531005859375, -0.933013916015625, -0.8607177734375, -0.788421630859375, -0.71612548828125, -0.643829345703125, -0.571533203125, -0.499237060546875, -0.42694091796875, -0.354644775390625, -0.2823486328125, -0.210052490234375, -0.13775634765625, -0.065460205078125, 0.0068359375, 0.079132080078125, 0.15142822265625, 0.223724365234375, 0.2960205078125, 0.368316650390625, 0.44061279296875, 0.512908935546875, 0.585205078125, 0.657501220703125, 0.72979736328125, 0.802093505859375, 0.8743896484375, 0.946685791015625, 1.01898193359375, 1.091278076171875, 1.16357421875, 1.235870361328125, 1.30816650390625, 1.380462646484375, 1.4527587890625, 1.525054931640625, 1.59735107421875, 1.669647216796875, 1.741943359375, 1.814239501953125, 1.88653564453125, 1.958831787109375, 2.0311279296875, 2.103424072265625, 2.17572021484375, 2.248016357421875, 2.3203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 9.0, 9.0, 13.0, 8.0, 16.0, 16.0, 20.0, 26.0, 29.0, 39.0, 45.0, 42.0, 54.0, 62.0, 101.0, 181.0, 1434.0, 339.0, 130.0, 72.0, 61.0, 46.0, 37.0, 41.0, 26.0, 33.0, 27.0, 17.0, 20.0, 21.0, 18.0, 10.0, 10.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.5859375, -11.23291015625, -10.8798828125, -10.52685546875, -10.173828125, -9.82080078125, -9.4677734375, -9.11474609375, -8.76171875, -8.40869140625, -8.0556640625, -7.70263671875, -7.349609375, -6.99658203125, -6.6435546875, -6.29052734375, -5.9375, -5.58447265625, -5.2314453125, -4.87841796875, -4.525390625, -4.17236328125, -3.8193359375, -3.46630859375, -3.11328125, -2.76025390625, -2.4072265625, -2.05419921875, -1.701171875, -1.34814453125, -0.9951171875, -0.64208984375, -0.2890625, 0.06396484375, 0.4169921875, 0.77001953125, 1.123046875, 1.47607421875, 1.8291015625, 2.18212890625, 2.53515625, 2.88818359375, 3.2412109375, 3.59423828125, 3.947265625, 4.30029296875, 4.6533203125, 5.00634765625, 5.359375, 5.71240234375, 6.0654296875, 6.41845703125, 6.771484375, 7.12451171875, 7.4775390625, 7.83056640625, 8.18359375, 8.53662109375, 8.8896484375, 9.24267578125, 9.595703125, 9.94873046875, 10.3017578125, 10.65478515625, 11.0078125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 1.0, 7.0, 5.0, 14.0, 13.0, 19.0, 26.0, 27.0, 39.0, 48.0, 41.0, 101.0, 153.0, 252.0, 515.0, 1498.0, 7167.0, 83125.0, 2416929.0, 605558.0, 25061.0, 3244.0, 842.0, 390.0, 194.0, 124.0, 84.0, 48.0, 39.0, 28.0, 24.0, 14.0, 13.0, 13.0, 12.0, 6.0, 2.0, 7.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.328125, -13.8773193359375, -13.426513671875, -12.9757080078125, -12.52490234375, -12.0740966796875, -11.623291015625, -11.1724853515625, -10.7216796875, -10.2708740234375, -9.820068359375, -9.3692626953125, -8.91845703125, -8.4676513671875, -8.016845703125, -7.5660400390625, -7.115234375, -6.6644287109375, -6.213623046875, -5.7628173828125, -5.31201171875, -4.8612060546875, -4.410400390625, -3.9595947265625, -3.5087890625, -3.0579833984375, -2.607177734375, -2.1563720703125, -1.70556640625, -1.2547607421875, -0.803955078125, -0.3531494140625, 0.09765625, 0.5484619140625, 0.999267578125, 1.4500732421875, 1.90087890625, 2.3516845703125, 2.802490234375, 3.2532958984375, 3.7041015625, 4.1549072265625, 4.605712890625, 5.0565185546875, 5.50732421875, 5.9581298828125, 6.408935546875, 6.8597412109375, 7.310546875, 7.7613525390625, 8.212158203125, 8.6629638671875, 9.11376953125, 9.5645751953125, 10.015380859375, 10.4661865234375, 10.9169921875, 11.3677978515625, 11.818603515625, 12.2694091796875, 12.72021484375, 13.1710205078125, 13.621826171875, 14.0726318359375, 14.5234375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 84.0, 879.0, 53.0], "bins": [-413.71990966796875, -407.0920715332031, -400.4642333984375, -393.83636474609375, -387.2085266113281, -380.5806884765625, -373.9528503417969, -367.32501220703125, -360.6971740722656, -354.0693359375, -347.4414978027344, -340.81365966796875, -334.185791015625, -327.5579528808594, -320.93011474609375, -314.3022766113281, -307.6744079589844, -301.04656982421875, -294.4187316894531, -287.7908935546875, -281.16302490234375, -274.5351867675781, -267.9073486328125, -261.2795104980469, -254.65167236328125, -248.02383422851562, -241.39598083496094, -234.7681427001953, -228.1403045654297, -221.512451171875, -214.88461303710938, -208.25677490234375, -201.62892150878906, -195.00108337402344, -188.37322998046875, -181.74539184570312, -175.1175537109375, -168.4897003173828, -161.8618621826172, -155.2340087890625, -148.60618591308594, -141.9783477783203, -135.35049438476562, -128.72265625, -122.09481048583984, -115.46696472167969, -108.83912658691406, -102.2112808227539, -95.58343505859375, -88.9555892944336, -82.32775115966797, -75.69990539550781, -69.07205963134766, -62.444217681884766, -55.816375732421875, -49.18852996826172, -42.56068420410156, -35.93284225463867, -29.304996490478516, -22.677154541015625, -16.0493106842041, -9.421466827392578, -2.7936248779296875, 3.8342208862304688, 10.462060928344727]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 14.0, 9.0, 14.0, 16.0, 15.0, 16.0, 21.0, 26.0, 32.0, 32.0, 28.0, 37.0, 36.0, 34.0, 37.0, 38.0, 51.0, 37.0, 45.0, 50.0, 41.0, 46.0, 32.0, 36.0, 31.0, 34.0, 28.0, 22.0, 20.0, 19.0, 13.0, 5.0, 14.0, 8.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.5050048828125, -33.35088348388672, -32.19676208496094, -31.042638778686523, -29.88851547241211, -28.734394073486328, -27.580272674560547, -26.426151275634766, -25.27202796936035, -24.11790657043457, -22.963783264160156, -21.809661865234375, -20.655540466308594, -19.50141716003418, -18.3472957611084, -17.193172454833984, -16.039051055908203, -14.884928703308105, -13.730806350708008, -12.576684951782227, -11.422562599182129, -10.268440246582031, -9.11431884765625, -7.960196495056152, -6.806074142456055, -5.651951789855957, -4.497829914093018, -3.343707799911499, -2.1895856857299805, -1.0354633331298828, 0.11865854263305664, 1.272780418395996, 2.4269065856933594, 3.581028699874878, 4.7351508140563965, 5.889272689819336, 7.043395042419434, 8.197517395019531, 9.351638793945312, 10.50576114654541, 11.659883499145508, 12.814005851745605, 13.968128204345703, 15.122249603271484, 16.276371002197266, 17.43049430847168, 18.58461570739746, 19.738739013671875, 20.892860412597656, 22.046981811523438, 23.20110511779785, 24.355226516723633, 25.509349822998047, 26.663471221923828, 27.81759262084961, 28.97171401977539, 30.125837326049805, 31.279958724975586, 32.43408203125, 33.58820343017578, 34.74232482910156, 35.896446228027344, 37.05057144165039, 38.20469284057617, 39.35881423950195]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 7.0, 7.0, 17.0, 12.0, 17.0, 24.0, 26.0, 34.0, 30.0, 32.0, 39.0, 47.0, 39.0, 49.0, 43.0, 46.0, 38.0, 48.0, 44.0, 47.0, 39.0, 35.0, 42.0, 38.0, 26.0, 22.0, 23.0, 18.0, 18.0, 15.0, 12.0, 8.0, 7.0, 8.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.478515625, -3.3743896484375, -3.270263671875, -3.1661376953125, -3.06201171875, -2.9578857421875, -2.853759765625, -2.7496337890625, -2.6455078125, -2.5413818359375, -2.437255859375, -2.3331298828125, -2.22900390625, -2.1248779296875, -2.020751953125, -1.9166259765625, -1.8125, -1.7083740234375, -1.604248046875, -1.5001220703125, -1.39599609375, -1.2918701171875, -1.187744140625, -1.0836181640625, -0.9794921875, -0.8753662109375, -0.771240234375, -0.6671142578125, -0.56298828125, -0.4588623046875, -0.354736328125, -0.2506103515625, -0.146484375, -0.0423583984375, 0.061767578125, 0.1658935546875, 0.27001953125, 0.3741455078125, 0.478271484375, 0.5823974609375, 0.6865234375, 0.7906494140625, 0.894775390625, 0.9989013671875, 1.10302734375, 1.2071533203125, 1.311279296875, 1.4154052734375, 1.51953125, 1.6236572265625, 1.727783203125, 1.8319091796875, 1.93603515625, 2.0401611328125, 2.144287109375, 2.2484130859375, 2.3525390625, 2.4566650390625, 2.560791015625, 2.6649169921875, 2.76904296875, 2.8731689453125, 2.977294921875, 3.0814208984375, 3.185546875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 11.0, 14.0, 21.0, 44.0, 48.0, 68.0, 86.0, 177.0, 289.0, 631.0, 1322.0, 3443.0, 10488.0, 38035.0, 174418.0, 1068277.0, 2316085.0, 462734.0, 86510.0, 21114.0, 6220.0, 2249.0, 950.0, 444.0, 234.0, 137.0, 62.0, 47.0, 30.0, 24.0, 14.0, 12.0, 9.0, 7.0, 3.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.0234375, -10.7427978515625, -10.462158203125, -10.1815185546875, -9.90087890625, -9.6202392578125, -9.339599609375, -9.0589599609375, -8.7783203125, -8.4976806640625, -8.217041015625, -7.9364013671875, -7.65576171875, -7.3751220703125, -7.094482421875, -6.8138427734375, -6.533203125, -6.2525634765625, -5.971923828125, -5.6912841796875, -5.41064453125, -5.1300048828125, -4.849365234375, -4.5687255859375, -4.2880859375, -4.0074462890625, -3.726806640625, -3.4461669921875, -3.16552734375, -2.8848876953125, -2.604248046875, -2.3236083984375, -2.04296875, -1.7623291015625, -1.481689453125, -1.2010498046875, -0.92041015625, -0.6397705078125, -0.359130859375, -0.0784912109375, 0.2021484375, 0.4827880859375, 0.763427734375, 1.0440673828125, 1.32470703125, 1.6053466796875, 1.885986328125, 2.1666259765625, 2.447265625, 2.7279052734375, 3.008544921875, 3.2891845703125, 3.56982421875, 3.8504638671875, 4.131103515625, 4.4117431640625, 4.6923828125, 4.9730224609375, 5.253662109375, 5.5343017578125, 5.81494140625, 6.0955810546875, 6.376220703125, 6.6568603515625, 6.9375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 7.0, 20.0, 18.0, 36.0, 21.0, 41.0, 63.0, 70.0, 126.0, 177.0, 178.0, 268.0, 312.0, 393.0, 439.0, 431.0, 323.0, 235.0, 230.0, 180.0, 131.0, 96.0, 60.0, 57.0, 34.0, 28.0, 15.0, 18.0, 11.0, 11.0, 3.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.09722900390625, -8.8350830078125, -8.57293701171875, -8.310791015625, -8.04864501953125, -7.7864990234375, -7.52435302734375, -7.26220703125, -7.00006103515625, -6.7379150390625, -6.47576904296875, -6.213623046875, -5.95147705078125, -5.6893310546875, -5.42718505859375, -5.1650390625, -4.90289306640625, -4.6407470703125, -4.37860107421875, -4.116455078125, -3.85430908203125, -3.5921630859375, -3.33001708984375, -3.06787109375, -2.80572509765625, -2.5435791015625, -2.28143310546875, -2.019287109375, -1.75714111328125, -1.4949951171875, -1.23284912109375, -0.970703125, -0.70855712890625, -0.4464111328125, -0.18426513671875, 0.077880859375, 0.34002685546875, 0.6021728515625, 0.86431884765625, 1.12646484375, 1.38861083984375, 1.6507568359375, 1.91290283203125, 2.175048828125, 2.43719482421875, 2.6993408203125, 2.96148681640625, 3.2236328125, 3.48577880859375, 3.7479248046875, 4.01007080078125, 4.272216796875, 4.53436279296875, 4.7965087890625, 5.05865478515625, 5.32080078125, 5.58294677734375, 5.8450927734375, 6.10723876953125, 6.369384765625, 6.63153076171875, 6.8936767578125, 7.15582275390625, 7.41796875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 10.0, 13.0, 27.0, 26.0, 39.0, 67.0, 86.0, 125.0, 195.0, 321.0, 536.0, 929.0, 1863.0, 4380.0, 11009.0, 32649.0, 108469.0, 378541.0, 1271107.0, 1630803.0, 531246.0, 151622.0, 45080.0, 14654.0, 5367.0, 2371.0, 1136.0, 657.0, 336.0, 205.0, 130.0, 92.0, 56.0, 34.0, 31.0, 23.0, 18.0, 14.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.1328125, -9.807373046875, -9.48193359375, -9.156494140625, -8.8310546875, -8.505615234375, -8.18017578125, -7.854736328125, -7.529296875, -7.203857421875, -6.87841796875, -6.552978515625, -6.2275390625, -5.902099609375, -5.57666015625, -5.251220703125, -4.92578125, -4.600341796875, -4.27490234375, -3.949462890625, -3.6240234375, -3.298583984375, -2.97314453125, -2.647705078125, -2.322265625, -1.996826171875, -1.67138671875, -1.345947265625, -1.0205078125, -0.695068359375, -0.36962890625, -0.044189453125, 0.28125, 0.606689453125, 0.93212890625, 1.257568359375, 1.5830078125, 1.908447265625, 2.23388671875, 2.559326171875, 2.884765625, 3.210205078125, 3.53564453125, 3.861083984375, 4.1865234375, 4.511962890625, 4.83740234375, 5.162841796875, 5.48828125, 5.813720703125, 6.13916015625, 6.464599609375, 6.7900390625, 7.115478515625, 7.44091796875, 7.766357421875, 8.091796875, 8.417236328125, 8.74267578125, 9.068115234375, 9.3935546875, 9.718994140625, 10.04443359375, 10.369873046875, 10.6953125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 40.0, 61.0, 115.0, 162.0, 187.0, 194.0, 107.0, 79.0, 30.0, 17.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.63488006591797, -50.91880416870117, -48.202728271484375, -45.486656188964844, -42.77058029174805, -40.05450439453125, -37.33843231201172, -34.62235641479492, -31.906280517578125, -29.190204620361328, -26.474130630493164, -23.758056640625, -21.041980743408203, -18.325904846191406, -15.609830856323242, -12.893756866455078, -10.177680969238281, -7.461606025695801, -4.74553108215332, -2.02945613861084, 0.6866188049316406, 3.402693748474121, 6.118768692016602, 8.834842681884766, 11.550918579101562, 14.266993522644043, 16.983068466186523, 19.699142456054688, 22.415218353271484, 25.13129425048828, 27.847368240356445, 30.56344223022461, 33.27952575683594, 35.995601654052734, 38.71167755126953, 41.42774963378906, 44.14382553100586, 46.859901428222656, 49.57597351074219, 52.292049407958984, 55.00812530517578, 57.72420120239258, 60.440277099609375, 63.156349182128906, 65.87242126464844, 68.5885009765625, 71.30457305908203, 74.02064514160156, 76.73672485351562, 79.45279693603516, 82.16887664794922, 84.88494873046875, 87.60102844238281, 90.31710052490234, 93.03317260742188, 95.74925231933594, 98.46532440185547, 101.181396484375, 103.89747619628906, 106.6135482788086, 109.32962036132812, 112.04570007324219, 114.76177215576172, 117.47784423828125, 120.19392395019531]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 8.0, 8.0, 11.0, 10.0, 14.0, 24.0, 22.0, 24.0, 31.0, 32.0, 33.0, 29.0, 48.0, 33.0, 39.0, 40.0, 34.0, 40.0, 44.0, 40.0, 41.0, 37.0, 43.0, 31.0, 48.0, 29.0, 32.0, 26.0, 33.0, 19.0, 14.0, 16.0, 12.0, 5.0, 8.0, 9.0, 11.0, 9.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.774503707885742, -27.797649383544922, -26.8207950592041, -25.84394073486328, -24.867088317871094, -23.890233993530273, -22.913379669189453, -21.936525344848633, -20.959671020507812, -19.982816696166992, -19.005962371826172, -18.029109954833984, -17.052255630493164, -16.075401306152344, -15.098546981811523, -14.121692657470703, -13.144840240478516, -12.167985916137695, -11.191132545471191, -10.214278221130371, -9.237424850463867, -8.260570526123047, -7.283716201782227, -6.3068623542785645, -5.330008506774902, -4.35315465927124, -3.376300573348999, -2.399446487426758, -1.4225926399230957, -0.4457387924194336, 0.5311155319213867, 1.5079693794250488, 2.4848251342773438, 3.461678981781006, 4.438532829284668, 5.415387153625488, 6.39224100112915, 7.3690948486328125, 8.345949172973633, 9.322803497314453, 10.299656867980957, 11.276511192321777, 12.253364562988281, 13.230218887329102, 14.207073211669922, 15.183926582336426, 16.160781860351562, 17.13763427734375, 18.11448860168457, 19.09134292602539, 20.06819725036621, 21.04505157470703, 22.02190399169922, 22.99875831604004, 23.97561264038086, 24.95246696472168, 25.9293212890625, 26.90617561340332, 27.88302993774414, 28.859882354736328, 29.83673667907715, 30.81359100341797, 31.79044532775879, 32.76729965209961, 33.7441520690918]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 11.0, 9.0, 8.0, 14.0, 19.0, 29.0, 29.0, 35.0, 36.0, 36.0, 35.0, 52.0, 53.0, 53.0, 64.0, 46.0, 41.0, 58.0, 37.0, 51.0, 39.0, 38.0, 41.0, 24.0, 35.0, 18.0, 15.0, 14.0, 18.0, 11.0, 7.0, 6.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.35546875, -4.229248046875, -4.10302734375, -3.976806640625, -3.8505859375, -3.724365234375, -3.59814453125, -3.471923828125, -3.345703125, -3.219482421875, -3.09326171875, -2.967041015625, -2.8408203125, -2.714599609375, -2.58837890625, -2.462158203125, -2.3359375, -2.209716796875, -2.08349609375, -1.957275390625, -1.8310546875, -1.704833984375, -1.57861328125, -1.452392578125, -1.326171875, -1.199951171875, -1.07373046875, -0.947509765625, -0.8212890625, -0.695068359375, -0.56884765625, -0.442626953125, -0.31640625, -0.190185546875, -0.06396484375, 0.062255859375, 0.1884765625, 0.314697265625, 0.44091796875, 0.567138671875, 0.693359375, 0.819580078125, 0.94580078125, 1.072021484375, 1.1982421875, 1.324462890625, 1.45068359375, 1.576904296875, 1.703125, 1.829345703125, 1.95556640625, 2.081787109375, 2.2080078125, 2.334228515625, 2.46044921875, 2.586669921875, 2.712890625, 2.839111328125, 2.96533203125, 3.091552734375, 3.2177734375, 3.343994140625, 3.47021484375, 3.596435546875, 3.72265625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 19.0, 15.0, 31.0, 45.0, 79.0, 132.0, 135.0, 268.0, 459.0, 709.0, 1092.0, 1729.0, 2871.0, 4432.0, 7306.0, 11597.0, 18498.0, 28850.0, 44104.0, 65303.0, 90502.0, 115756.0, 133501.0, 132451.0, 113405.0, 90003.0, 64573.0, 43506.0, 28725.0, 18026.0, 11410.0, 7137.0, 4351.0, 2829.0, 1765.0, 1109.0, 662.0, 428.0, 278.0, 180.0, 102.0, 70.0, 40.0, 22.0, 21.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.626953125, -0.6060409545898438, -0.5851287841796875, -0.5642166137695312, -0.543304443359375, -0.5223922729492188, -0.5014801025390625, -0.48056793212890625, -0.45965576171875, -0.43874359130859375, -0.4178314208984375, -0.39691925048828125, -0.376007080078125, -0.35509490966796875, -0.3341827392578125, -0.31327056884765625, -0.2923583984375, -0.27144622802734375, -0.2505340576171875, -0.22962188720703125, -0.208709716796875, -0.18779754638671875, -0.1668853759765625, -0.14597320556640625, -0.12506103515625, -0.10414886474609375, -0.0832366943359375, -0.06232452392578125, -0.041412353515625, -0.02050018310546875, 0.0004119873046875, 0.02132415771484375, 0.042236328125, 0.06314849853515625, 0.0840606689453125, 0.10497283935546875, 0.125885009765625, 0.14679718017578125, 0.1677093505859375, 0.18862152099609375, 0.20953369140625, 0.23044586181640625, 0.2513580322265625, 0.27227020263671875, 0.293182373046875, 0.31409454345703125, 0.3350067138671875, 0.35591888427734375, 0.3768310546875, 0.39774322509765625, 0.4186553955078125, 0.43956756591796875, 0.460479736328125, 0.48139190673828125, 0.5023040771484375, 0.5232162475585938, 0.54412841796875, 0.5650405883789062, 0.5859527587890625, 0.6068649291992188, 0.627777099609375, 0.6486892700195312, 0.6696014404296875, 0.6905136108398438, 0.71142578125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 5.0, 6.0, 3.0, 18.0, 8.0, 14.0, 8.0, 17.0, 17.0, 21.0, 31.0, 23.0, 31.0, 25.0, 33.0, 25.0, 26.0, 41.0, 43.0, 40.0, 47.0, 1059.0, 37.0, 52.0, 37.0, 35.0, 44.0, 37.0, 35.0, 22.0, 20.0, 16.0, 23.0, 25.0, 20.0, 14.0, 9.0, 4.0, 10.0, 7.0, 9.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5390625, -2.45782470703125, -2.3765869140625, -2.29534912109375, -2.214111328125, -2.13287353515625, -2.0516357421875, -1.97039794921875, -1.88916015625, -1.80792236328125, -1.7266845703125, -1.64544677734375, -1.564208984375, -1.48297119140625, -1.4017333984375, -1.32049560546875, -1.2392578125, -1.15802001953125, -1.0767822265625, -0.99554443359375, -0.914306640625, -0.83306884765625, -0.7518310546875, -0.67059326171875, -0.58935546875, -0.50811767578125, -0.4268798828125, -0.34564208984375, -0.264404296875, -0.18316650390625, -0.1019287109375, -0.02069091796875, 0.060546875, 0.14178466796875, 0.2230224609375, 0.30426025390625, 0.385498046875, 0.46673583984375, 0.5479736328125, 0.62921142578125, 0.71044921875, 0.79168701171875, 0.8729248046875, 0.95416259765625, 1.035400390625, 1.11663818359375, 1.1978759765625, 1.27911376953125, 1.3603515625, 1.44158935546875, 1.5228271484375, 1.60406494140625, 1.685302734375, 1.76654052734375, 1.8477783203125, 1.92901611328125, 2.01025390625, 2.09149169921875, 2.1727294921875, 2.25396728515625, 2.335205078125, 2.41644287109375, 2.4976806640625, 2.57891845703125, 2.66015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 9.0, 12.0, 8.0, 18.0, 30.0, 42.0, 69.0, 215.0, 479.0, 1144.0, 2864.0, 8870.0, 26704.0, 123117.0, 1885914.0, 31780.0, 10129.0, 3448.0, 1275.0, 496.0, 222.0, 102.0, 68.0, 29.0, 18.0, 10.0, 11.0, 7.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.61328125, -2.53179931640625, -2.4503173828125, -2.36883544921875, -2.287353515625, -2.20587158203125, -2.1243896484375, -2.04290771484375, -1.96142578125, -1.87994384765625, -1.7984619140625, -1.71697998046875, -1.635498046875, -1.55401611328125, -1.4725341796875, -1.39105224609375, -1.3095703125, -1.22808837890625, -1.1466064453125, -1.06512451171875, -0.983642578125, -0.90216064453125, -0.8206787109375, -0.73919677734375, -0.65771484375, -0.57623291015625, -0.4947509765625, -0.41326904296875, -0.331787109375, -0.25030517578125, -0.1688232421875, -0.08734130859375, -0.005859375, 0.07562255859375, 0.1571044921875, 0.23858642578125, 0.320068359375, 0.40155029296875, 0.4830322265625, 0.56451416015625, 0.64599609375, 0.72747802734375, 0.8089599609375, 0.89044189453125, 0.971923828125, 1.05340576171875, 1.1348876953125, 1.21636962890625, 1.2978515625, 1.37933349609375, 1.4608154296875, 1.54229736328125, 1.623779296875, 1.70526123046875, 1.7867431640625, 1.86822509765625, 1.94970703125, 2.03118896484375, 2.1126708984375, 2.19415283203125, 2.275634765625, 2.35711669921875, 2.4385986328125, 2.52008056640625, 2.6015625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 8.0, 8.0, 17.0, 27.0, 15.0, 21.0, 24.0, 54.0, 64.0, 66.0, 97.0, 112.0, 121.0, 83.0, 56.0, 36.0, 39.0, 26.0, 21.0, 18.0, 20.0, 5.0, 3.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06451416015625, -0.06275606155395508, -0.060997962951660156, -0.059239864349365234, -0.05748176574707031, -0.05572366714477539, -0.05396556854248047, -0.05220746994018555, -0.050449371337890625, -0.0486912727355957, -0.04693317413330078, -0.04517507553100586, -0.04341697692871094, -0.041658878326416016, -0.039900779724121094, -0.03814268112182617, -0.03638458251953125, -0.03462648391723633, -0.032868385314941406, -0.031110286712646484, -0.029352188110351562, -0.02759408950805664, -0.02583599090576172, -0.024077892303466797, -0.022319793701171875, -0.020561695098876953, -0.01880359649658203, -0.01704549789428711, -0.015287399291992188, -0.013529300689697266, -0.011771202087402344, -0.010013103485107422, -0.0082550048828125, -0.006496906280517578, -0.004738807678222656, -0.0029807090759277344, -0.0012226104736328125, 0.0005354881286621094, 0.0022935867309570312, 0.004051685333251953, 0.005809783935546875, 0.007567882537841797, 0.009325981140136719, 0.01108407974243164, 0.012842178344726562, 0.014600276947021484, 0.016358375549316406, 0.018116474151611328, 0.01987457275390625, 0.021632671356201172, 0.023390769958496094, 0.025148868560791016, 0.026906967163085938, 0.02866506576538086, 0.03042316436767578, 0.0321812629699707, 0.033939361572265625, 0.03569746017456055, 0.03745555877685547, 0.03921365737915039, 0.04097175598144531, 0.042729854583740234, 0.044487953186035156, 0.04624605178833008, 0.048004150390625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 9.0, 7.0, 16.0, 15.0, 17.0, 45.0, 56.0, 142.0, 320.0, 982.0, 2719.0, 11522.0, 507408.0, 509235.0, 11670.0, 2827.0, 933.0, 311.0, 118.0, 48.0, 25.0, 19.0, 16.0, 11.0, 8.0, 8.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.2275390625, -1.189178466796875, -1.15081787109375, -1.112457275390625, -1.0740966796875, -1.035736083984375, -0.99737548828125, -0.959014892578125, -0.920654296875, -0.882293701171875, -0.84393310546875, -0.805572509765625, -0.7672119140625, -0.728851318359375, -0.69049072265625, -0.652130126953125, -0.61376953125, -0.575408935546875, -0.53704833984375, -0.498687744140625, -0.4603271484375, -0.421966552734375, -0.38360595703125, -0.345245361328125, -0.306884765625, -0.268524169921875, -0.23016357421875, -0.191802978515625, -0.1534423828125, -0.115081787109375, -0.07672119140625, -0.038360595703125, 0.0, 0.038360595703125, 0.07672119140625, 0.115081787109375, 0.1534423828125, 0.191802978515625, 0.23016357421875, 0.268524169921875, 0.306884765625, 0.345245361328125, 0.38360595703125, 0.421966552734375, 0.4603271484375, 0.498687744140625, 0.53704833984375, 0.575408935546875, 0.61376953125, 0.652130126953125, 0.69049072265625, 0.728851318359375, 0.7672119140625, 0.805572509765625, 0.84393310546875, 0.882293701171875, 0.920654296875, 0.959014892578125, 0.99737548828125, 1.035736083984375, 1.0740966796875, 1.112457275390625, 1.15081787109375, 1.189178466796875, 1.2275390625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 3.0, 3.0, 7.0, 14.0, 12.0, 15.0, 20.0, 22.0, 25.0, 41.0, 50.0, 79.0, 100.0, 112.0, 133.0, 87.0, 74.0, 34.0, 40.0, 23.0, 23.0, 17.0, 14.0, 6.0, 7.0, 8.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.221976637840271, -0.21581198275089264, -0.2096473127603531, -0.20348265767097473, -0.19731798768043518, -0.19115333259105682, -0.18498866260051727, -0.17882400751113892, -0.17265933752059937, -0.166494682431221, -0.16033001244068146, -0.1541653573513031, -0.14800068736076355, -0.1418360322713852, -0.13567136228084564, -0.12950670719146729, -0.12334204465150833, -0.11717738211154938, -0.11101271957159042, -0.10484805703163147, -0.09868339449167252, -0.09251873195171356, -0.0863540768623352, -0.08018940687179565, -0.0740247517824173, -0.06786008924245834, -0.06169542670249939, -0.055530764162540436, -0.04936610162258148, -0.04320143908262253, -0.03703678026795387, -0.03087211772799492, -0.024707451462745667, -0.018542788922786713, -0.012378127314150333, -0.006213465705513954, -4.8803165555000305e-05, 0.0061158593744039536, 0.012280520051717758, 0.018445182591676712, 0.024609845131635666, 0.03077450767159462, 0.036939170211553574, 0.04310382902622223, 0.04926849156618118, 0.05543315410614014, 0.06159781664609909, 0.06776247918605804, 0.073927141726017, 0.08009180426597595, 0.0862564668059349, 0.09242112934589386, 0.09858579188585281, 0.10475045442581177, 0.11091510951519012, 0.11707977950572968, 0.12324443459510803, 0.1294090896844864, 0.13557375967502594, 0.1417384147644043, 0.14790308475494385, 0.1540677398443222, 0.16023240983486176, 0.1663970649242401, 0.17256173491477966]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 4.0, 6.0, 3.0, 12.0, 10.0, 15.0, 17.0, 18.0, 29.0, 26.0, 37.0, 35.0, 40.0, 36.0, 44.0, 40.0, 29.0, 49.0, 46.0, 53.0, 44.0, 43.0, 37.0, 26.0, 38.0, 40.0, 25.0, 32.0, 14.0, 23.0, 15.0, 17.0, 19.0, 14.0, 6.0, 18.0, 10.0, 11.0, 3.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05632293224334717, -0.054756246507167816, -0.053189560770988464, -0.05162287876009941, -0.05005619302392006, -0.04848950728774071, -0.046922825276851654, -0.0453561395406723, -0.04378945380449295, -0.0422227680683136, -0.04065608233213425, -0.039089400321245193, -0.03752271458506584, -0.03595602884888649, -0.034389346837997437, -0.032822661101818085, -0.03125597536563873, -0.02968928962945938, -0.02812260575592518, -0.026555921882390976, -0.024989236146211624, -0.023422550410032272, -0.02185586653649807, -0.020289182662963867, -0.018722496926784515, -0.017155811190605164, -0.015589127317070961, -0.014022442512214184, -0.012455757707357407, -0.01088907290250063, -0.009322388097643852, -0.007755703292787075, -0.006189018487930298, -0.004622333683073521, -0.0030556488782167435, -0.0014889640733599663, 7.772073149681091e-05, 0.001644405536353588, 0.0032110903412103653, 0.0047777751460671425, 0.00634445995092392, 0.007911144755780697, 0.009477829560637474, 0.011044514365494251, 0.012611199170351028, 0.014177883975207806, 0.015744568780064583, 0.017311252653598785, 0.018877938389778137, 0.02044462412595749, 0.02201130799949169, 0.023577991873025894, 0.025144677609205246, 0.026711363345384598, 0.0282780472189188, 0.029844731092453003, 0.031411416828632355, 0.03297810256481171, 0.03454478830099106, 0.03611147031188011, 0.037678156048059464, 0.039244841784238815, 0.04081152379512787, 0.04237820953130722, 0.04394489526748657]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 7.0, 10.0, 11.0, 17.0, 19.0, 20.0, 35.0, 29.0, 29.0, 52.0, 32.0, 43.0, 47.0, 61.0, 44.0, 57.0, 37.0, 51.0, 50.0, 39.0, 44.0, 42.0, 40.0, 41.0, 28.0, 27.0, 21.0, 12.0, 8.0, 12.0, 9.0, 6.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.709625244140625, -3.58526611328125, -3.460906982421875, -3.3365478515625, -3.212188720703125, -3.08782958984375, -2.963470458984375, -2.839111328125, -2.714752197265625, -2.59039306640625, -2.466033935546875, -2.3416748046875, -2.217315673828125, -2.09295654296875, -1.968597412109375, -1.84423828125, -1.719879150390625, -1.59552001953125, -1.471160888671875, -1.3468017578125, -1.222442626953125, -1.09808349609375, -0.973724365234375, -0.849365234375, -0.725006103515625, -0.60064697265625, -0.476287841796875, -0.3519287109375, -0.227569580078125, -0.10321044921875, 0.021148681640625, 0.1455078125, 0.269866943359375, 0.39422607421875, 0.518585205078125, 0.6429443359375, 0.767303466796875, 0.89166259765625, 1.016021728515625, 1.140380859375, 1.264739990234375, 1.38909912109375, 1.513458251953125, 1.6378173828125, 1.762176513671875, 1.88653564453125, 2.010894775390625, 2.13525390625, 2.259613037109375, 2.38397216796875, 2.508331298828125, 2.6326904296875, 2.757049560546875, 2.88140869140625, 3.005767822265625, 3.130126953125, 3.254486083984375, 3.37884521484375, 3.503204345703125, 3.6275634765625, 3.751922607421875, 3.87628173828125, 4.000640869140625, 4.125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 11.0, 10.0, 20.0, 30.0, 32.0, 79.0, 75.0, 147.0, 217.0, 326.0, 461.0, 727.0, 1052.0, 1613.0, 2394.0, 3515.0, 5352.0, 7727.0, 11463.0, 17571.0, 26332.0, 42901.0, 71507.0, 121494.0, 187804.0, 198884.0, 133815.0, 79552.0, 47105.0, 29025.0, 18858.0, 12486.0, 8482.0, 5717.0, 3908.0, 2603.0, 1729.0, 1139.0, 826.0, 521.0, 355.0, 209.0, 166.0, 104.0, 61.0, 44.0, 30.0, 22.0, 16.0, 13.0, 6.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-2.205078125, -2.136383056640625, -2.06768798828125, -1.998992919921875, -1.9302978515625, -1.861602783203125, -1.79290771484375, -1.724212646484375, -1.655517578125, -1.586822509765625, -1.51812744140625, -1.449432373046875, -1.3807373046875, -1.312042236328125, -1.24334716796875, -1.174652099609375, -1.10595703125, -1.037261962890625, -0.96856689453125, -0.899871826171875, -0.8311767578125, -0.762481689453125, -0.69378662109375, -0.625091552734375, -0.556396484375, -0.487701416015625, -0.41900634765625, -0.350311279296875, -0.2816162109375, -0.212921142578125, -0.14422607421875, -0.075531005859375, -0.0068359375, 0.061859130859375, 0.13055419921875, 0.199249267578125, 0.2679443359375, 0.336639404296875, 0.40533447265625, 0.474029541015625, 0.542724609375, 0.611419677734375, 0.68011474609375, 0.748809814453125, 0.8175048828125, 0.886199951171875, 0.95489501953125, 1.023590087890625, 1.09228515625, 1.160980224609375, 1.22967529296875, 1.298370361328125, 1.3670654296875, 1.435760498046875, 1.50445556640625, 1.573150634765625, 1.641845703125, 1.710540771484375, 1.77923583984375, 1.847930908203125, 1.9166259765625, 1.985321044921875, 2.05401611328125, 2.122711181640625, 2.19140625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 1.0, 4.0, 11.0, 9.0, 13.0, 20.0, 20.0, 13.0, 16.0, 20.0, 31.0, 39.0, 22.0, 35.0, 37.0, 42.0, 58.0, 90.0, 166.0, 286.0, 1364.0, 186.0, 107.0, 66.0, 67.0, 39.0, 30.0, 41.0, 17.0, 25.0, 22.0, 25.0, 23.0, 27.0, 7.0, 12.0, 7.0, 11.0, 5.0, 7.0, 5.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-12.6015625, -12.2431640625, -11.884765625, -11.5263671875, -11.16796875, -10.8095703125, -10.451171875, -10.0927734375, -9.734375, -9.3759765625, -9.017578125, -8.6591796875, -8.30078125, -7.9423828125, -7.583984375, -7.2255859375, -6.8671875, -6.5087890625, -6.150390625, -5.7919921875, -5.43359375, -5.0751953125, -4.716796875, -4.3583984375, -4.0, -3.6416015625, -3.283203125, -2.9248046875, -2.56640625, -2.2080078125, -1.849609375, -1.4912109375, -1.1328125, -0.7744140625, -0.416015625, -0.0576171875, 0.30078125, 0.6591796875, 1.017578125, 1.3759765625, 1.734375, 2.0927734375, 2.451171875, 2.8095703125, 3.16796875, 3.5263671875, 3.884765625, 4.2431640625, 4.6015625, 4.9599609375, 5.318359375, 5.6767578125, 6.03515625, 6.3935546875, 6.751953125, 7.1103515625, 7.46875, 7.8271484375, 8.185546875, 8.5439453125, 8.90234375, 9.2607421875, 9.619140625, 9.9775390625, 10.3359375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 8.0, 5.0, 6.0, 7.0, 12.0, 8.0, 17.0, 15.0, 28.0, 40.0, 28.0, 40.0, 45.0, 63.0, 115.0, 184.0, 298.0, 672.0, 2443.0, 16708.0, 271901.0, 2629171.0, 206139.0, 14141.0, 2070.0, 617.0, 303.0, 179.0, 97.0, 85.0, 58.0, 40.0, 31.0, 27.0, 17.0, 22.0, 16.0, 7.0, 14.0, 7.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.068603515625, -12.57470703125, -12.080810546875, -11.5869140625, -11.093017578125, -10.59912109375, -10.105224609375, -9.611328125, -9.117431640625, -8.62353515625, -8.129638671875, -7.6357421875, -7.141845703125, -6.64794921875, -6.154052734375, -5.66015625, -5.166259765625, -4.67236328125, -4.178466796875, -3.6845703125, -3.190673828125, -2.69677734375, -2.202880859375, -1.708984375, -1.215087890625, -0.72119140625, -0.227294921875, 0.2666015625, 0.760498046875, 1.25439453125, 1.748291015625, 2.2421875, 2.736083984375, 3.22998046875, 3.723876953125, 4.2177734375, 4.711669921875, 5.20556640625, 5.699462890625, 6.193359375, 6.687255859375, 7.18115234375, 7.675048828125, 8.1689453125, 8.662841796875, 9.15673828125, 9.650634765625, 10.14453125, 10.638427734375, 11.13232421875, 11.626220703125, 12.1201171875, 12.614013671875, 13.10791015625, 13.601806640625, 14.095703125, 14.589599609375, 15.08349609375, 15.577392578125, 16.0712890625, 16.565185546875, 17.05908203125, 17.552978515625, 18.046875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 16.0, 44.0, 138.0, 271.0, 297.0, 178.0, 54.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.505570411682129, -10.514201164245605, -8.522830963134766, -6.531461715698242, -4.5400919914245605, -2.548722267150879, -0.5573530197143555, 1.4340171813964844, 3.425386428833008, 5.4167561531066895, 7.408125877380371, 9.399495124816895, 11.390865325927734, 13.382234573364258, 15.373603820800781, 17.364974975585938, 19.356342315673828, 21.34771156311035, 23.339080810546875, 25.33045196533203, 27.321821212768555, 29.313190460205078, 31.3045597076416, 33.295928955078125, 35.28730010986328, 37.27867126464844, 39.27003860473633, 41.261409759521484, 43.252777099609375, 45.24414825439453, 47.23551940917969, 49.22688674926758, 51.218257904052734, 53.20962905883789, 55.20099639892578, 57.19236755371094, 59.18373489379883, 61.175106048583984, 63.166473388671875, 65.15784454345703, 67.14921569824219, 69.14058685302734, 71.1319580078125, 73.12332153320312, 75.11469268798828, 77.10606384277344, 79.0974349975586, 81.08880615234375, 83.08016967773438, 85.07154083251953, 87.06291198730469, 89.05427551269531, 91.04564666748047, 93.03701782226562, 95.02838897705078, 97.01976013183594, 99.0111312866211, 101.00250244140625, 102.9938735961914, 104.98523712158203, 106.97660827636719, 108.96797943115234, 110.9593505859375, 112.95072174072266, 114.94208526611328]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 3.0, 11.0, 4.0, 5.0, 10.0, 12.0, 12.0, 17.0, 14.0, 18.0, 18.0, 20.0, 23.0, 26.0, 30.0, 35.0, 32.0, 44.0, 34.0, 37.0, 35.0, 34.0, 34.0, 42.0, 48.0, 32.0, 32.0, 39.0, 32.0, 30.0, 28.0, 32.0, 27.0, 17.0, 20.0, 20.0, 13.0, 14.0, 8.0, 12.0, 5.0, 5.0, 12.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-35.90788650512695, -34.77826690673828, -33.64864730834961, -32.5190315246582, -31.38941192626953, -30.25979232788086, -29.130172729492188, -28.000553131103516, -26.870935440063477, -25.741315841674805, -24.611698150634766, -23.482078552246094, -22.352458953857422, -21.222841262817383, -20.09322166442871, -18.963603973388672, -17.833984375, -16.704364776611328, -15.574747085571289, -14.445127487182617, -13.315508842468262, -12.185890197753906, -11.056270599365234, -9.926651954650879, -8.797033309936523, -7.667414665222168, -6.537795543670654, -5.408176422119141, -4.278557777404785, -3.1489391326904297, -2.019320011138916, -0.8897008895874023, 0.23992156982421875, 1.3695404529571533, 2.499159336090088, 3.6287782192230225, 4.758397102355957, 5.8880157470703125, 7.017634868621826, 8.14725399017334, 9.276872634887695, 10.40649127960205, 11.536109924316406, 12.665729522705078, 13.795348167419434, 14.924966812133789, 16.05458641052246, 17.1842041015625, 18.313823699951172, 19.443443298339844, 20.573060989379883, 21.702680587768555, 22.832298278808594, 23.961917877197266, 25.091537475585938, 26.22115707397461, 27.35077476501465, 28.48039436340332, 29.61001205444336, 30.73963165283203, 31.869251251220703, 32.998870849609375, 34.12848663330078, 35.25810623168945, 36.387725830078125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 10.0, 13.0, 12.0, 16.0, 24.0, 25.0, 27.0, 28.0, 40.0, 40.0, 21.0, 44.0, 60.0, 54.0, 47.0, 56.0, 42.0, 45.0, 44.0, 46.0, 43.0, 41.0, 40.0, 32.0, 34.0, 17.0, 18.0, 18.0, 12.0, 8.0, 8.0, 4.0, 5.0, 6.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5, -4.3731689453125, -4.246337890625, -4.1195068359375, -3.99267578125, -3.8658447265625, -3.739013671875, -3.6121826171875, -3.4853515625, -3.3585205078125, -3.231689453125, -3.1048583984375, -2.97802734375, -2.8511962890625, -2.724365234375, -2.5975341796875, -2.470703125, -2.3438720703125, -2.217041015625, -2.0902099609375, -1.96337890625, -1.8365478515625, -1.709716796875, -1.5828857421875, -1.4560546875, -1.3292236328125, -1.202392578125, -1.0755615234375, -0.94873046875, -0.8218994140625, -0.695068359375, -0.5682373046875, -0.44140625, -0.3145751953125, -0.187744140625, -0.0609130859375, 0.06591796875, 0.1927490234375, 0.319580078125, 0.4464111328125, 0.5732421875, 0.7000732421875, 0.826904296875, 0.9537353515625, 1.08056640625, 1.2073974609375, 1.334228515625, 1.4610595703125, 1.587890625, 1.7147216796875, 1.841552734375, 1.9683837890625, 2.09521484375, 2.2220458984375, 2.348876953125, 2.4757080078125, 2.6025390625, 2.7293701171875, 2.856201171875, 2.9830322265625, 3.10986328125, 3.2366943359375, 3.363525390625, 3.4903564453125, 3.6171875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 4.0, 3.0, 5.0, 6.0, 11.0, 23.0, 41.0, 50.0, 80.0, 129.0, 226.0, 414.0, 835.0, 1959.0, 5081.0, 14612.0, 46632.0, 168950.0, 724259.0, 2043102.0, 898857.0, 205642.0, 55975.0, 17381.0, 5889.0, 2148.0, 981.0, 439.0, 218.0, 111.0, 67.0, 42.0, 23.0, 25.0, 17.0, 11.0, 12.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-8.375, -8.14599609375, -7.9169921875, -7.68798828125, -7.458984375, -7.22998046875, -7.0009765625, -6.77197265625, -6.54296875, -6.31396484375, -6.0849609375, -5.85595703125, -5.626953125, -5.39794921875, -5.1689453125, -4.93994140625, -4.7109375, -4.48193359375, -4.2529296875, -4.02392578125, -3.794921875, -3.56591796875, -3.3369140625, -3.10791015625, -2.87890625, -2.64990234375, -2.4208984375, -2.19189453125, -1.962890625, -1.73388671875, -1.5048828125, -1.27587890625, -1.046875, -0.81787109375, -0.5888671875, -0.35986328125, -0.130859375, 0.09814453125, 0.3271484375, 0.55615234375, 0.78515625, 1.01416015625, 1.2431640625, 1.47216796875, 1.701171875, 1.93017578125, 2.1591796875, 2.38818359375, 2.6171875, 2.84619140625, 3.0751953125, 3.30419921875, 3.533203125, 3.76220703125, 3.9912109375, 4.22021484375, 4.44921875, 4.67822265625, 4.9072265625, 5.13623046875, 5.365234375, 5.59423828125, 5.8232421875, 6.05224609375, 6.28125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 9.0, 14.0, 10.0, 18.0, 31.0, 25.0, 45.0, 54.0, 77.0, 86.0, 117.0, 156.0, 209.0, 243.0, 273.0, 382.0, 380.0, 366.0, 319.0, 283.0, 201.0, 168.0, 143.0, 111.0, 97.0, 65.0, 50.0, 30.0, 26.0, 15.0, 16.0, 8.0, 13.0, 6.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2421875, -6.9888916015625, -6.735595703125, -6.4822998046875, -6.22900390625, -5.9757080078125, -5.722412109375, -5.4691162109375, -5.2158203125, -4.9625244140625, -4.709228515625, -4.4559326171875, -4.20263671875, -3.9493408203125, -3.696044921875, -3.4427490234375, -3.189453125, -2.9361572265625, -2.682861328125, -2.4295654296875, -2.17626953125, -1.9229736328125, -1.669677734375, -1.4163818359375, -1.1630859375, -0.9097900390625, -0.656494140625, -0.4031982421875, -0.14990234375, 0.1033935546875, 0.356689453125, 0.6099853515625, 0.86328125, 1.1165771484375, 1.369873046875, 1.6231689453125, 1.87646484375, 2.1297607421875, 2.383056640625, 2.6363525390625, 2.8896484375, 3.1429443359375, 3.396240234375, 3.6495361328125, 3.90283203125, 4.1561279296875, 4.409423828125, 4.6627197265625, 4.916015625, 5.1693115234375, 5.422607421875, 5.6759033203125, 5.92919921875, 6.1824951171875, 6.435791015625, 6.6890869140625, 6.9423828125, 7.1956787109375, 7.448974609375, 7.7022705078125, 7.95556640625, 8.2088623046875, 8.462158203125, 8.7154541015625, 8.96875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 6.0, 9.0, 22.0, 23.0, 31.0, 45.0, 67.0, 109.0, 181.0, 294.0, 476.0, 958.0, 2118.0, 5284.0, 15262.0, 51149.0, 185298.0, 678691.0, 1816075.0, 1034812.0, 288714.0, 78830.0, 22739.0, 7445.0, 2836.0, 1271.0, 614.0, 310.0, 210.0, 123.0, 82.0, 56.0, 51.0, 22.0, 18.0, 12.0, 11.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-11.265625, -10.9310302734375, -10.596435546875, -10.2618408203125, -9.92724609375, -9.5926513671875, -9.258056640625, -8.9234619140625, -8.5888671875, -8.2542724609375, -7.919677734375, -7.5850830078125, -7.25048828125, -6.9158935546875, -6.581298828125, -6.2467041015625, -5.912109375, -5.5775146484375, -5.242919921875, -4.9083251953125, -4.57373046875, -4.2391357421875, -3.904541015625, -3.5699462890625, -3.2353515625, -2.9007568359375, -2.566162109375, -2.2315673828125, -1.89697265625, -1.5623779296875, -1.227783203125, -0.8931884765625, -0.55859375, -0.2239990234375, 0.110595703125, 0.4451904296875, 0.77978515625, 1.1143798828125, 1.448974609375, 1.7835693359375, 2.1181640625, 2.4527587890625, 2.787353515625, 3.1219482421875, 3.45654296875, 3.7911376953125, 4.125732421875, 4.4603271484375, 4.794921875, 5.1295166015625, 5.464111328125, 5.7987060546875, 6.13330078125, 6.4678955078125, 6.802490234375, 7.1370849609375, 7.4716796875, 7.8062744140625, 8.140869140625, 8.4754638671875, 8.81005859375, 9.1446533203125, 9.479248046875, 9.8138427734375, 10.1484375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 13.0, 15.0, 44.0, 69.0, 83.0, 144.0, 135.0, 161.0, 123.0, 87.0, 65.0, 39.0, 16.0, 8.0, 8.0, 0.0, 3.0], "bins": [-122.98338317871094, -120.70271301269531, -118.42205047607422, -116.1413803100586, -113.8607177734375, -111.58004760742188, -109.29937744140625, -107.01871490478516, -104.73804473876953, -102.4573745727539, -100.17671203613281, -97.89604187011719, -95.61537170410156, -93.33470916748047, -91.05403900146484, -88.77337646484375, -86.49270629882812, -84.2120361328125, -81.9313735961914, -79.65070343017578, -77.37004089355469, -75.08937072753906, -72.80870056152344, -70.52803802490234, -68.24736785888672, -65.9666976928711, -63.68603515625, -61.405364990234375, -59.124698638916016, -56.844032287597656, -54.56336212158203, -52.28269577026367, -50.00202941894531, -47.72136306762695, -45.440696716308594, -43.16002655029297, -40.87936019897461, -38.59869384765625, -36.318023681640625, -34.037357330322266, -31.75669288635254, -29.476024627685547, -27.195358276367188, -24.914691925048828, -22.634023666381836, -20.353355407714844, -18.072689056396484, -15.792021751403809, -13.511354446411133, -11.230687141418457, -8.950019836425781, -6.6693525314331055, -4.38868522644043, -2.108017921447754, 0.17264938354492188, 2.4533166885375977, 4.733983993530273, 7.014651298522949, 9.295318603515625, 11.5759859085083, 13.856653213500977, 16.13732147216797, 18.417987823486328, 20.698654174804688, 22.97932243347168]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 8.0, 4.0, 14.0, 15.0, 19.0, 12.0, 25.0, 23.0, 18.0, 21.0, 34.0, 26.0, 30.0, 30.0, 33.0, 24.0, 38.0, 43.0, 46.0, 46.0, 40.0, 36.0, 45.0, 41.0, 36.0, 30.0, 43.0, 29.0, 31.0, 16.0, 17.0, 22.0, 17.0, 8.0, 11.0, 7.0, 10.0, 8.0, 6.0, 9.0, 2.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.612579345703125, -29.65744400024414, -28.702308654785156, -27.747173309326172, -26.792037963867188, -25.836902618408203, -24.88176918029785, -23.926633834838867, -22.971498489379883, -22.0163631439209, -21.061227798461914, -20.10609245300293, -19.150959014892578, -18.195823669433594, -17.24068832397461, -16.285552978515625, -15.33041763305664, -14.375282287597656, -13.420146942138672, -12.465012550354004, -11.50987720489502, -10.554741859436035, -9.599607467651367, -8.644472122192383, -7.689336776733398, -6.734201431274414, -5.779066562652588, -4.823931694030762, -3.8687963485717773, -2.913661003112793, -1.9585261344909668, -1.0033912658691406, -0.04825782775878906, 0.9068772792816162, 1.8620123863220215, 2.8171474933624268, 3.772282600402832, 4.727417945861816, 5.682552814483643, 6.637687683105469, 7.592823028564453, 8.547958374023438, 9.503093719482422, 10.45822811126709, 11.413363456726074, 12.368498802185059, 13.323633193969727, 14.278768539428711, 15.233903884887695, 16.18903923034668, 17.144174575805664, 18.09930992126465, 19.054443359375, 20.009578704833984, 20.96471405029297, 21.919849395751953, 22.874984741210938, 23.830120086669922, 24.785255432128906, 25.74039077758789, 26.695526123046875, 27.65066146850586, 28.60579490661621, 29.560930252075195, 30.51606559753418]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 8.0, 9.0, 10.0, 16.0, 10.0, 15.0, 17.0, 20.0, 29.0, 29.0, 27.0, 40.0, 36.0, 47.0, 63.0, 64.0, 35.0, 49.0, 54.0, 42.0, 49.0, 41.0, 48.0, 39.0, 26.0, 25.0, 24.0, 30.0, 22.0, 20.0, 14.0, 11.0, 10.0, 12.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.332611083984375, -4.20428466796875, -4.075958251953125, -3.9476318359375, -3.819305419921875, -3.69097900390625, -3.562652587890625, -3.434326171875, -3.305999755859375, -3.17767333984375, -3.049346923828125, -2.9210205078125, -2.792694091796875, -2.66436767578125, -2.536041259765625, -2.40771484375, -2.279388427734375, -2.15106201171875, -2.022735595703125, -1.8944091796875, -1.766082763671875, -1.63775634765625, -1.509429931640625, -1.381103515625, -1.252777099609375, -1.12445068359375, -0.996124267578125, -0.8677978515625, -0.739471435546875, -0.61114501953125, -0.482818603515625, -0.3544921875, -0.226165771484375, -0.09783935546875, 0.030487060546875, 0.1588134765625, 0.287139892578125, 0.41546630859375, 0.543792724609375, 0.672119140625, 0.800445556640625, 0.92877197265625, 1.057098388671875, 1.1854248046875, 1.313751220703125, 1.44207763671875, 1.570404052734375, 1.69873046875, 1.827056884765625, 1.95538330078125, 2.083709716796875, 2.2120361328125, 2.340362548828125, 2.46868896484375, 2.597015380859375, 2.725341796875, 2.853668212890625, 2.98199462890625, 3.110321044921875, 3.2386474609375, 3.366973876953125, 3.49530029296875, 3.623626708984375, 3.751953125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 8.0, 17.0, 34.0, 26.0, 40.0, 66.0, 117.0, 152.0, 260.0, 369.0, 563.0, 910.0, 1479.0, 2355.0, 3785.0, 6173.0, 10528.0, 17439.0, 27290.0, 42919.0, 63941.0, 90123.0, 119069.0, 139714.0, 139291.0, 117709.0, 89342.0, 62856.0, 41802.0, 26751.0, 16914.0, 10163.0, 6303.0, 3768.0, 2345.0, 1443.0, 911.0, 535.0, 359.0, 230.0, 158.0, 88.0, 76.0, 40.0, 24.0, 17.0, 18.0, 7.0, 6.0, 9.0, 2.0, 4.0, 3.0, 2.0], "bins": [-0.8134765625, -0.7895355224609375, -0.765594482421875, -0.7416534423828125, -0.71771240234375, -0.6937713623046875, -0.669830322265625, -0.6458892822265625, -0.6219482421875, -0.5980072021484375, -0.574066162109375, -0.5501251220703125, -0.52618408203125, -0.5022430419921875, -0.478302001953125, -0.4543609619140625, -0.430419921875, -0.4064788818359375, -0.382537841796875, -0.3585968017578125, -0.33465576171875, -0.3107147216796875, -0.286773681640625, -0.2628326416015625, -0.2388916015625, -0.2149505615234375, -0.191009521484375, -0.1670684814453125, -0.14312744140625, -0.1191864013671875, -0.095245361328125, -0.0713043212890625, -0.04736328125, -0.0234222412109375, 0.000518798828125, 0.0244598388671875, 0.04840087890625, 0.0723419189453125, 0.096282958984375, 0.1202239990234375, 0.1441650390625, 0.1681060791015625, 0.192047119140625, 0.2159881591796875, 0.23992919921875, 0.2638702392578125, 0.287811279296875, 0.3117523193359375, 0.335693359375, 0.3596343994140625, 0.383575439453125, 0.4075164794921875, 0.43145751953125, 0.4553985595703125, 0.479339599609375, 0.5032806396484375, 0.5272216796875, 0.5511627197265625, 0.575103759765625, 0.5990447998046875, 0.62298583984375, 0.6469268798828125, 0.670867919921875, 0.6948089599609375, 0.71875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 2.0, 7.0, 9.0, 4.0, 11.0, 12.0, 13.0, 20.0, 11.0, 24.0, 16.0, 30.0, 28.0, 21.0, 27.0, 34.0, 37.0, 37.0, 29.0, 47.0, 37.0, 1061.0, 32.0, 41.0, 41.0, 26.0, 35.0, 38.0, 32.0, 23.0, 24.0, 24.0, 25.0, 23.0, 18.0, 28.0, 15.0, 17.0, 12.0, 8.0, 12.0, 6.0, 10.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.330078125, -2.254852294921875, -2.17962646484375, -2.104400634765625, -2.0291748046875, -1.953948974609375, -1.87872314453125, -1.803497314453125, -1.728271484375, -1.653045654296875, -1.57781982421875, -1.502593994140625, -1.4273681640625, -1.352142333984375, -1.27691650390625, -1.201690673828125, -1.12646484375, -1.051239013671875, -0.97601318359375, -0.900787353515625, -0.8255615234375, -0.750335693359375, -0.67510986328125, -0.599884033203125, -0.524658203125, -0.449432373046875, -0.37420654296875, -0.298980712890625, -0.2237548828125, -0.148529052734375, -0.07330322265625, 0.001922607421875, 0.0771484375, 0.152374267578125, 0.22760009765625, 0.302825927734375, 0.3780517578125, 0.453277587890625, 0.52850341796875, 0.603729248046875, 0.678955078125, 0.754180908203125, 0.82940673828125, 0.904632568359375, 0.9798583984375, 1.055084228515625, 1.13031005859375, 1.205535888671875, 1.28076171875, 1.355987548828125, 1.43121337890625, 1.506439208984375, 1.5816650390625, 1.656890869140625, 1.73211669921875, 1.807342529296875, 1.882568359375, 1.957794189453125, 2.03302001953125, 2.108245849609375, 2.1834716796875, 2.258697509765625, 2.33392333984375, 2.409149169921875, 2.484375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 9.0, 7.0, 11.0, 9.0, 7.0, 20.0, 27.0, 30.0, 63.0, 96.0, 193.0, 312.0, 601.0, 1116.0, 2216.0, 4585.0, 9227.0, 19461.0, 42691.0, 1886357.0, 73887.0, 29208.0, 13691.0, 6534.0, 3271.0, 1618.0, 820.0, 440.0, 240.0, 131.0, 89.0, 46.0, 35.0, 30.0, 16.0, 8.0, 16.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7978515625, -1.744598388671875, -1.69134521484375, -1.638092041015625, -1.5848388671875, -1.531585693359375, -1.47833251953125, -1.425079345703125, -1.371826171875, -1.318572998046875, -1.26531982421875, -1.212066650390625, -1.1588134765625, -1.105560302734375, -1.05230712890625, -0.999053955078125, -0.94580078125, -0.892547607421875, -0.83929443359375, -0.786041259765625, -0.7327880859375, -0.679534912109375, -0.62628173828125, -0.573028564453125, -0.519775390625, -0.466522216796875, -0.41326904296875, -0.360015869140625, -0.3067626953125, -0.253509521484375, -0.20025634765625, -0.147003173828125, -0.09375, -0.040496826171875, 0.01275634765625, 0.066009521484375, 0.1192626953125, 0.172515869140625, 0.22576904296875, 0.279022216796875, 0.332275390625, 0.385528564453125, 0.43878173828125, 0.492034912109375, 0.5452880859375, 0.598541259765625, 0.65179443359375, 0.705047607421875, 0.75830078125, 0.811553955078125, 0.86480712890625, 0.918060302734375, 0.9713134765625, 1.024566650390625, 1.07781982421875, 1.131072998046875, 1.184326171875, 1.237579345703125, 1.29083251953125, 1.344085693359375, 1.3973388671875, 1.450592041015625, 1.50384521484375, 1.557098388671875, 1.6103515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 14.0, 37.0, 115.0, 417.0, 265.0, 81.0, 19.0, 12.0, 9.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.318359375, -0.3097190856933594, -0.30107879638671875, -0.2924385070800781, -0.2837982177734375, -0.2751579284667969, -0.26651763916015625, -0.2578773498535156, -0.249237060546875, -0.24059677124023438, -0.23195648193359375, -0.22331619262695312, -0.2146759033203125, -0.20603561401367188, -0.19739532470703125, -0.18875503540039062, -0.18011474609375, -0.17147445678710938, -0.16283416748046875, -0.15419387817382812, -0.1455535888671875, -0.13691329956054688, -0.12827301025390625, -0.11963272094726562, -0.110992431640625, -0.10235214233398438, -0.09371185302734375, -0.08507156372070312, -0.0764312744140625, -0.06779098510742188, -0.05915069580078125, -0.050510406494140625, -0.0418701171875, -0.033229827880859375, -0.02458953857421875, -0.015949249267578125, -0.0073089599609375, 0.001331329345703125, 0.00997161865234375, 0.018611907958984375, 0.027252197265625, 0.035892486572265625, 0.04453277587890625, 0.053173065185546875, 0.0618133544921875, 0.07045364379882812, 0.07909393310546875, 0.08773422241210938, 0.09637451171875, 0.10501480102539062, 0.11365509033203125, 0.12229537963867188, 0.1309356689453125, 0.13957595825195312, 0.14821624755859375, 0.15685653686523438, 0.165496826171875, 0.17413711547851562, 0.18277740478515625, 0.19141769409179688, 0.2000579833984375, 0.20869827270507812, 0.21733856201171875, 0.22597885131835938, 0.234619140625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 6.0, 5.0, 8.0, 7.0, 5.0, 11.0, 12.0, 12.0, 10.0, 24.0, 55.0, 189.0, 2101.0, 64027.0, 977926.0, 3663.0, 304.0, 52.0, 37.0, 21.0, 23.0, 10.0, 4.0, 4.0, 6.0, 8.0, 2.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -3.98785400390625, -3.8350830078125, -3.68231201171875, -3.529541015625, -3.37677001953125, -3.2239990234375, -3.07122802734375, -2.91845703125, -2.76568603515625, -2.6129150390625, -2.46014404296875, -2.307373046875, -2.15460205078125, -2.0018310546875, -1.84906005859375, -1.6962890625, -1.54351806640625, -1.3907470703125, -1.23797607421875, -1.085205078125, -0.93243408203125, -0.7796630859375, -0.62689208984375, -0.47412109375, -0.32135009765625, -0.1685791015625, -0.01580810546875, 0.136962890625, 0.28973388671875, 0.4425048828125, 0.59527587890625, 0.748046875, 0.90081787109375, 1.0535888671875, 1.20635986328125, 1.359130859375, 1.51190185546875, 1.6646728515625, 1.81744384765625, 1.97021484375, 2.12298583984375, 2.2757568359375, 2.42852783203125, 2.581298828125, 2.73406982421875, 2.8868408203125, 3.03961181640625, 3.1923828125, 3.34515380859375, 3.4979248046875, 3.65069580078125, 3.803466796875, 3.95623779296875, 4.1090087890625, 4.26177978515625, 4.41455078125, 4.56732177734375, 4.7200927734375, 4.87286376953125, 5.025634765625, 5.17840576171875, 5.3311767578125, 5.48394775390625, 5.63671875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 17.0, 21.0, 57.0, 131.0, 358.0, 281.0, 76.0, 30.0, 20.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9718258380889893, -1.9352304935455322, -1.8986351490020752, -1.8620398044586182, -1.8254443407058716, -1.7888489961624146, -1.7522536516189575, -1.7156583070755005, -1.6790629625320435, -1.6424676179885864, -1.6058722734451294, -1.5692768096923828, -1.5326814651489258, -1.4960861206054688, -1.4594907760620117, -1.4228954315185547, -1.3863000869750977, -1.3497047424316406, -1.3131093978881836, -1.2765140533447266, -1.23991858959198, -1.203323245048523, -1.166727900505066, -1.1301325559616089, -1.0935370922088623, -1.0569417476654053, -1.0203464031219482, -0.9837509989738464, -0.9471556544303894, -0.9105602502822876, -0.8739649057388306, -0.8373695611953735, -0.800774097442627, -0.7641787528991699, -0.7275833487510681, -0.6909880042076111, -0.654392659664154, -0.6177972555160522, -0.5812019109725952, -0.5446065664291382, -0.5080112218856812, -0.47141584753990173, -0.4348205029964447, -0.3982251286506653, -0.36162978410720825, -0.32503440976142883, -0.2884390354156494, -0.2518436908721924, -0.21524831652641296, -0.17865295708179474, -0.1420575976371765, -0.1054622232913971, -0.06886686384677887, -0.032271504402160645, 0.004323869943618774, 0.040919214487075806, 0.07751458883285522, 0.11410994827747345, 0.15070530772209167, 0.1873006820678711, 0.22389604151248932, 0.26049140095710754, 0.29708677530288696, 0.333682119846344, 0.3702774941921234]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 6.0, 9.0, 6.0, 8.0, 8.0, 13.0, 16.0, 16.0, 18.0, 16.0, 29.0, 37.0, 27.0, 29.0, 30.0, 37.0, 32.0, 32.0, 42.0, 39.0, 33.0, 41.0, 41.0, 48.0, 31.0, 39.0, 33.0, 32.0, 31.0, 23.0, 20.0, 24.0, 31.0, 17.0, 18.0, 21.0, 7.0, 10.0, 9.0, 9.0, 6.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1584952473640442, -0.15327899158000946, -0.14806273579597473, -0.1428464949131012, -0.13763023912906647, -0.13241398334503174, -0.1271977424621582, -0.12198148667812347, -0.11676523089408875, -0.11154897511005402, -0.10633272677659988, -0.10111647844314575, -0.09590022265911102, -0.0906839668750763, -0.08546771854162216, -0.08025147020816803, -0.0750352144241333, -0.06981895864009857, -0.06460271030664444, -0.05938645824790001, -0.05417020618915558, -0.04895395413041115, -0.04373770207166672, -0.03852145001292229, -0.033305197954177856, -0.028088945895433426, -0.022872693836688995, -0.017656441777944565, -0.012440189719200134, -0.007223937660455704, -0.002007685601711273, 0.0032085664570331573, 0.008424818515777588, 0.013641070574522018, 0.01885732263326645, 0.02407357469201088, 0.02928982675075531, 0.03450607880949974, 0.03972233086824417, 0.0449385829269886, 0.05015483498573303, 0.05537108704447746, 0.06058733910322189, 0.06580358743667603, 0.07101984322071075, 0.07623609900474548, 0.08145234733819962, 0.08666859567165375, 0.09188485145568848, 0.0971011072397232, 0.10231735557317734, 0.10753360390663147, 0.1127498596906662, 0.11796611547470093, 0.12318236380815506, 0.1283986121416092, 0.13361486792564392, 0.13883112370967865, 0.14404737949371338, 0.14926362037658691, 0.15447987616062164, 0.15969613194465637, 0.1649123728275299, 0.17012862861156464, 0.17534488439559937]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 12.0, 4.0, 9.0, 11.0, 25.0, 13.0, 22.0, 34.0, 23.0, 26.0, 26.0, 41.0, 41.0, 39.0, 38.0, 56.0, 48.0, 49.0, 49.0, 49.0, 45.0, 34.0, 43.0, 40.0, 34.0, 24.0, 26.0, 21.0, 29.0, 14.0, 9.0, 13.0, 10.0, 11.0, 10.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.798828125, -3.678497314453125, -3.55816650390625, -3.437835693359375, -3.3175048828125, -3.197174072265625, -3.07684326171875, -2.956512451171875, -2.836181640625, -2.715850830078125, -2.59552001953125, -2.475189208984375, -2.3548583984375, -2.234527587890625, -2.11419677734375, -1.993865966796875, -1.87353515625, -1.753204345703125, -1.63287353515625, -1.512542724609375, -1.3922119140625, -1.271881103515625, -1.15155029296875, -1.031219482421875, -0.910888671875, -0.790557861328125, -0.67022705078125, -0.549896240234375, -0.4295654296875, -0.309234619140625, -0.18890380859375, -0.068572998046875, 0.0517578125, 0.172088623046875, 0.29241943359375, 0.412750244140625, 0.5330810546875, 0.653411865234375, 0.77374267578125, 0.894073486328125, 1.014404296875, 1.134735107421875, 1.25506591796875, 1.375396728515625, 1.4957275390625, 1.616058349609375, 1.73638916015625, 1.856719970703125, 1.97705078125, 2.097381591796875, 2.21771240234375, 2.338043212890625, 2.4583740234375, 2.578704833984375, 2.69903564453125, 2.819366455078125, 2.939697265625, 3.060028076171875, 3.18035888671875, 3.300689697265625, 3.4210205078125, 3.541351318359375, 3.66168212890625, 3.782012939453125, 3.90234375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 2.0, 7.0, 5.0, 19.0, 25.0, 34.0, 54.0, 66.0, 135.0, 251.0, 407.0, 768.0, 1253.0, 2387.0, 4152.0, 8267.0, 19480.0, 56656.0, 182972.0, 453838.0, 210924.0, 65247.0, 22410.0, 9027.0, 4433.0, 2389.0, 1406.0, 846.0, 440.0, 249.0, 148.0, 97.0, 45.0, 35.0, 20.0, 15.0, 15.0, 8.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8828125, -5.6964111328125, -5.510009765625, -5.3236083984375, -5.13720703125, -4.9508056640625, -4.764404296875, -4.5780029296875, -4.3916015625, -4.2052001953125, -4.018798828125, -3.8323974609375, -3.64599609375, -3.4595947265625, -3.273193359375, -3.0867919921875, -2.900390625, -2.7139892578125, -2.527587890625, -2.3411865234375, -2.15478515625, -1.9683837890625, -1.781982421875, -1.5955810546875, -1.4091796875, -1.2227783203125, -1.036376953125, -0.8499755859375, -0.66357421875, -0.4771728515625, -0.290771484375, -0.1043701171875, 0.08203125, 0.2684326171875, 0.454833984375, 0.6412353515625, 0.82763671875, 1.0140380859375, 1.200439453125, 1.3868408203125, 1.5732421875, 1.7596435546875, 1.946044921875, 2.1324462890625, 2.31884765625, 2.5052490234375, 2.691650390625, 2.8780517578125, 3.064453125, 3.2508544921875, 3.437255859375, 3.6236572265625, 3.81005859375, 3.9964599609375, 4.182861328125, 4.3692626953125, 4.5556640625, 4.7420654296875, 4.928466796875, 5.1148681640625, 5.30126953125, 5.4876708984375, 5.674072265625, 5.8604736328125, 6.046875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 10.0, 7.0, 12.0, 11.0, 15.0, 10.0, 23.0, 21.0, 24.0, 26.0, 31.0, 37.0, 41.0, 40.0, 33.0, 53.0, 90.0, 157.0, 307.0, 1381.0, 191.0, 104.0, 58.0, 42.0, 33.0, 33.0, 45.0, 39.0, 20.0, 29.0, 18.0, 16.0, 14.0, 15.0, 5.0, 11.0, 11.0, 5.0, 4.0, 5.0, 1.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.3828125, -11.986328125, -11.58984375, -11.193359375, -10.796875, -10.400390625, -10.00390625, -9.607421875, -9.2109375, -8.814453125, -8.41796875, -8.021484375, -7.625, -7.228515625, -6.83203125, -6.435546875, -6.0390625, -5.642578125, -5.24609375, -4.849609375, -4.453125, -4.056640625, -3.66015625, -3.263671875, -2.8671875, -2.470703125, -2.07421875, -1.677734375, -1.28125, -0.884765625, -0.48828125, -0.091796875, 0.3046875, 0.701171875, 1.09765625, 1.494140625, 1.890625, 2.287109375, 2.68359375, 3.080078125, 3.4765625, 3.873046875, 4.26953125, 4.666015625, 5.0625, 5.458984375, 5.85546875, 6.251953125, 6.6484375, 7.044921875, 7.44140625, 7.837890625, 8.234375, 8.630859375, 9.02734375, 9.423828125, 9.8203125, 10.216796875, 10.61328125, 11.009765625, 11.40625, 11.802734375, 12.19921875, 12.595703125, 12.9921875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 6.0, 2.0, 7.0, 8.0, 7.0, 15.0, 24.0, 14.0, 29.0, 29.0, 61.0, 53.0, 82.0, 116.0, 203.0, 285.0, 651.0, 2115.0, 11147.0, 136324.0, 2772397.0, 203785.0, 14112.0, 2496.0, 710.0, 314.0, 177.0, 143.0, 71.0, 66.0, 60.0, 34.0, 31.0, 25.0, 25.0, 20.0, 17.0, 6.0, 4.0, 10.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 4.0], "bins": [-24.390625, -23.723388671875, -23.05615234375, -22.388916015625, -21.7216796875, -21.054443359375, -20.38720703125, -19.719970703125, -19.052734375, -18.385498046875, -17.71826171875, -17.051025390625, -16.3837890625, -15.716552734375, -15.04931640625, -14.382080078125, -13.71484375, -13.047607421875, -12.38037109375, -11.713134765625, -11.0458984375, -10.378662109375, -9.71142578125, -9.044189453125, -8.376953125, -7.709716796875, -7.04248046875, -6.375244140625, -5.7080078125, -5.040771484375, -4.37353515625, -3.706298828125, -3.0390625, -2.371826171875, -1.70458984375, -1.037353515625, -0.3701171875, 0.297119140625, 0.96435546875, 1.631591796875, 2.298828125, 2.966064453125, 3.63330078125, 4.300537109375, 4.9677734375, 5.635009765625, 6.30224609375, 6.969482421875, 7.63671875, 8.303955078125, 8.97119140625, 9.638427734375, 10.3056640625, 10.972900390625, 11.64013671875, 12.307373046875, 12.974609375, 13.641845703125, 14.30908203125, 14.976318359375, 15.6435546875, 16.310791015625, 16.97802734375, 17.645263671875, 18.3125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 26.0, 179.0, 465.0, 296.0, 43.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.41252136230469, -47.642520904541016, -43.87251663208008, -40.102516174316406, -36.332515716552734, -32.56251525878906, -28.792510986328125, -25.022510528564453, -21.25250816345215, -17.482505798339844, -13.712505340576172, -9.942502975463867, -6.172501564025879, -2.4025001525878906, 1.367502212524414, 5.137502670288086, 8.90750503540039, 12.677506446838379, 16.447507858276367, 20.217510223388672, 23.987510681152344, 27.75751304626465, 31.527515411376953, 35.297515869140625, 39.06752014160156, 42.837520599365234, 46.60752487182617, 50.377525329589844, 54.147525787353516, 57.91752624511719, 61.687530517578125, 65.45753479003906, 69.22753143310547, 72.9975357055664, 76.76753234863281, 80.53753662109375, 84.30754089355469, 88.0775375366211, 91.84754180908203, 95.61753845214844, 99.38754272460938, 103.15754699707031, 106.92754364013672, 110.69754791259766, 114.4675521850586, 118.237548828125, 122.00755310058594, 125.77755737304688, 129.5475616455078, 133.31756591796875, 137.0875701904297, 140.85757446289062, 144.6275634765625, 148.39756774902344, 152.16757202148438, 155.9375762939453, 159.7075653076172, 163.47756958007812, 167.24757385253906, 171.017578125, 174.78756713867188, 178.5575714111328, 182.32757568359375, 186.0975799560547, 189.86758422851562]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 6.0, 6.0, 15.0, 9.0, 12.0, 19.0, 16.0, 24.0, 28.0, 37.0, 46.0, 28.0, 30.0, 37.0, 43.0, 39.0, 41.0, 24.0, 44.0, 47.0, 40.0, 55.0, 42.0, 40.0, 19.0, 36.0, 39.0, 31.0, 17.0, 11.0, 23.0, 12.0, 10.0, 13.0, 15.0, 8.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-41.4267692565918, -40.08987045288086, -38.75297164916992, -37.41607666015625, -36.07917785644531, -34.742279052734375, -33.40538024902344, -32.0684814453125, -30.731584548950195, -29.394685745239258, -28.057788848876953, -26.720890045166016, -25.383991241455078, -24.047094345092773, -22.710195541381836, -21.37329864501953, -20.036399841308594, -18.699501037597656, -17.36260414123535, -16.025705337524414, -14.688807487487793, -13.351909637451172, -12.015010833740234, -10.678112983703613, -9.341215133666992, -8.004317283630371, -6.667418956756592, -5.3305206298828125, -3.9936227798461914, -2.6567249298095703, -1.3198261260986328, 0.01707172393798828, 1.3539657592773438, 2.690863847732544, 4.027761936187744, 5.364660263061523, 6.7015581130981445, 8.038455963134766, 9.375354766845703, 10.712252616882324, 12.049150466918945, 13.386048316955566, 14.722946166992188, 16.059844970703125, 17.396743774414062, 18.733640670776367, 20.070539474487305, 21.40743637084961, 22.744335174560547, 24.081233978271484, 25.41813087463379, 26.755029678344727, 28.09192657470703, 29.42882537841797, 30.765724182128906, 32.102622985839844, 33.43952178955078, 34.77642059326172, 36.113319396972656, 37.450218200683594, 38.787113189697266, 40.1240119934082, 41.46091079711914, 42.79780960083008, 44.13470458984375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 6.0, 2.0, 6.0, 13.0, 14.0, 18.0, 20.0, 13.0, 21.0, 20.0, 22.0, 26.0, 34.0, 40.0, 36.0, 26.0, 47.0, 45.0, 47.0, 37.0, 49.0, 40.0, 57.0, 41.0, 29.0, 41.0, 18.0, 28.0, 43.0, 23.0, 28.0, 22.0, 16.0, 15.0, 16.0, 8.0, 6.0, 4.0, 9.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.1015625, -3.984405517578125, -3.86724853515625, -3.750091552734375, -3.6329345703125, -3.515777587890625, -3.39862060546875, -3.281463623046875, -3.164306640625, -3.047149658203125, -2.92999267578125, -2.812835693359375, -2.6956787109375, -2.578521728515625, -2.46136474609375, -2.344207763671875, -2.22705078125, -2.109893798828125, -1.99273681640625, -1.875579833984375, -1.7584228515625, -1.641265869140625, -1.52410888671875, -1.406951904296875, -1.289794921875, -1.172637939453125, -1.05548095703125, -0.938323974609375, -0.8211669921875, -0.704010009765625, -0.58685302734375, -0.469696044921875, -0.3525390625, -0.235382080078125, -0.11822509765625, -0.001068115234375, 0.1160888671875, 0.233245849609375, 0.35040283203125, 0.467559814453125, 0.584716796875, 0.701873779296875, 0.81903076171875, 0.936187744140625, 1.0533447265625, 1.170501708984375, 1.28765869140625, 1.404815673828125, 1.52197265625, 1.639129638671875, 1.75628662109375, 1.873443603515625, 1.9906005859375, 2.107757568359375, 2.22491455078125, 2.342071533203125, 2.459228515625, 2.576385498046875, 2.69354248046875, 2.810699462890625, 2.9278564453125, 3.045013427734375, 3.16217041015625, 3.279327392578125, 3.396484375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 17.0, 9.0, 25.0, 42.0, 63.0, 66.0, 113.0, 237.0, 366.0, 574.0, 1206.0, 2327.0, 4782.0, 10786.0, 25514.0, 63721.0, 173346.0, 504976.0, 1323528.0, 1309159.0, 496961.0, 169493.0, 62604.0, 24603.0, 10492.0, 4633.0, 2172.0, 1084.0, 568.0, 312.0, 190.0, 109.0, 71.0, 43.0, 27.0, 15.0, 14.0, 10.0, 3.0, 13.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.40948486328125, -4.2330322265625, -4.05657958984375, -3.880126953125, -3.70367431640625, -3.5272216796875, -3.35076904296875, -3.17431640625, -2.99786376953125, -2.8214111328125, -2.64495849609375, -2.468505859375, -2.29205322265625, -2.1156005859375, -1.93914794921875, -1.7626953125, -1.58624267578125, -1.4097900390625, -1.23333740234375, -1.056884765625, -0.88043212890625, -0.7039794921875, -0.52752685546875, -0.35107421875, -0.17462158203125, 0.0018310546875, 0.17828369140625, 0.354736328125, 0.53118896484375, 0.7076416015625, 0.88409423828125, 1.060546875, 1.23699951171875, 1.4134521484375, 1.58990478515625, 1.766357421875, 1.94281005859375, 2.1192626953125, 2.29571533203125, 2.47216796875, 2.64862060546875, 2.8250732421875, 3.00152587890625, 3.177978515625, 3.35443115234375, 3.5308837890625, 3.70733642578125, 3.8837890625, 4.06024169921875, 4.2366943359375, 4.41314697265625, 4.589599609375, 4.76605224609375, 4.9425048828125, 5.11895751953125, 5.29541015625, 5.47186279296875, 5.6483154296875, 5.82476806640625, 6.001220703125, 6.17767333984375, 6.3541259765625, 6.53057861328125, 6.70703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 2.0, 1.0, 8.0, 8.0, 15.0, 8.0, 15.0, 25.0, 21.0, 33.0, 50.0, 67.0, 83.0, 95.0, 137.0, 182.0, 212.0, 260.0, 296.0, 337.0, 354.0, 379.0, 312.0, 264.0, 190.0, 173.0, 110.0, 102.0, 80.0, 53.0, 54.0, 39.0, 35.0, 17.0, 12.0, 10.0, 11.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5234375, -8.26824951171875, -8.0130615234375, -7.75787353515625, -7.502685546875, -7.24749755859375, -6.9923095703125, -6.73712158203125, -6.48193359375, -6.22674560546875, -5.9715576171875, -5.71636962890625, -5.461181640625, -5.20599365234375, -4.9508056640625, -4.69561767578125, -4.4404296875, -4.18524169921875, -3.9300537109375, -3.67486572265625, -3.419677734375, -3.16448974609375, -2.9093017578125, -2.65411376953125, -2.39892578125, -2.14373779296875, -1.8885498046875, -1.63336181640625, -1.378173828125, -1.12298583984375, -0.8677978515625, -0.61260986328125, -0.357421875, -0.10223388671875, 0.1529541015625, 0.40814208984375, 0.663330078125, 0.91851806640625, 1.1737060546875, 1.42889404296875, 1.68408203125, 1.93927001953125, 2.1944580078125, 2.44964599609375, 2.704833984375, 2.96002197265625, 3.2152099609375, 3.47039794921875, 3.7255859375, 3.98077392578125, 4.2359619140625, 4.49114990234375, 4.746337890625, 5.00152587890625, 5.2567138671875, 5.51190185546875, 5.76708984375, 6.02227783203125, 6.2774658203125, 6.53265380859375, 6.787841796875, 7.04302978515625, 7.2982177734375, 7.55340576171875, 7.80859375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 5.0, 12.0, 12.0, 24.0, 25.0, 45.0, 66.0, 119.0, 157.0, 314.0, 519.0, 995.0, 2029.0, 4801.0, 12879.0, 38204.0, 122439.0, 393802.0, 1166701.0, 1552224.0, 614757.0, 192663.0, 59636.0, 19277.0, 6891.0, 2755.0, 1298.0, 641.0, 384.0, 203.0, 154.0, 82.0, 62.0, 31.0, 15.0, 15.0, 11.0, 11.0, 4.0, 6.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.4017333984375, -9.100341796875, -8.7989501953125, -8.49755859375, -8.1961669921875, -7.894775390625, -7.5933837890625, -7.2919921875, -6.9906005859375, -6.689208984375, -6.3878173828125, -6.08642578125, -5.7850341796875, -5.483642578125, -5.1822509765625, -4.880859375, -4.5794677734375, -4.278076171875, -3.9766845703125, -3.67529296875, -3.3739013671875, -3.072509765625, -2.7711181640625, -2.4697265625, -2.1683349609375, -1.866943359375, -1.5655517578125, -1.26416015625, -0.9627685546875, -0.661376953125, -0.3599853515625, -0.05859375, 0.2427978515625, 0.544189453125, 0.8455810546875, 1.14697265625, 1.4483642578125, 1.749755859375, 2.0511474609375, 2.3525390625, 2.6539306640625, 2.955322265625, 3.2567138671875, 3.55810546875, 3.8594970703125, 4.160888671875, 4.4622802734375, 4.763671875, 5.0650634765625, 5.366455078125, 5.6678466796875, 5.96923828125, 6.2706298828125, 6.572021484375, 6.8734130859375, 7.1748046875, 7.4761962890625, 7.777587890625, 8.0789794921875, 8.38037109375, 8.6817626953125, 8.983154296875, 9.2845458984375, 9.5859375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 9.0, 11.0, 14.0, 18.0, 27.0, 31.0, 39.0, 45.0, 43.0, 58.0, 54.0, 67.0, 63.0, 73.0, 45.0, 63.0, 57.0, 48.0, 49.0, 27.0, 37.0, 20.0, 27.0, 13.0, 12.0, 9.0, 5.0, 12.0, 0.0, 6.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.460988998413086, -27.490966796875, -26.52094268798828, -25.550920486450195, -24.580896377563477, -23.61087417602539, -22.640850067138672, -21.670827865600586, -20.7008056640625, -19.730783462524414, -18.760759353637695, -17.79073715209961, -16.82071304321289, -15.850690841674805, -14.880667686462402, -13.91064453125, -12.940620422363281, -11.970597267150879, -11.000574111938477, -10.03055191040039, -9.060527801513672, -8.090505599975586, -7.120482444763184, -6.150459289550781, -5.180436134338379, -4.210412979125977, -3.2403900623321533, -2.27036714553833, -1.3003439903259277, -0.3303208351135254, 0.6397018432617188, 1.609724998474121, 2.5797462463378906, 3.549769401550293, 4.519792556762695, 5.4898152351379395, 6.459838390350342, 7.429861545562744, 8.399884223937988, 9.36990737915039, 10.339930534362793, 11.309953689575195, 12.279976844787598, 13.25, 14.220022201538086, 15.190046310424805, 16.16006851196289, 17.13009262084961, 18.100114822387695, 19.07013702392578, 20.0401611328125, 21.010183334350586, 21.980207443237305, 22.95022964477539, 23.92025375366211, 24.890275955200195, 25.86029815673828, 26.830320358276367, 27.800344467163086, 28.770366668701172, 29.74039077758789, 30.710412979125977, 31.680435180664062, 32.65045928955078, 33.6204833984375]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 5.0, 6.0, 8.0, 11.0, 15.0, 20.0, 23.0, 29.0, 20.0, 32.0, 36.0, 37.0, 44.0, 45.0, 42.0, 47.0, 44.0, 49.0, 57.0, 60.0, 43.0, 38.0, 46.0, 39.0, 34.0, 24.0, 26.0, 27.0, 20.0, 15.0, 11.0, 11.0, 11.0, 4.0, 6.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.42072677612305, -38.1991081237793, -36.97749328613281, -35.75587463378906, -34.53425598144531, -33.31263732910156, -32.09102249145508, -30.869403839111328, -29.64778709411621, -28.426170349121094, -27.204551696777344, -25.982934951782227, -24.76131820678711, -23.53969955444336, -22.318082809448242, -21.096466064453125, -19.874847412109375, -18.653230667114258, -17.431612014770508, -16.20999526977539, -14.988377571105957, -13.766759872436523, -12.545143127441406, -11.323525428771973, -10.101907730102539, -8.880290031433105, -7.65867280960083, -6.437055587768555, -5.215437889099121, -3.9938201904296875, -2.772202968597412, -1.5505857467651367, -0.3289642333984375, 0.892653226852417, 2.1142706871032715, 3.335888147354126, 4.5575056076049805, 5.779123306274414, 7.0007405281066895, 8.222357749938965, 9.443975448608398, 10.665593147277832, 11.887210845947266, 13.108827590942383, 14.330445289611816, 15.55206298828125, 16.773679733276367, 17.995296478271484, 19.216915130615234, 20.43853187561035, 21.6601505279541, 22.88176727294922, 24.10338592529297, 25.325002670288086, 26.546619415283203, 27.768238067626953, 28.98985481262207, 30.211471557617188, 31.433090209960938, 32.65470886230469, 33.87632369995117, 35.09794235229492, 36.31956100463867, 37.541175842285156, 38.762794494628906]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 12.0, 9.0, 7.0, 10.0, 14.0, 10.0, 19.0, 20.0, 17.0, 26.0, 20.0, 24.0, 30.0, 38.0, 33.0, 40.0, 34.0, 35.0, 42.0, 36.0, 42.0, 36.0, 53.0, 45.0, 43.0, 28.0, 29.0, 28.0, 26.0, 24.0, 23.0, 27.0, 25.0, 19.0, 10.0, 10.0, 11.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.62109375, -3.504791259765625, -3.38848876953125, -3.272186279296875, -3.1558837890625, -3.039581298828125, -2.92327880859375, -2.806976318359375, -2.690673828125, -2.574371337890625, -2.45806884765625, -2.341766357421875, -2.2254638671875, -2.109161376953125, -1.99285888671875, -1.876556396484375, -1.76025390625, -1.643951416015625, -1.52764892578125, -1.411346435546875, -1.2950439453125, -1.178741455078125, -1.06243896484375, -0.946136474609375, -0.829833984375, -0.713531494140625, -0.59722900390625, -0.480926513671875, -0.3646240234375, -0.248321533203125, -0.13201904296875, -0.015716552734375, 0.1005859375, 0.216888427734375, 0.33319091796875, 0.449493408203125, 0.5657958984375, 0.682098388671875, 0.79840087890625, 0.914703369140625, 1.031005859375, 1.147308349609375, 1.26361083984375, 1.379913330078125, 1.4962158203125, 1.612518310546875, 1.72882080078125, 1.845123291015625, 1.96142578125, 2.077728271484375, 2.19403076171875, 2.310333251953125, 2.4266357421875, 2.542938232421875, 2.65924072265625, 2.775543212890625, 2.891845703125, 3.008148193359375, 3.12445068359375, 3.240753173828125, 3.3570556640625, 3.473358154296875, 3.58966064453125, 3.705963134765625, 3.822265625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 15.0, 29.0, 42.0, 57.0, 91.0, 159.0, 199.0, 298.0, 509.0, 775.0, 1205.0, 1776.0, 2666.0, 4133.0, 6156.0, 9227.0, 14124.0, 20771.0, 30136.0, 42234.0, 58599.0, 76725.0, 95271.0, 110663.0, 117041.0, 108734.0, 92383.0, 72976.0, 55159.0, 40185.0, 28024.0, 19242.0, 13130.0, 8791.0, 5777.0, 3847.0, 2542.0, 1675.0, 1064.0, 720.0, 462.0, 278.0, 215.0, 164.0, 86.0, 84.0, 36.0, 29.0, 18.0, 11.0, 8.0, 5.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.7275390625, -0.7050933837890625, -0.682647705078125, -0.6602020263671875, -0.63775634765625, -0.6153106689453125, -0.592864990234375, -0.5704193115234375, -0.5479736328125, -0.5255279541015625, -0.503082275390625, -0.4806365966796875, -0.45819091796875, -0.4357452392578125, -0.413299560546875, -0.3908538818359375, -0.368408203125, -0.3459625244140625, -0.323516845703125, -0.3010711669921875, -0.27862548828125, -0.2561798095703125, -0.233734130859375, -0.2112884521484375, -0.1888427734375, -0.1663970947265625, -0.143951416015625, -0.1215057373046875, -0.09906005859375, -0.0766143798828125, -0.054168701171875, -0.0317230224609375, -0.00927734375, 0.0131683349609375, 0.035614013671875, 0.0580596923828125, 0.08050537109375, 0.1029510498046875, 0.125396728515625, 0.1478424072265625, 0.1702880859375, 0.1927337646484375, 0.215179443359375, 0.2376251220703125, 0.26007080078125, 0.2825164794921875, 0.304962158203125, 0.3274078369140625, 0.349853515625, 0.3722991943359375, 0.394744873046875, 0.4171905517578125, 0.43963623046875, 0.4620819091796875, 0.484527587890625, 0.5069732666015625, 0.5294189453125, 0.5518646240234375, 0.574310302734375, 0.5967559814453125, 0.61920166015625, 0.6416473388671875, 0.664093017578125, 0.6865386962890625, 0.708984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 10.0, 9.0, 16.0, 17.0, 18.0, 22.0, 25.0, 12.0, 21.0, 31.0, 37.0, 30.0, 24.0, 33.0, 42.0, 35.0, 40.0, 42.0, 1055.0, 25.0, 44.0, 29.0, 31.0, 29.0, 45.0, 30.0, 25.0, 31.0, 27.0, 29.0, 20.0, 21.0, 19.0, 12.0, 11.0, 14.0, 7.0, 5.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.849609375, -2.75872802734375, -2.6678466796875, -2.57696533203125, -2.486083984375, -2.39520263671875, -2.3043212890625, -2.21343994140625, -2.12255859375, -2.03167724609375, -1.9407958984375, -1.84991455078125, -1.759033203125, -1.66815185546875, -1.5772705078125, -1.48638916015625, -1.3955078125, -1.30462646484375, -1.2137451171875, -1.12286376953125, -1.031982421875, -0.94110107421875, -0.8502197265625, -0.75933837890625, -0.66845703125, -0.57757568359375, -0.4866943359375, -0.39581298828125, -0.304931640625, -0.21405029296875, -0.1231689453125, -0.03228759765625, 0.05859375, 0.14947509765625, 0.2403564453125, 0.33123779296875, 0.422119140625, 0.51300048828125, 0.6038818359375, 0.69476318359375, 0.78564453125, 0.87652587890625, 0.9674072265625, 1.05828857421875, 1.149169921875, 1.24005126953125, 1.3309326171875, 1.42181396484375, 1.5126953125, 1.60357666015625, 1.6944580078125, 1.78533935546875, 1.876220703125, 1.96710205078125, 2.0579833984375, 2.14886474609375, 2.23974609375, 2.33062744140625, 2.4215087890625, 2.51239013671875, 2.603271484375, 2.69415283203125, 2.7850341796875, 2.87591552734375, 2.966796875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 2.0, 5.0, 3.0, 9.0, 12.0, 4.0, 17.0, 37.0, 29.0, 64.0, 132.0, 246.0, 502.0, 1184.0, 3047.0, 7331.0, 18876.0, 52560.0, 1929178.0, 52295.0, 18905.0, 7442.0, 2914.0, 1251.0, 540.0, 222.0, 120.0, 57.0, 39.0, 23.0, 17.0, 15.0, 12.0, 9.0, 11.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.486328125, -2.40203857421875, -2.3177490234375, -2.23345947265625, -2.149169921875, -2.06488037109375, -1.9805908203125, -1.89630126953125, -1.81201171875, -1.72772216796875, -1.6434326171875, -1.55914306640625, -1.474853515625, -1.39056396484375, -1.3062744140625, -1.22198486328125, -1.1376953125, -1.05340576171875, -0.9691162109375, -0.88482666015625, -0.800537109375, -0.71624755859375, -0.6319580078125, -0.54766845703125, -0.46337890625, -0.37908935546875, -0.2947998046875, -0.21051025390625, -0.126220703125, -0.04193115234375, 0.0423583984375, 0.12664794921875, 0.2109375, 0.29522705078125, 0.3795166015625, 0.46380615234375, 0.548095703125, 0.63238525390625, 0.7166748046875, 0.80096435546875, 0.88525390625, 0.96954345703125, 1.0538330078125, 1.13812255859375, 1.222412109375, 1.30670166015625, 1.3909912109375, 1.47528076171875, 1.5595703125, 1.64385986328125, 1.7281494140625, 1.81243896484375, 1.896728515625, 1.98101806640625, 2.0653076171875, 2.14959716796875, 2.23388671875, 2.31817626953125, 2.4024658203125, 2.48675537109375, 2.571044921875, 2.65533447265625, 2.7396240234375, 2.82391357421875, 2.908203125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 22.0, 51.0, 95.0, 194.0, 239.0, 171.0, 85.0, 40.0, 22.0, 8.0, 6.0, 7.0, 10.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12152099609375, -0.11797714233398438, -0.11443328857421875, -0.11088943481445312, -0.1073455810546875, -0.10380172729492188, -0.10025787353515625, -0.09671401977539062, -0.093170166015625, -0.08962631225585938, -0.08608245849609375, -0.08253860473632812, -0.0789947509765625, -0.07545089721679688, -0.07190704345703125, -0.06836318969726562, -0.0648193359375, -0.061275482177734375, -0.05773162841796875, -0.054187774658203125, -0.0506439208984375, -0.047100067138671875, -0.04355621337890625, -0.040012359619140625, -0.036468505859375, -0.032924652099609375, -0.02938079833984375, -0.025836944580078125, -0.0222930908203125, -0.018749237060546875, -0.01520538330078125, -0.011661529541015625, -0.00811767578125, -0.004573822021484375, -0.00102996826171875, 0.002513885498046875, 0.0060577392578125, 0.009601593017578125, 0.01314544677734375, 0.016689300537109375, 0.020233154296875, 0.023777008056640625, 0.02732086181640625, 0.030864715576171875, 0.0344085693359375, 0.037952423095703125, 0.04149627685546875, 0.045040130615234375, 0.048583984375, 0.052127838134765625, 0.05567169189453125, 0.059215545654296875, 0.0627593994140625, 0.06630325317382812, 0.06984710693359375, 0.07339096069335938, 0.076934814453125, 0.08047866821289062, 0.08402252197265625, 0.08756637573242188, 0.0911102294921875, 0.09465408325195312, 0.09819793701171875, 0.10174179077148438, 0.10528564453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 9.0, 5.0, 9.0, 6.0, 15.0, 22.0, 62.0, 298.0, 2736.0, 892946.0, 149794.0, 2227.0, 294.0, 49.0, 26.0, 11.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.7393798828125, -2.644775390625, -2.5501708984375, -2.45556640625, -2.3609619140625, -2.266357421875, -2.1717529296875, -2.0771484375, -1.9825439453125, -1.887939453125, -1.7933349609375, -1.69873046875, -1.6041259765625, -1.509521484375, -1.4149169921875, -1.3203125, -1.2257080078125, -1.131103515625, -1.0364990234375, -0.94189453125, -0.8472900390625, -0.752685546875, -0.6580810546875, -0.5634765625, -0.4688720703125, -0.374267578125, -0.2796630859375, -0.18505859375, -0.0904541015625, 0.004150390625, 0.0987548828125, 0.193359375, 0.2879638671875, 0.382568359375, 0.4771728515625, 0.57177734375, 0.6663818359375, 0.760986328125, 0.8555908203125, 0.9501953125, 1.0447998046875, 1.139404296875, 1.2340087890625, 1.32861328125, 1.4232177734375, 1.517822265625, 1.6124267578125, 1.70703125, 1.8016357421875, 1.896240234375, 1.9908447265625, 2.08544921875, 2.1800537109375, 2.274658203125, 2.3692626953125, 2.4638671875, 2.5584716796875, 2.653076171875, 2.7476806640625, 2.84228515625, 2.9368896484375, 3.031494140625, 3.1260986328125, 3.220703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 11.0, 8.0, 14.0, 14.0, 12.0, 27.0, 37.0, 49.0, 111.0, 155.0, 174.0, 132.0, 96.0, 58.0, 39.0, 14.0, 14.0, 9.0, 5.0, 9.0, 9.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610490083694458, -0.15449491143226624, -0.14794082939624786, -0.1413867324590683, -0.13483263552188873, -0.12827855348587036, -0.1217244565486908, -0.11517036706209183, -0.10861627757549286, -0.10206218808889389, -0.09550809115171432, -0.08895400166511536, -0.08239991217851639, -0.07584582269191742, -0.06929172575473785, -0.06273763626813889, -0.05618353933095932, -0.04962944611907005, -0.043075356632471085, -0.03652126342058182, -0.0299671720713377, -0.023413080722093582, -0.016858987510204315, -0.010304898023605347, -0.0037508048117160797, 0.0028032870031893253, 0.00935737881809473, 0.015911471098661423, 0.02246556244790554, 0.029019653797149658, 0.035573747009038925, 0.042127836495637894, 0.04868192970752716, 0.05523602291941643, 0.061790112406015396, 0.06834420561790466, 0.07489829510450363, 0.0814523845911026, 0.08800648152828217, 0.09456057101488113, 0.1011146605014801, 0.10766874998807907, 0.11422284692525864, 0.1207769364118576, 0.12733103334903717, 0.13388511538505554, 0.1404392123222351, 0.14699330925941467, 0.15354740619659424, 0.1601015031337738, 0.16665558516979218, 0.17320968210697174, 0.1797637790441513, 0.18631786108016968, 0.19287195801734924, 0.1994260549545288, 0.20598013699054718, 0.21253423392772675, 0.21908831596374512, 0.22564241290092468, 0.23219650983810425, 0.23875059187412262, 0.24530468881130219, 0.25185877084732056, 0.2584128677845001]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 6.0, 14.0, 5.0, 17.0, 18.0, 18.0, 18.0, 22.0, 27.0, 24.0, 33.0, 35.0, 44.0, 37.0, 30.0, 44.0, 42.0, 39.0, 35.0, 40.0, 38.0, 43.0, 33.0, 37.0, 35.0, 31.0, 34.0, 33.0, 31.0, 20.0, 14.0, 10.0, 14.0, 9.0, 9.0, 16.0, 8.0, 6.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06505948305130005, -0.06303659081459045, -0.06101370230317116, -0.05899081379175186, -0.05696792155504227, -0.05494502931833267, -0.052922140806913376, -0.05089925229549408, -0.048876360058784485, -0.04685346782207489, -0.044830579310655594, -0.0428076907992363, -0.0407847985625267, -0.03876190632581711, -0.03673901781439781, -0.034716129302978516, -0.03269323706626892, -0.030670346692204475, -0.02864745631814003, -0.026624565944075584, -0.02460167557001114, -0.022578785195946693, -0.020555894821882248, -0.018533004447817802, -0.016510114073753357, -0.014487223699688911, -0.012464333325624466, -0.01044144295156002, -0.008418552577495575, -0.0063956622034311295, -0.004372771829366684, -0.0023498814553022385, -0.00032699108123779297, 0.0016958992928266525, 0.003718789666891098, 0.0057416800409555435, 0.007764570415019989, 0.009787460789084435, 0.01181035116314888, 0.013833241537213326, 0.01585613191127777, 0.017879022285342216, 0.019901912659406662, 0.021924803033471107, 0.023947693407535553, 0.0259705837816, 0.027993474155664444, 0.03001636452972889, 0.032039254903793335, 0.03406214714050293, 0.036085035651922226, 0.03810792416334152, 0.04013081640005112, 0.04215370863676071, 0.04417659714818001, 0.046199485659599304, 0.0482223778963089, 0.050245270133018494, 0.05226815864443779, 0.054291047155857086, 0.05631393939256668, 0.058336831629276276, 0.06035972014069557, 0.06238260865211487, 0.06440550088882446]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 7.0, 13.0, 11.0, 16.0, 12.0, 17.0, 14.0, 15.0, 25.0, 23.0, 25.0, 36.0, 36.0, 36.0, 43.0, 30.0, 30.0, 36.0, 37.0, 36.0, 44.0, 30.0, 40.0, 39.0, 43.0, 30.0, 26.0, 34.0, 29.0, 25.0, 16.0, 19.0, 25.0, 15.0, 18.0, 10.0, 6.0, 6.0, 10.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.20703125, -3.09405517578125, -2.9810791015625, -2.86810302734375, -2.755126953125, -2.64215087890625, -2.5291748046875, -2.41619873046875, -2.30322265625, -2.19024658203125, -2.0772705078125, -1.96429443359375, -1.851318359375, -1.73834228515625, -1.6253662109375, -1.51239013671875, -1.3994140625, -1.28643798828125, -1.1734619140625, -1.06048583984375, -0.947509765625, -0.83453369140625, -0.7215576171875, -0.60858154296875, -0.49560546875, -0.38262939453125, -0.2696533203125, -0.15667724609375, -0.043701171875, 0.06927490234375, 0.1822509765625, 0.29522705078125, 0.408203125, 0.52117919921875, 0.6341552734375, 0.74713134765625, 0.860107421875, 0.97308349609375, 1.0860595703125, 1.19903564453125, 1.31201171875, 1.42498779296875, 1.5379638671875, 1.65093994140625, 1.763916015625, 1.87689208984375, 1.9898681640625, 2.10284423828125, 2.2158203125, 2.32879638671875, 2.4417724609375, 2.55474853515625, 2.667724609375, 2.78070068359375, 2.8936767578125, 3.00665283203125, 3.11962890625, 3.23260498046875, 3.3455810546875, 3.45855712890625, 3.571533203125, 3.68450927734375, 3.7974853515625, 3.91046142578125, 4.0234375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 8.0, 6.0, 12.0, 12.0, 30.0, 40.0, 64.0, 100.0, 146.0, 213.0, 327.0, 577.0, 925.0, 1463.0, 2379.0, 3902.0, 6339.0, 10498.0, 17679.0, 32305.0, 71460.0, 184432.0, 336004.0, 213557.0, 81807.0, 35649.0, 19137.0, 11584.0, 6860.0, 4284.0, 2571.0, 1634.0, 974.0, 582.0, 347.0, 221.0, 143.0, 86.0, 70.0, 35.0, 32.0, 24.0, 12.0, 12.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.232666015625, -4.09423828125, -3.955810546875, -3.8173828125, -3.678955078125, -3.54052734375, -3.402099609375, -3.263671875, -3.125244140625, -2.98681640625, -2.848388671875, -2.7099609375, -2.571533203125, -2.43310546875, -2.294677734375, -2.15625, -2.017822265625, -1.87939453125, -1.740966796875, -1.6025390625, -1.464111328125, -1.32568359375, -1.187255859375, -1.048828125, -0.910400390625, -0.77197265625, -0.633544921875, -0.4951171875, -0.356689453125, -0.21826171875, -0.079833984375, 0.05859375, 0.197021484375, 0.33544921875, 0.473876953125, 0.6123046875, 0.750732421875, 0.88916015625, 1.027587890625, 1.166015625, 1.304443359375, 1.44287109375, 1.581298828125, 1.7197265625, 1.858154296875, 1.99658203125, 2.135009765625, 2.2734375, 2.411865234375, 2.55029296875, 2.688720703125, 2.8271484375, 2.965576171875, 3.10400390625, 3.242431640625, 3.380859375, 3.519287109375, 3.65771484375, 3.796142578125, 3.9345703125, 4.072998046875, 4.21142578125, 4.349853515625, 4.48828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 6.0, 5.0, 5.0, 12.0, 19.0, 16.0, 19.0, 21.0, 20.0, 30.0, 32.0, 30.0, 29.0, 42.0, 50.0, 65.0, 96.0, 159.0, 364.0, 1380.0, 167.0, 86.0, 66.0, 56.0, 38.0, 42.0, 39.0, 33.0, 18.0, 25.0, 21.0, 17.0, 8.0, 4.0, 7.0, 8.0, 3.0, 3.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -15.9844970703125, -15.500244140625, -15.0159912109375, -14.53173828125, -14.0474853515625, -13.563232421875, -13.0789794921875, -12.5947265625, -12.1104736328125, -11.626220703125, -11.1419677734375, -10.65771484375, -10.1734619140625, -9.689208984375, -9.2049560546875, -8.720703125, -8.2364501953125, -7.752197265625, -7.2679443359375, -6.78369140625, -6.2994384765625, -5.815185546875, -5.3309326171875, -4.8466796875, -4.3624267578125, -3.878173828125, -3.3939208984375, -2.90966796875, -2.4254150390625, -1.941162109375, -1.4569091796875, -0.97265625, -0.4884033203125, -0.004150390625, 0.4801025390625, 0.96435546875, 1.4486083984375, 1.932861328125, 2.4171142578125, 2.9013671875, 3.3856201171875, 3.869873046875, 4.3541259765625, 4.83837890625, 5.3226318359375, 5.806884765625, 6.2911376953125, 6.775390625, 7.2596435546875, 7.743896484375, 8.2281494140625, 8.71240234375, 9.1966552734375, 9.680908203125, 10.1651611328125, 10.6494140625, 11.1336669921875, 11.617919921875, 12.1021728515625, 12.58642578125, 13.0706787109375, 13.554931640625, 14.0391845703125, 14.5234375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 10.0, 11.0, 9.0, 6.0, 18.0, 18.0, 35.0, 31.0, 31.0, 56.0, 62.0, 108.0, 141.0, 270.0, 364.0, 807.0, 3974.0, 52654.0, 2773684.0, 299161.0, 11329.0, 1391.0, 509.0, 286.0, 180.0, 131.0, 90.0, 76.0, 47.0, 38.0, 40.0, 22.0, 21.0, 17.0, 15.0, 15.0, 15.0, 5.0, 9.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-27.09375, -26.265625, -25.4375, -24.609375, -23.78125, -22.953125, -22.125, -21.296875, -20.46875, -19.640625, -18.8125, -17.984375, -17.15625, -16.328125, -15.5, -14.671875, -13.84375, -13.015625, -12.1875, -11.359375, -10.53125, -9.703125, -8.875, -8.046875, -7.21875, -6.390625, -5.5625, -4.734375, -3.90625, -3.078125, -2.25, -1.421875, -0.59375, 0.234375, 1.0625, 1.890625, 2.71875, 3.546875, 4.375, 5.203125, 6.03125, 6.859375, 7.6875, 8.515625, 9.34375, 10.171875, 11.0, 11.828125, 12.65625, 13.484375, 14.3125, 15.140625, 15.96875, 16.796875, 17.625, 18.453125, 19.28125, 20.109375, 20.9375, 21.765625, 22.59375, 23.421875, 24.25, 25.078125, 25.90625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 95.0, 544.0, 352.0, 21.0, 0.0, 1.0], "bins": [-281.0116882324219, -276.3140869140625, -271.6164855957031, -266.91888427734375, -262.2212829589844, -257.523681640625, -252.82606506347656, -248.1284637451172, -243.4308624267578, -238.73326110839844, -234.03565979003906, -229.3380584716797, -224.64044189453125, -219.94284057617188, -215.2452392578125, -210.54763793945312, -205.85003662109375, -201.15243530273438, -196.454833984375, -191.75723266601562, -187.05963134765625, -182.3620147705078, -177.66441345214844, -172.96681213378906, -168.2692108154297, -163.5716094970703, -158.87400817871094, -154.17640686035156, -149.47879028320312, -144.78118896484375, -140.08358764648438, -135.385986328125, -130.68838500976562, -125.99078369140625, -121.29318237304688, -116.59557342529297, -111.8979721069336, -107.20037078857422, -102.50276184082031, -97.80516052246094, -93.10755920410156, -88.40995788574219, -83.71235656738281, -79.0147476196289, -74.31714630126953, -69.61954498291016, -64.92193603515625, -60.224334716796875, -55.5267333984375, -50.829132080078125, -46.131526947021484, -41.433921813964844, -36.73632049560547, -32.038719177246094, -27.341114044189453, -22.643508911132812, -17.94590950012207, -13.248306274414062, -8.550703048706055, -3.853099822998047, 0.8445034027099609, 5.542106628417969, 10.239709854125977, 14.937314987182617, 19.634916305541992]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 9.0, 6.0, 14.0, 15.0, 18.0, 20.0, 17.0, 20.0, 20.0, 29.0, 28.0, 32.0, 39.0, 30.0, 34.0, 42.0, 35.0, 26.0, 40.0, 40.0, 46.0, 42.0, 41.0, 31.0, 36.0, 29.0, 31.0, 26.0, 27.0, 25.0, 16.0, 14.0, 15.0, 16.0, 18.0, 8.0, 7.0, 8.0, 4.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.806358337402344, -29.73038673400879, -28.654415130615234, -27.578445434570312, -26.502473831176758, -25.426502227783203, -24.35053062438965, -23.274559020996094, -22.198589324951172, -21.122617721557617, -20.046646118164062, -18.97067642211914, -17.894704818725586, -16.81873321533203, -15.742761611938477, -14.666790008544922, -13.590818405151367, -12.514846801757812, -11.438876152038574, -10.36290454864502, -9.286933898925781, -8.210962295532227, -7.134990692138672, -6.059019565582275, -4.983048439025879, -3.9070773124694824, -2.831105947494507, -1.7551345825195312, -0.6791634559631348, 0.3968076705932617, 1.4727792739868164, 2.548750400543213, 3.6247215270996094, 4.700692653656006, 5.776663780212402, 6.852635383605957, 7.9286065101623535, 9.00457763671875, 10.080549240112305, 11.15652084350586, 12.232491493225098, 13.308463096618652, 14.38443374633789, 15.460405349731445, 16.536376953125, 17.612346649169922, 18.68832015991211, 19.76428985595703, 20.840261459350586, 21.91623306274414, 22.992204666137695, 24.06817626953125, 25.144145965576172, 26.220117568969727, 27.29608917236328, 28.372060775756836, 29.44803237915039, 30.524003982543945, 31.5999755859375, 32.67594528198242, 33.75191879272461, 34.82788848876953, 35.90386199951172, 36.97983169555664, 38.05580139160156]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 11.0, 7.0, 15.0, 18.0, 16.0, 14.0, 17.0, 10.0, 29.0, 24.0, 30.0, 33.0, 30.0, 39.0, 26.0, 39.0, 36.0, 35.0, 27.0, 38.0, 28.0, 35.0, 40.0, 37.0, 33.0, 22.0, 39.0, 29.0, 27.0, 34.0, 18.0, 17.0, 19.0, 24.0, 12.0, 18.0, 12.0, 9.0, 7.0, 2.0, 5.0, 3.0, 2.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.533203125, -3.4180908203125, -3.302978515625, -3.1878662109375, -3.07275390625, -2.9576416015625, -2.842529296875, -2.7274169921875, -2.6123046875, -2.4971923828125, -2.382080078125, -2.2669677734375, -2.15185546875, -2.0367431640625, -1.921630859375, -1.8065185546875, -1.69140625, -1.5762939453125, -1.461181640625, -1.3460693359375, -1.23095703125, -1.1158447265625, -1.000732421875, -0.8856201171875, -0.7705078125, -0.6553955078125, -0.540283203125, -0.4251708984375, -0.31005859375, -0.1949462890625, -0.079833984375, 0.0352783203125, 0.150390625, 0.2655029296875, 0.380615234375, 0.4957275390625, 0.61083984375, 0.7259521484375, 0.841064453125, 0.9561767578125, 1.0712890625, 1.1864013671875, 1.301513671875, 1.4166259765625, 1.53173828125, 1.6468505859375, 1.761962890625, 1.8770751953125, 1.9921875, 2.1072998046875, 2.222412109375, 2.3375244140625, 2.45263671875, 2.5677490234375, 2.682861328125, 2.7979736328125, 2.9130859375, 3.0281982421875, 3.143310546875, 3.2584228515625, 3.37353515625, 3.4886474609375, 3.603759765625, 3.7188720703125, 3.833984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 6.0, 11.0, 12.0, 20.0, 17.0, 25.0, 22.0, 26.0, 44.0, 44.0, 41.0, 70.0, 84.0, 121.0, 148.0, 290.0, 708.0, 2431.0, 10181.0, 60474.0, 466240.0, 2442651.0, 1056763.0, 128099.0, 19329.0, 4028.0, 1201.0, 419.0, 211.0, 121.0, 87.0, 55.0, 65.0, 40.0, 47.0, 26.0, 20.0, 23.0, 20.0, 14.0, 6.0, 8.0, 4.0, 8.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.46875, -11.0950927734375, -10.721435546875, -10.3477783203125, -9.97412109375, -9.6004638671875, -9.226806640625, -8.8531494140625, -8.4794921875, -8.1058349609375, -7.732177734375, -7.3585205078125, -6.98486328125, -6.6112060546875, -6.237548828125, -5.8638916015625, -5.490234375, -5.1165771484375, -4.742919921875, -4.3692626953125, -3.99560546875, -3.6219482421875, -3.248291015625, -2.8746337890625, -2.5009765625, -2.1273193359375, -1.753662109375, -1.3800048828125, -1.00634765625, -0.6326904296875, -0.259033203125, 0.1146240234375, 0.48828125, 0.8619384765625, 1.235595703125, 1.6092529296875, 1.98291015625, 2.3565673828125, 2.730224609375, 3.1038818359375, 3.4775390625, 3.8511962890625, 4.224853515625, 4.5985107421875, 4.97216796875, 5.3458251953125, 5.719482421875, 6.0931396484375, 6.466796875, 6.8404541015625, 7.214111328125, 7.5877685546875, 7.96142578125, 8.3350830078125, 8.708740234375, 9.0823974609375, 9.4560546875, 9.8297119140625, 10.203369140625, 10.5770263671875, 10.95068359375, 11.3243408203125, 11.697998046875, 12.0716552734375, 12.4453125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 11.0, 21.0, 48.0, 100.0, 134.0, 242.0, 429.0, 622.0, 773.0, 723.0, 432.0, 234.0, 143.0, 77.0, 31.0, 21.0, 15.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.640625, -25.0223388671875, -24.404052734375, -23.7857666015625, -23.16748046875, -22.5491943359375, -21.930908203125, -21.3126220703125, -20.6943359375, -20.0760498046875, -19.457763671875, -18.8394775390625, -18.22119140625, -17.6029052734375, -16.984619140625, -16.3663330078125, -15.748046875, -15.1297607421875, -14.511474609375, -13.8931884765625, -13.27490234375, -12.6566162109375, -12.038330078125, -11.4200439453125, -10.8017578125, -10.1834716796875, -9.565185546875, -8.9468994140625, -8.32861328125, -7.7103271484375, -7.092041015625, -6.4737548828125, -5.85546875, -5.2371826171875, -4.618896484375, -4.0006103515625, -3.38232421875, -2.7640380859375, -2.145751953125, -1.5274658203125, -0.9091796875, -0.2908935546875, 0.327392578125, 0.9456787109375, 1.56396484375, 2.1822509765625, 2.800537109375, 3.4188232421875, 4.037109375, 4.6553955078125, 5.273681640625, 5.8919677734375, 6.51025390625, 7.1285400390625, 7.746826171875, 8.3651123046875, 8.9833984375, 9.6016845703125, 10.219970703125, 10.8382568359375, 11.45654296875, 12.0748291015625, 12.693115234375, 13.3114013671875, 13.9296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 23.0, 27.0, 57.0, 132.0, 287.0, 804.0, 6374.0, 1127948.0, 3039808.0, 17066.0, 1057.0, 329.0, 173.0, 93.0, 44.0, 25.0, 10.0, 12.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.90625, -32.37353515625, -30.8408203125, -29.30810546875, -27.775390625, -26.24267578125, -24.7099609375, -23.17724609375, -21.64453125, -20.11181640625, -18.5791015625, -17.04638671875, -15.513671875, -13.98095703125, -12.4482421875, -10.91552734375, -9.3828125, -7.85009765625, -6.3173828125, -4.78466796875, -3.251953125, -1.71923828125, -0.1865234375, 1.34619140625, 2.87890625, 4.41162109375, 5.9443359375, 7.47705078125, 9.009765625, 10.54248046875, 12.0751953125, 13.60791015625, 15.140625, 16.67333984375, 18.2060546875, 19.73876953125, 21.271484375, 22.80419921875, 24.3369140625, 25.86962890625, 27.40234375, 28.93505859375, 30.4677734375, 32.00048828125, 33.533203125, 35.06591796875, 36.5986328125, 38.13134765625, 39.6640625, 41.19677734375, 42.7294921875, 44.26220703125, 45.794921875, 47.32763671875, 48.8603515625, 50.39306640625, 51.92578125, 53.45849609375, 54.9912109375, 56.52392578125, 58.056640625, 59.58935546875, 61.1220703125, 62.65478515625, 64.1875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 16.0, 34.0, 53.0, 64.0, 104.0, 124.0, 140.0, 128.0, 126.0, 83.0, 54.0, 40.0, 21.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.774452209472656, -45.384422302246094, -42.99439239501953, -40.604366302490234, -38.21433639526367, -35.82430648803711, -33.43428039550781, -31.04425048828125, -28.654220581054688, -26.264190673828125, -23.874162673950195, -21.484134674072266, -19.094104766845703, -16.70407485961914, -14.314046859741211, -11.924018859863281, -9.533988952636719, -7.143959999084473, -4.753931045532227, -2.3639020919799805, 0.026126861572265625, 2.4161558151245117, 4.806184768676758, 7.1962127685546875, 9.58624267578125, 11.976271629333496, 14.366300582885742, 16.756328582763672, 19.146358489990234, 21.536388397216797, 23.926416397094727, 26.316444396972656, 28.706466674804688, 31.09649658203125, 33.48652648925781, 35.87655258178711, 38.26658248901367, 40.656612396240234, 43.04663848876953, 45.436668395996094, 47.826698303222656, 50.21672821044922, 52.60675811767578, 54.99678421020508, 57.38681411743164, 59.7768440246582, 62.1668701171875, 64.55690002441406, 66.94692993164062, 69.33695983886719, 71.72698974609375, 74.11701965332031, 76.50704956054688, 78.8970718383789, 81.28710174560547, 83.67713165283203, 86.0671615600586, 88.45719146728516, 90.84722137451172, 93.23725128173828, 95.62727355957031, 98.01730346679688, 100.40733337402344, 102.79736328125, 105.18739318847656]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 5.0, 4.0, 4.0, 12.0, 12.0, 15.0, 14.0, 17.0, 22.0, 21.0, 26.0, 16.0, 21.0, 25.0, 37.0, 26.0, 26.0, 34.0, 47.0, 53.0, 49.0, 43.0, 37.0, 41.0, 36.0, 37.0, 35.0, 30.0, 32.0, 19.0, 27.0, 22.0, 21.0, 16.0, 15.0, 18.0, 8.0, 12.0, 13.0, 13.0, 8.0, 5.0, 8.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-32.529579162597656, -31.45688247680664, -30.384187698364258, -29.311491012573242, -28.238794326782227, -27.166099548339844, -26.093402862548828, -25.020706176757812, -23.948009490966797, -22.87531280517578, -21.8026180267334, -20.729921340942383, -19.657224655151367, -18.584529876708984, -17.51183319091797, -16.439136505126953, -15.36644172668457, -14.293745994567871, -13.221049308776855, -12.148353576660156, -11.07565689086914, -10.002961158752441, -8.930265426635742, -7.857569217681885, -6.784873008728027, -5.71217679977417, -4.6394805908203125, -3.5667848587036133, -2.494088649749756, -1.4213924407958984, -0.3486967086791992, 0.7239995002746582, 1.7966957092285156, 2.869391918182373, 3.9420878887176514, 5.01478385925293, 6.087480068206787, 7.1601762771606445, 8.232872009277344, 9.30556869506836, 10.378264427185059, 11.450960159301758, 12.523656845092773, 13.596352577209473, 14.669048309326172, 15.741744995117188, 16.814441680908203, 17.887136459350586, 18.9598331451416, 20.032529830932617, 21.105224609375, 22.177921295166016, 23.25061798095703, 24.323314666748047, 25.39600944519043, 26.468706130981445, 27.541400909423828, 28.614097595214844, 29.686792373657227, 30.759489059448242, 31.832185745239258, 32.90488052368164, 33.977577209472656, 35.05027389526367, 36.12297058105469]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 13.0, 6.0, 7.0, 11.0, 12.0, 19.0, 12.0, 18.0, 23.0, 26.0, 29.0, 13.0, 25.0, 23.0, 29.0, 29.0, 28.0, 31.0, 40.0, 39.0, 40.0, 46.0, 31.0, 40.0, 36.0, 34.0, 35.0, 28.0, 34.0, 45.0, 32.0, 22.0, 23.0, 17.0, 15.0, 19.0, 19.0, 13.0, 9.0, 6.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.78515625, -3.66119384765625, -3.5372314453125, -3.41326904296875, -3.289306640625, -3.16534423828125, -3.0413818359375, -2.91741943359375, -2.79345703125, -2.66949462890625, -2.5455322265625, -2.42156982421875, -2.297607421875, -2.17364501953125, -2.0496826171875, -1.92572021484375, -1.8017578125, -1.67779541015625, -1.5538330078125, -1.42987060546875, -1.305908203125, -1.18194580078125, -1.0579833984375, -0.93402099609375, -0.81005859375, -0.68609619140625, -0.5621337890625, -0.43817138671875, -0.314208984375, -0.19024658203125, -0.0662841796875, 0.05767822265625, 0.181640625, 0.30560302734375, 0.4295654296875, 0.55352783203125, 0.677490234375, 0.80145263671875, 0.9254150390625, 1.04937744140625, 1.17333984375, 1.29730224609375, 1.4212646484375, 1.54522705078125, 1.669189453125, 1.79315185546875, 1.9171142578125, 2.04107666015625, 2.1650390625, 2.28900146484375, 2.4129638671875, 2.53692626953125, 2.660888671875, 2.78485107421875, 2.9088134765625, 3.03277587890625, 3.15673828125, 3.28070068359375, 3.4046630859375, 3.52862548828125, 3.652587890625, 3.77655029296875, 3.9005126953125, 4.02447509765625, 4.1484375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 10.0, 15.0, 34.0, 36.0, 53.0, 84.0, 137.0, 197.0, 342.0, 497.0, 775.0, 1245.0, 1997.0, 3175.0, 5128.0, 8227.0, 13291.0, 21153.0, 33623.0, 51765.0, 76085.0, 104058.0, 129424.0, 140744.0, 130709.0, 104680.0, 77005.0, 52545.0, 33963.0, 21598.0, 13460.0, 8434.0, 5230.0, 3217.0, 2001.0, 1293.0, 828.0, 519.0, 360.0, 214.0, 121.0, 105.0, 79.0, 31.0, 17.0, 17.0, 13.0, 6.0, 7.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7929611206054688, -0.7660980224609375, -0.7392349243164062, -0.712371826171875, -0.6855087280273438, -0.6586456298828125, -0.6317825317382812, -0.60491943359375, -0.5780563354492188, -0.5511932373046875, -0.5243301391601562, -0.497467041015625, -0.47060394287109375, -0.4437408447265625, -0.41687774658203125, -0.3900146484375, -0.36315155029296875, -0.3362884521484375, -0.30942535400390625, -0.282562255859375, -0.25569915771484375, -0.2288360595703125, -0.20197296142578125, -0.17510986328125, -0.14824676513671875, -0.1213836669921875, -0.09452056884765625, -0.067657470703125, -0.04079437255859375, -0.0139312744140625, 0.01293182373046875, 0.039794921875, 0.06665802001953125, 0.0935211181640625, 0.12038421630859375, 0.147247314453125, 0.17411041259765625, 0.2009735107421875, 0.22783660888671875, 0.25469970703125, 0.28156280517578125, 0.3084259033203125, 0.33528900146484375, 0.362152099609375, 0.38901519775390625, 0.4158782958984375, 0.44274139404296875, 0.4696044921875, 0.49646759033203125, 0.5233306884765625, 0.5501937866210938, 0.577056884765625, 0.6039199829101562, 0.6307830810546875, 0.6576461791992188, 0.68450927734375, 0.7113723754882812, 0.7382354736328125, 0.7650985717773438, 0.791961669921875, 0.8188247680664062, 0.8456878662109375, 0.8725509643554688, 0.8994140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 8.0, 7.0, 9.0, 14.0, 24.0, 13.0, 16.0, 27.0, 30.0, 25.0, 22.0, 31.0, 38.0, 37.0, 29.0, 34.0, 46.0, 43.0, 1055.0, 31.0, 37.0, 32.0, 36.0, 33.0, 32.0, 43.0, 27.0, 35.0, 30.0, 28.0, 22.0, 21.0, 14.0, 8.0, 14.0, 7.0, 11.0, 12.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.853515625, -3.73992919921875, -3.6263427734375, -3.51275634765625, -3.399169921875, -3.28558349609375, -3.1719970703125, -3.05841064453125, -2.94482421875, -2.83123779296875, -2.7176513671875, -2.60406494140625, -2.490478515625, -2.37689208984375, -2.2633056640625, -2.14971923828125, -2.0361328125, -1.92254638671875, -1.8089599609375, -1.69537353515625, -1.581787109375, -1.46820068359375, -1.3546142578125, -1.24102783203125, -1.12744140625, -1.01385498046875, -0.9002685546875, -0.78668212890625, -0.673095703125, -0.55950927734375, -0.4459228515625, -0.33233642578125, -0.21875, -0.10516357421875, 0.0084228515625, 0.12200927734375, 0.235595703125, 0.34918212890625, 0.4627685546875, 0.57635498046875, 0.68994140625, 0.80352783203125, 0.9171142578125, 1.03070068359375, 1.144287109375, 1.25787353515625, 1.3714599609375, 1.48504638671875, 1.5986328125, 1.71221923828125, 1.8258056640625, 1.93939208984375, 2.052978515625, 2.16656494140625, 2.2801513671875, 2.39373779296875, 2.50732421875, 2.62091064453125, 2.7344970703125, 2.84808349609375, 2.961669921875, 3.07525634765625, 3.1888427734375, 3.30242919921875, 3.416015625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 4.0, 10.0, 6.0, 20.0, 18.0, 37.0, 65.0, 106.0, 117.0, 199.0, 337.0, 502.0, 853.0, 1477.0, 2581.0, 4736.0, 8334.0, 15439.0, 29021.0, 66406.0, 1877041.0, 42165.0, 21608.0, 11421.0, 6226.0, 3569.0, 1996.0, 1132.0, 644.0, 379.0, 232.0, 140.0, 102.0, 63.0, 47.0, 26.0, 18.0, 15.0, 7.0, 6.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6748046875, -1.6212310791015625, -1.567657470703125, -1.5140838623046875, -1.46051025390625, -1.4069366455078125, -1.353363037109375, -1.2997894287109375, -1.2462158203125, -1.1926422119140625, -1.139068603515625, -1.0854949951171875, -1.03192138671875, -0.9783477783203125, -0.924774169921875, -0.8712005615234375, -0.817626953125, -0.7640533447265625, -0.710479736328125, -0.6569061279296875, -0.60333251953125, -0.5497589111328125, -0.496185302734375, -0.4426116943359375, -0.3890380859375, -0.3354644775390625, -0.281890869140625, -0.2283172607421875, -0.17474365234375, -0.1211700439453125, -0.067596435546875, -0.0140228271484375, 0.03955078125, 0.0931243896484375, 0.146697998046875, 0.2002716064453125, 0.25384521484375, 0.3074188232421875, 0.360992431640625, 0.4145660400390625, 0.4681396484375, 0.5217132568359375, 0.575286865234375, 0.6288604736328125, 0.68243408203125, 0.7360076904296875, 0.789581298828125, 0.8431549072265625, 0.896728515625, 0.9503021240234375, 1.003875732421875, 1.0574493408203125, 1.11102294921875, 1.1645965576171875, 1.218170166015625, 1.2717437744140625, 1.3253173828125, 1.3788909912109375, 1.432464599609375, 1.4860382080078125, 1.53961181640625, 1.5931854248046875, 1.646759033203125, 1.7003326416015625, 1.75390625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 6.0, 5.0, 2.0, 4.0, 5.0, 2.0, 5.0, 9.0, 9.0, 12.0, 26.0, 23.0, 37.0, 46.0, 66.0, 112.0, 158.0, 135.0, 100.0, 59.0, 43.0, 25.0, 22.0, 17.0, 13.0, 11.0, 8.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08392333984375, -0.08150863647460938, -0.07909393310546875, -0.07667922973632812, -0.0742645263671875, -0.07184982299804688, -0.06943511962890625, -0.06702041625976562, -0.064605712890625, -0.062191009521484375, -0.05977630615234375, -0.057361602783203125, -0.0549468994140625, -0.052532196044921875, -0.05011749267578125, -0.047702789306640625, -0.0452880859375, -0.042873382568359375, -0.04045867919921875, -0.038043975830078125, -0.0356292724609375, -0.033214569091796875, -0.03079986572265625, -0.028385162353515625, -0.025970458984375, -0.023555755615234375, -0.02114105224609375, -0.018726348876953125, -0.0163116455078125, -0.013896942138671875, -0.01148223876953125, -0.009067535400390625, -0.00665283203125, -0.004238128662109375, -0.00182342529296875, 0.000591278076171875, 0.0030059814453125, 0.005420684814453125, 0.00783538818359375, 0.010250091552734375, 0.012664794921875, 0.015079498291015625, 0.01749420166015625, 0.019908905029296875, 0.0223236083984375, 0.024738311767578125, 0.02715301513671875, 0.029567718505859375, 0.031982421875, 0.034397125244140625, 0.03681182861328125, 0.039226531982421875, 0.0416412353515625, 0.044055938720703125, 0.04647064208984375, 0.048885345458984375, 0.051300048828125, 0.053714752197265625, 0.05612945556640625, 0.058544158935546875, 0.0609588623046875, 0.06337356567382812, 0.06578826904296875, 0.06820297241210938, 0.07061767578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 3.0, 6.0, 8.0, 1.0, 7.0, 10.0, 8.0, 24.0, 59.0, 110.0, 282.0, 623.0, 1484.0, 3998.0, 13208.0, 97040.0, 903214.0, 19773.0, 5384.0, 1923.0, 772.0, 349.0, 147.0, 44.0, 21.0, 12.0, 11.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.453857421875, -1.38818359375, -1.322509765625, -1.2568359375, -1.191162109375, -1.12548828125, -1.059814453125, -0.994140625, -0.928466796875, -0.86279296875, -0.797119140625, -0.7314453125, -0.665771484375, -0.60009765625, -0.534423828125, -0.46875, -0.403076171875, -0.33740234375, -0.271728515625, -0.2060546875, -0.140380859375, -0.07470703125, -0.009033203125, 0.056640625, 0.122314453125, 0.18798828125, 0.253662109375, 0.3193359375, 0.385009765625, 0.45068359375, 0.516357421875, 0.58203125, 0.647705078125, 0.71337890625, 0.779052734375, 0.8447265625, 0.910400390625, 0.97607421875, 1.041748046875, 1.107421875, 1.173095703125, 1.23876953125, 1.304443359375, 1.3701171875, 1.435791015625, 1.50146484375, 1.567138671875, 1.6328125, 1.698486328125, 1.76416015625, 1.829833984375, 1.8955078125, 1.961181640625, 2.02685546875, 2.092529296875, 2.158203125, 2.223876953125, 2.28955078125, 2.355224609375, 2.4208984375, 2.486572265625, 2.55224609375, 2.617919921875, 2.68359375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 7.0, 11.0, 13.0, 13.0, 14.0, 29.0, 26.0, 34.0, 51.0, 66.0, 108.0, 159.0, 149.0, 84.0, 57.0, 46.0, 22.0, 21.0, 14.0, 13.0, 7.0, 10.0, 14.0, 5.0, 1.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41542819142341614, -0.3993523120880127, -0.38327643275260925, -0.3672005534172058, -0.35112470388412476, -0.3350487947463989, -0.31897294521331787, -0.30289706587791443, -0.286821186542511, -0.27074530720710754, -0.2546694278717041, -0.23859356343746185, -0.2225176841020584, -0.20644180476665497, -0.19036594033241272, -0.17429006099700928, -0.15821418166160583, -0.1421383023262024, -0.12606242299079895, -0.1099865585565567, -0.09391067922115326, -0.07783479988574982, -0.06175892800092697, -0.045683056116104126, -0.029607176780700684, -0.01353130117058754, 0.0025445744395256042, 0.018620450049638748, 0.03469632565975189, 0.050772204995155334, 0.06684807687997818, 0.08292394876480103, 0.09899979829788208, 0.11507567763328552, 0.13115155696868896, 0.1472274214029312, 0.16330330073833466, 0.1793791800737381, 0.19545504450798035, 0.2115309238433838, 0.22760680317878723, 0.24368268251419067, 0.2597585618495941, 0.27583444118499756, 0.2919102907180786, 0.30798619985580444, 0.3240620493888855, 0.34013792872428894, 0.3562138080596924, 0.3722896873950958, 0.38836556673049927, 0.4044414460659027, 0.42051732540130615, 0.4365931749343872, 0.45266905426979065, 0.4687449336051941, 0.48482081294059753, 0.500896692276001, 0.516972541809082, 0.5330484509468079, 0.5491243004798889, 0.5652002096176147, 0.5812760591506958, 0.5973519086837769, 0.6134278178215027]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 10.0, 12.0, 7.0, 8.0, 12.0, 12.0, 16.0, 21.0, 9.0, 32.0, 22.0, 31.0, 34.0, 38.0, 38.0, 36.0, 32.0, 29.0, 29.0, 41.0, 34.0, 31.0, 38.0, 46.0, 36.0, 33.0, 32.0, 26.0, 23.0, 24.0, 36.0, 31.0, 23.0, 12.0, 17.0, 21.0, 13.0, 6.0, 13.0, 8.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.08817368745803833, -0.08555568009614944, -0.08293767273426056, -0.08031967282295227, -0.07770166546106339, -0.0750836580991745, -0.07246565818786621, -0.06984765082597733, -0.06722964346408844, -0.06461163610219955, -0.06199363246560097, -0.05937562882900238, -0.056757621467113495, -0.05413961410522461, -0.05152161046862602, -0.048903606832027435, -0.04628559947013855, -0.043667592108249664, -0.04104958847165108, -0.03843158483505249, -0.035813577473163605, -0.03319557011127472, -0.030577566474676132, -0.027959560975432396, -0.02534155547618866, -0.022723549976944923, -0.020105544477701187, -0.01748753897845745, -0.014869533479213715, -0.012251527979969978, -0.009633522480726242, -0.007015516981482506, -0.0043975114822387695, -0.0017795059829950333, 0.000838499516248703, 0.0034565050154924393, 0.0060745105147361755, 0.008692516013979912, 0.011310521513223648, 0.013928527012467384, 0.01654653251171112, 0.019164538010954857, 0.021782543510198593, 0.02440054900944233, 0.027018554508686066, 0.029636560007929802, 0.03225456550717354, 0.034872569143772125, 0.03749057650566101, 0.040108583867549896, 0.04272658750414848, 0.04534459114074707, 0.047962598502635956, 0.05058060586452484, 0.05319860950112343, 0.055816613137722015, 0.0584346204996109, 0.061052627861499786, 0.06367063522338867, 0.06628863513469696, 0.06890664249658585, 0.07152464985847473, 0.07414264976978302, 0.0767606571316719, 0.07937866449356079]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 6.0, 6.0, 5.0, 6.0, 14.0, 11.0, 14.0, 20.0, 18.0, 16.0, 19.0, 22.0, 27.0, 22.0, 23.0, 28.0, 37.0, 37.0, 28.0, 39.0, 32.0, 31.0, 42.0, 50.0, 36.0, 39.0, 30.0, 37.0, 39.0, 24.0, 25.0, 32.0, 23.0, 25.0, 21.0, 23.0, 20.0, 17.0, 10.0, 5.0, 3.0, 8.0, 3.0, 3.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.669921875, -3.548858642578125, -3.42779541015625, -3.306732177734375, -3.1856689453125, -3.064605712890625, -2.94354248046875, -2.822479248046875, -2.701416015625, -2.580352783203125, -2.45928955078125, -2.338226318359375, -2.2171630859375, -2.096099853515625, -1.97503662109375, -1.853973388671875, -1.73291015625, -1.611846923828125, -1.49078369140625, -1.369720458984375, -1.2486572265625, -1.127593994140625, -1.00653076171875, -0.885467529296875, -0.764404296875, -0.643341064453125, -0.52227783203125, -0.401214599609375, -0.2801513671875, -0.159088134765625, -0.03802490234375, 0.083038330078125, 0.2041015625, 0.325164794921875, 0.44622802734375, 0.567291259765625, 0.6883544921875, 0.809417724609375, 0.93048095703125, 1.051544189453125, 1.172607421875, 1.293670654296875, 1.41473388671875, 1.535797119140625, 1.6568603515625, 1.777923583984375, 1.89898681640625, 2.020050048828125, 2.14111328125, 2.262176513671875, 2.38323974609375, 2.504302978515625, 2.6253662109375, 2.746429443359375, 2.86749267578125, 2.988555908203125, 3.109619140625, 3.230682373046875, 3.35174560546875, 3.472808837890625, 3.5938720703125, 3.714935302734375, 3.83599853515625, 3.957061767578125, 4.078125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 4.0, 15.0, 17.0, 29.0, 40.0, 65.0, 116.0, 150.0, 274.0, 402.0, 698.0, 1078.0, 1650.0, 2603.0, 3969.0, 6085.0, 8989.0, 13683.0, 21471.0, 33322.0, 54172.0, 99180.0, 203659.0, 258220.0, 146344.0, 72827.0, 42433.0, 27062.0, 17471.0, 11431.0, 7228.0, 4856.0, 3193.0, 2116.0, 1252.0, 904.0, 607.0, 360.0, 223.0, 121.0, 88.0, 48.0, 38.0, 13.0, 11.0, 8.0, 15.0, 7.0, 3.0, 3.0, 1.0, 2.0], "bins": [-3.80859375, -3.700592041015625, -3.59259033203125, -3.484588623046875, -3.3765869140625, -3.268585205078125, -3.16058349609375, -3.052581787109375, -2.944580078125, -2.836578369140625, -2.72857666015625, -2.620574951171875, -2.5125732421875, -2.404571533203125, -2.29656982421875, -2.188568115234375, -2.08056640625, -1.972564697265625, -1.86456298828125, -1.756561279296875, -1.6485595703125, -1.540557861328125, -1.43255615234375, -1.324554443359375, -1.216552734375, -1.108551025390625, -1.00054931640625, -0.892547607421875, -0.7845458984375, -0.676544189453125, -0.56854248046875, -0.460540771484375, -0.3525390625, -0.244537353515625, -0.13653564453125, -0.028533935546875, 0.0794677734375, 0.187469482421875, 0.29547119140625, 0.403472900390625, 0.511474609375, 0.619476318359375, 0.72747802734375, 0.835479736328125, 0.9434814453125, 1.051483154296875, 1.15948486328125, 1.267486572265625, 1.37548828125, 1.483489990234375, 1.59149169921875, 1.699493408203125, 1.8074951171875, 1.915496826171875, 2.02349853515625, 2.131500244140625, 2.239501953125, 2.347503662109375, 2.45550537109375, 2.563507080078125, 2.6715087890625, 2.779510498046875, 2.88751220703125, 2.995513916015625, 3.103515625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 15.0, 10.0, 17.0, 25.0, 19.0, 28.0, 35.0, 26.0, 39.0, 45.0, 47.0, 51.0, 73.0, 128.0, 300.0, 1411.0, 206.0, 92.0, 65.0, 45.0, 41.0, 37.0, 40.0, 42.0, 31.0, 30.0, 14.0, 27.0, 14.0, 13.0, 9.0, 8.0, 4.0, 4.0, 9.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.421875, -14.912109375, -14.40234375, -13.892578125, -13.3828125, -12.873046875, -12.36328125, -11.853515625, -11.34375, -10.833984375, -10.32421875, -9.814453125, -9.3046875, -8.794921875, -8.28515625, -7.775390625, -7.265625, -6.755859375, -6.24609375, -5.736328125, -5.2265625, -4.716796875, -4.20703125, -3.697265625, -3.1875, -2.677734375, -2.16796875, -1.658203125, -1.1484375, -0.638671875, -0.12890625, 0.380859375, 0.890625, 1.400390625, 1.91015625, 2.419921875, 2.9296875, 3.439453125, 3.94921875, 4.458984375, 4.96875, 5.478515625, 5.98828125, 6.498046875, 7.0078125, 7.517578125, 8.02734375, 8.537109375, 9.046875, 9.556640625, 10.06640625, 10.576171875, 11.0859375, 11.595703125, 12.10546875, 12.615234375, 13.125, 13.634765625, 14.14453125, 14.654296875, 15.1640625, 15.673828125, 16.18359375, 16.693359375, 17.203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 1.0, 4.0, 4.0, 14.0, 18.0, 19.0, 17.0, 33.0, 47.0, 50.0, 84.0, 121.0, 163.0, 260.0, 521.0, 1742.0, 22871.0, 2851505.0, 261425.0, 4837.0, 941.0, 373.0, 176.0, 131.0, 95.0, 73.0, 46.0, 39.0, 24.0, 7.0, 13.0, 10.0, 14.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03125, -37.76220703125, -36.4931640625, -35.22412109375, -33.955078125, -32.68603515625, -31.4169921875, -30.14794921875, -28.87890625, -27.60986328125, -26.3408203125, -25.07177734375, -23.802734375, -22.53369140625, -21.2646484375, -19.99560546875, -18.7265625, -17.45751953125, -16.1884765625, -14.91943359375, -13.650390625, -12.38134765625, -11.1123046875, -9.84326171875, -8.57421875, -7.30517578125, -6.0361328125, -4.76708984375, -3.498046875, -2.22900390625, -0.9599609375, 0.30908203125, 1.578125, 2.84716796875, 4.1162109375, 5.38525390625, 6.654296875, 7.92333984375, 9.1923828125, 10.46142578125, 11.73046875, 12.99951171875, 14.2685546875, 15.53759765625, 16.806640625, 18.07568359375, 19.3447265625, 20.61376953125, 21.8828125, 23.15185546875, 24.4208984375, 25.68994140625, 26.958984375, 28.22802734375, 29.4970703125, 30.76611328125, 32.03515625, 33.30419921875, 34.5732421875, 35.84228515625, 37.111328125, 38.38037109375, 39.6494140625, 40.91845703125, 42.1875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 141.0, 701.0, 176.0, 0.0, 1.0, 0.0, 1.0], "bins": [-435.0611267089844, -427.6274719238281, -420.19384765625, -412.76019287109375, -405.3265686035156, -397.8929138183594, -390.45928955078125, -383.025634765625, -375.5920104980469, -368.1583557128906, -360.7247314453125, -353.29107666015625, -345.8574523925781, -338.4237976074219, -330.99017333984375, -323.5565185546875, -316.12286376953125, -308.689208984375, -301.2555847167969, -293.8219299316406, -286.3883056640625, -278.95465087890625, -271.5210266113281, -264.0873718261719, -256.65374755859375, -249.22010803222656, -241.78646850585938, -234.3528289794922, -226.919189453125, -219.4855499267578, -212.05191040039062, -204.61825561523438, -197.18463134765625, -189.75099182128906, -182.31735229492188, -174.8837127685547, -167.4500732421875, -160.0164337158203, -152.58279418945312, -145.14913940429688, -137.71551513671875, -130.28187561035156, -122.84823608398438, -115.41459655761719, -107.98095703125, -100.54731750488281, -93.1136703491211, -85.6800308227539, -78.24638366699219, -70.812744140625, -63.37910461425781, -55.94546127319336, -48.51182174682617, -41.078182220458984, -33.64453887939453, -26.210899353027344, -18.777259826660156, -11.343619346618652, -3.9099788665771484, 3.523662567138672, 10.95730209350586, 18.390941619873047, 25.8245849609375, 33.25822448730469, 40.691864013671875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 14.0, 11.0, 9.0, 11.0, 17.0, 18.0, 16.0, 29.0, 20.0, 25.0, 36.0, 43.0, 49.0, 42.0, 49.0, 39.0, 40.0, 48.0, 37.0, 45.0, 35.0, 45.0, 36.0, 42.0, 31.0, 31.0, 26.0, 25.0, 25.0, 22.0, 16.0, 6.0, 11.0, 9.0, 8.0, 8.0, 6.0, 5.0, 1.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.059810638427734, -49.48185729980469, -47.903907775878906, -46.32595443725586, -44.74800109863281, -43.17005157470703, -41.592098236083984, -40.01414489746094, -38.436195373535156, -36.85824203491211, -35.28029251098633, -33.70233917236328, -32.1243896484375, -30.546436309814453, -28.968482971191406, -27.390531539916992, -25.812580108642578, -24.234628677368164, -22.65667724609375, -21.078723907470703, -19.50077247619629, -17.922821044921875, -16.344867706298828, -14.766916275024414, -13.18896484375, -11.611013412475586, -10.033061027526855, -8.455108642578125, -6.877157211303711, -5.299205303192139, -3.7212533950805664, -2.143301010131836, -0.5653457641601562, 1.012606143951416, 2.5905580520629883, 4.1685099601745605, 5.746461868286133, 7.324413776397705, 8.902365684509277, 10.480318069458008, 12.058269500732422, 13.636220932006836, 15.214173316955566, 16.792125701904297, 18.37007713317871, 19.948028564453125, 21.525981903076172, 23.103933334350586, 24.681884765625, 26.259836196899414, 27.837787628173828, 29.415740966796875, 30.99369239807129, 32.5716438293457, 34.14959716796875, 35.72754669189453, 37.30550003051758, 38.883453369140625, 40.461402893066406, 42.03935623168945, 43.6173095703125, 45.19525909423828, 46.77321243286133, 48.351165771484375, 49.929115295410156]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 5.0, 8.0, 9.0, 13.0, 15.0, 13.0, 14.0, 18.0, 16.0, 17.0, 23.0, 24.0, 23.0, 27.0, 24.0, 36.0, 38.0, 33.0, 34.0, 35.0, 40.0, 42.0, 32.0, 40.0, 36.0, 29.0, 29.0, 33.0, 33.0, 27.0, 30.0, 32.0, 17.0, 24.0, 23.0, 16.0, 11.0, 12.0, 13.0, 9.0, 9.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.8515625, -3.720947265625, -3.59033203125, -3.459716796875, -3.3291015625, -3.198486328125, -3.06787109375, -2.937255859375, -2.806640625, -2.676025390625, -2.54541015625, -2.414794921875, -2.2841796875, -2.153564453125, -2.02294921875, -1.892333984375, -1.76171875, -1.631103515625, -1.50048828125, -1.369873046875, -1.2392578125, -1.108642578125, -0.97802734375, -0.847412109375, -0.716796875, -0.586181640625, -0.45556640625, -0.324951171875, -0.1943359375, -0.063720703125, 0.06689453125, 0.197509765625, 0.328125, 0.458740234375, 0.58935546875, 0.719970703125, 0.8505859375, 0.981201171875, 1.11181640625, 1.242431640625, 1.373046875, 1.503662109375, 1.63427734375, 1.764892578125, 1.8955078125, 2.026123046875, 2.15673828125, 2.287353515625, 2.41796875, 2.548583984375, 2.67919921875, 2.809814453125, 2.9404296875, 3.071044921875, 3.20166015625, 3.332275390625, 3.462890625, 3.593505859375, 3.72412109375, 3.854736328125, 3.9853515625, 4.115966796875, 4.24658203125, 4.377197265625, 4.5078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 11.0, 11.0, 15.0, 14.0, 19.0, 20.0, 35.0, 66.0, 61.0, 134.0, 187.0, 394.0, 663.0, 1384.0, 3033.0, 7500.0, 18495.0, 52795.0, 159570.0, 493309.0, 1250745.0, 1348435.0, 574463.0, 185324.0, 61373.0, 21217.0, 8081.0, 3438.0, 1577.0, 787.0, 412.0, 219.0, 129.0, 92.0, 66.0, 47.0, 39.0, 28.0, 15.0, 13.0, 5.0, 11.0, 7.0, 10.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.796875, -5.59033203125, -5.3837890625, -5.17724609375, -4.970703125, -4.76416015625, -4.5576171875, -4.35107421875, -4.14453125, -3.93798828125, -3.7314453125, -3.52490234375, -3.318359375, -3.11181640625, -2.9052734375, -2.69873046875, -2.4921875, -2.28564453125, -2.0791015625, -1.87255859375, -1.666015625, -1.45947265625, -1.2529296875, -1.04638671875, -0.83984375, -0.63330078125, -0.4267578125, -0.22021484375, -0.013671875, 0.19287109375, 0.3994140625, 0.60595703125, 0.8125, 1.01904296875, 1.2255859375, 1.43212890625, 1.638671875, 1.84521484375, 2.0517578125, 2.25830078125, 2.46484375, 2.67138671875, 2.8779296875, 3.08447265625, 3.291015625, 3.49755859375, 3.7041015625, 3.91064453125, 4.1171875, 4.32373046875, 4.5302734375, 4.73681640625, 4.943359375, 5.14990234375, 5.3564453125, 5.56298828125, 5.76953125, 5.97607421875, 6.1826171875, 6.38916015625, 6.595703125, 6.80224609375, 7.0087890625, 7.21533203125, 7.421875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 12.0, 9.0, 16.0, 25.0, 27.0, 41.0, 65.0, 65.0, 97.0, 146.0, 167.0, 201.0, 263.0, 343.0, 392.0, 404.0, 374.0, 314.0, 271.0, 203.0, 166.0, 137.0, 90.0, 61.0, 37.0, 33.0, 23.0, 20.0, 18.0, 12.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.7391357421875, -9.407958984375, -9.0767822265625, -8.74560546875, -8.4144287109375, -8.083251953125, -7.7520751953125, -7.4208984375, -7.0897216796875, -6.758544921875, -6.4273681640625, -6.09619140625, -5.7650146484375, -5.433837890625, -5.1026611328125, -4.771484375, -4.4403076171875, -4.109130859375, -3.7779541015625, -3.44677734375, -3.1156005859375, -2.784423828125, -2.4532470703125, -2.1220703125, -1.7908935546875, -1.459716796875, -1.1285400390625, -0.79736328125, -0.4661865234375, -0.135009765625, 0.1961669921875, 0.52734375, 0.8585205078125, 1.189697265625, 1.5208740234375, 1.85205078125, 2.1832275390625, 2.514404296875, 2.8455810546875, 3.1767578125, 3.5079345703125, 3.839111328125, 4.1702880859375, 4.50146484375, 4.8326416015625, 5.163818359375, 5.4949951171875, 5.826171875, 6.1573486328125, 6.488525390625, 6.8197021484375, 7.15087890625, 7.4820556640625, 7.813232421875, 8.1444091796875, 8.4755859375, 8.8067626953125, 9.137939453125, 9.4691162109375, 9.80029296875, 10.1314697265625, 10.462646484375, 10.7938232421875, 11.125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 8.0, 13.0, 11.0, 23.0, 35.0, 44.0, 60.0, 91.0, 134.0, 254.0, 441.0, 1229.0, 4945.0, 34159.0, 304980.0, 2143369.0, 1500545.0, 178271.0, 20436.0, 3294.0, 911.0, 390.0, 199.0, 133.0, 84.0, 61.0, 40.0, 32.0, 25.0, 18.0, 10.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.578125, -17.995361328125, -17.41259765625, -16.829833984375, -16.2470703125, -15.664306640625, -15.08154296875, -14.498779296875, -13.916015625, -13.333251953125, -12.75048828125, -12.167724609375, -11.5849609375, -11.002197265625, -10.41943359375, -9.836669921875, -9.25390625, -8.671142578125, -8.08837890625, -7.505615234375, -6.9228515625, -6.340087890625, -5.75732421875, -5.174560546875, -4.591796875, -4.009033203125, -3.42626953125, -2.843505859375, -2.2607421875, -1.677978515625, -1.09521484375, -0.512451171875, 0.0703125, 0.653076171875, 1.23583984375, 1.818603515625, 2.4013671875, 2.984130859375, 3.56689453125, 4.149658203125, 4.732421875, 5.315185546875, 5.89794921875, 6.480712890625, 7.0634765625, 7.646240234375, 8.22900390625, 8.811767578125, 9.39453125, 9.977294921875, 10.56005859375, 11.142822265625, 11.7255859375, 12.308349609375, 12.89111328125, 13.473876953125, 14.056640625, 14.639404296875, 15.22216796875, 15.804931640625, 16.3876953125, 16.970458984375, 17.55322265625, 18.135986328125, 18.71875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 12.0, 18.0, 41.0, 66.0, 125.0, 157.0, 176.0, 162.0, 121.0, 65.0, 36.0, 21.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.363365173339844, -55.38301086425781, -52.40265655517578, -49.422306060791016, -46.441951751708984, -43.46159744262695, -40.48124694824219, -37.500892639160156, -34.520538330078125, -31.540184020996094, -28.559831619262695, -25.579479217529297, -22.599124908447266, -19.618770599365234, -16.638418197631836, -13.658065795898438, -10.677711486816406, -7.697358131408691, -4.717004776000977, -1.7366514205932617, 1.2437019348144531, 4.224055290222168, 7.204408645629883, 10.184761047363281, 13.165115356445312, 16.145469665527344, 19.125822067260742, 22.10617446899414, 25.086528778076172, 28.066883087158203, 31.0472354888916, 34.027587890625, 37.0079345703125, 39.98828887939453, 42.96864318847656, 45.94899368286133, 48.92934799194336, 51.90970230102539, 54.890052795410156, 57.87040710449219, 60.85076141357422, 63.83111572265625, 66.81147003173828, 69.79182434082031, 72.77217102050781, 75.75252532958984, 78.73287963867188, 81.7132339477539, 84.69358825683594, 87.67394256591797, 90.654296875, 93.63465118408203, 96.61500549316406, 99.59535217285156, 102.5757064819336, 105.55606079101562, 108.53641510009766, 111.51676940917969, 114.49712371826172, 117.47747802734375, 120.45782470703125, 123.43817901611328, 126.41853332519531, 129.39889526367188, 132.37924194335938]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 8.0, 5.0, 11.0, 6.0, 17.0, 11.0, 16.0, 24.0, 26.0, 20.0, 20.0, 23.0, 34.0, 27.0, 25.0, 38.0, 38.0, 42.0, 53.0, 47.0, 49.0, 41.0, 42.0, 36.0, 36.0, 24.0, 30.0, 32.0, 25.0, 23.0, 25.0, 18.0, 19.0, 17.0, 14.0, 9.0, 17.0, 10.0, 4.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-34.572418212890625, -33.45365905761719, -32.33489990234375, -31.216144561767578, -30.09738540649414, -28.978626251220703, -27.8598690032959, -26.741111755371094, -25.622352600097656, -24.50359344482422, -23.384836196899414, -22.26607894897461, -21.147319793701172, -20.028560638427734, -18.90980339050293, -17.791046142578125, -16.672286987304688, -15.553528785705566, -14.434770584106445, -13.316012382507324, -12.197254180908203, -11.078495979309082, -9.959737777709961, -8.84097957611084, -7.722221374511719, -6.603463172912598, -5.484704971313477, -4.3659467697143555, -3.2471885681152344, -2.1284303665161133, -1.0096721649169922, 0.1090860366821289, 1.2278404235839844, 2.3465986251831055, 3.4653568267822266, 4.584115028381348, 5.702873229980469, 6.82163143157959, 7.940389633178711, 9.059147834777832, 10.177906036376953, 11.296664237976074, 12.415422439575195, 13.534180641174316, 14.652938842773438, 15.771697044372559, 16.89045524597168, 18.009212493896484, 19.127971649169922, 20.24673080444336, 21.365488052368164, 22.48424530029297, 23.603004455566406, 24.721763610839844, 25.84052085876465, 26.959278106689453, 28.07803726196289, 29.196796417236328, 30.315553665161133, 31.434310913085938, 32.553070068359375, 33.67182922363281, 34.79058837890625, 35.90934371948242, 37.02810287475586]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 7.0, 5.0, 10.0, 13.0, 14.0, 12.0, 13.0, 17.0, 14.0, 19.0, 21.0, 24.0, 27.0, 18.0, 23.0, 30.0, 33.0, 35.0, 25.0, 40.0, 33.0, 37.0, 37.0, 46.0, 25.0, 39.0, 41.0, 31.0, 24.0, 35.0, 26.0, 23.0, 20.0, 26.0, 16.0, 21.0, 13.0, 17.0, 11.0, 11.0, 11.0, 8.0, 8.0, 9.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.494140625, -3.371368408203125, -3.24859619140625, -3.125823974609375, -3.0030517578125, -2.880279541015625, -2.75750732421875, -2.634735107421875, -2.511962890625, -2.389190673828125, -2.26641845703125, -2.143646240234375, -2.0208740234375, -1.898101806640625, -1.77532958984375, -1.652557373046875, -1.52978515625, -1.407012939453125, -1.28424072265625, -1.161468505859375, -1.0386962890625, -0.915924072265625, -0.79315185546875, -0.670379638671875, -0.547607421875, -0.424835205078125, -0.30206298828125, -0.179290771484375, -0.0565185546875, 0.066253662109375, 0.18902587890625, 0.311798095703125, 0.4345703125, 0.557342529296875, 0.68011474609375, 0.802886962890625, 0.9256591796875, 1.048431396484375, 1.17120361328125, 1.293975830078125, 1.416748046875, 1.539520263671875, 1.66229248046875, 1.785064697265625, 1.9078369140625, 2.030609130859375, 2.15338134765625, 2.276153564453125, 2.39892578125, 2.521697998046875, 2.64447021484375, 2.767242431640625, 2.8900146484375, 3.012786865234375, 3.13555908203125, 3.258331298828125, 3.381103515625, 3.503875732421875, 3.62664794921875, 3.749420166015625, 3.8721923828125, 3.994964599609375, 4.11773681640625, 4.240509033203125, 4.36328125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 6.0, 13.0, 13.0, 27.0, 40.0, 56.0, 91.0, 136.0, 214.0, 304.0, 416.0, 657.0, 1008.0, 1696.0, 2433.0, 3632.0, 5224.0, 7952.0, 11314.0, 16599.0, 23394.0, 32624.0, 44420.0, 58585.0, 74124.0, 89607.0, 102137.0, 105706.0, 101001.0, 87713.0, 72934.0, 56940.0, 43466.0, 31670.0, 22496.0, 16064.0, 10897.0, 7514.0, 5088.0, 3468.0, 2343.0, 1556.0, 1018.0, 688.0, 447.0, 298.0, 172.0, 129.0, 89.0, 43.0, 34.0, 24.0, 18.0, 12.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.689453125, -0.66680908203125, -0.6441650390625, -0.62152099609375, -0.598876953125, -0.57623291015625, -0.5535888671875, -0.53094482421875, -0.50830078125, -0.48565673828125, -0.4630126953125, -0.44036865234375, -0.417724609375, -0.39508056640625, -0.3724365234375, -0.34979248046875, -0.3271484375, -0.30450439453125, -0.2818603515625, -0.25921630859375, -0.236572265625, -0.21392822265625, -0.1912841796875, -0.16864013671875, -0.14599609375, -0.12335205078125, -0.1007080078125, -0.07806396484375, -0.055419921875, -0.03277587890625, -0.0101318359375, 0.01251220703125, 0.03515625, 0.05780029296875, 0.0804443359375, 0.10308837890625, 0.125732421875, 0.14837646484375, 0.1710205078125, 0.19366455078125, 0.21630859375, 0.23895263671875, 0.2615966796875, 0.28424072265625, 0.306884765625, 0.32952880859375, 0.3521728515625, 0.37481689453125, 0.3974609375, 0.42010498046875, 0.4427490234375, 0.46539306640625, 0.488037109375, 0.51068115234375, 0.5333251953125, 0.55596923828125, 0.57861328125, 0.60125732421875, 0.6239013671875, 0.64654541015625, 0.669189453125, 0.69183349609375, 0.7144775390625, 0.73712158203125, 0.759765625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 9.0, 4.0, 9.0, 10.0, 11.0, 10.0, 3.0, 19.0, 19.0, 14.0, 21.0, 17.0, 25.0, 30.0, 28.0, 34.0, 33.0, 54.0, 45.0, 45.0, 45.0, 1058.0, 48.0, 31.0, 39.0, 39.0, 45.0, 29.0, 30.0, 36.0, 21.0, 17.0, 31.0, 16.0, 16.0, 18.0, 14.0, 12.0, 4.0, 9.0, 8.0, 4.0, 7.0, 2.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.141326904296875, -4.01312255859375, -3.884918212890625, -3.7567138671875, -3.628509521484375, -3.50030517578125, -3.372100830078125, -3.243896484375, -3.115692138671875, -2.98748779296875, -2.859283447265625, -2.7310791015625, -2.602874755859375, -2.47467041015625, -2.346466064453125, -2.21826171875, -2.090057373046875, -1.96185302734375, -1.833648681640625, -1.7054443359375, -1.577239990234375, -1.44903564453125, -1.320831298828125, -1.192626953125, -1.064422607421875, -0.93621826171875, -0.808013916015625, -0.6798095703125, -0.551605224609375, -0.42340087890625, -0.295196533203125, -0.1669921875, -0.038787841796875, 0.08941650390625, 0.217620849609375, 0.3458251953125, 0.474029541015625, 0.60223388671875, 0.730438232421875, 0.858642578125, 0.986846923828125, 1.11505126953125, 1.243255615234375, 1.3714599609375, 1.499664306640625, 1.62786865234375, 1.756072998046875, 1.88427734375, 2.012481689453125, 2.14068603515625, 2.268890380859375, 2.3970947265625, 2.525299072265625, 2.65350341796875, 2.781707763671875, 2.909912109375, 3.038116455078125, 3.16632080078125, 3.294525146484375, 3.4227294921875, 3.550933837890625, 3.67913818359375, 3.807342529296875, 3.935546875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 9.0, 21.0, 31.0, 50.0, 135.0, 267.0, 599.0, 1294.0, 3395.0, 8666.0, 23284.0, 65670.0, 1925351.0, 42754.0, 15748.0, 5860.0, 2279.0, 906.0, 402.0, 186.0, 105.0, 47.0, 24.0, 13.0, 9.0, 4.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.297454833984375, -3.19842529296875, -3.099395751953125, -3.0003662109375, -2.901336669921875, -2.80230712890625, -2.703277587890625, -2.604248046875, -2.505218505859375, -2.40618896484375, -2.307159423828125, -2.2081298828125, -2.109100341796875, -2.01007080078125, -1.911041259765625, -1.81201171875, -1.712982177734375, -1.61395263671875, -1.514923095703125, -1.4158935546875, -1.316864013671875, -1.21783447265625, -1.118804931640625, -1.019775390625, -0.920745849609375, -0.82171630859375, -0.722686767578125, -0.6236572265625, -0.524627685546875, -0.42559814453125, -0.326568603515625, -0.2275390625, -0.128509521484375, -0.02947998046875, 0.069549560546875, 0.1685791015625, 0.267608642578125, 0.36663818359375, 0.465667724609375, 0.564697265625, 0.663726806640625, 0.76275634765625, 0.861785888671875, 0.9608154296875, 1.059844970703125, 1.15887451171875, 1.257904052734375, 1.35693359375, 1.455963134765625, 1.55499267578125, 1.654022216796875, 1.7530517578125, 1.852081298828125, 1.95111083984375, 2.050140380859375, 2.149169921875, 2.248199462890625, 2.34722900390625, 2.446258544921875, 2.5452880859375, 2.644317626953125, 2.74334716796875, 2.842376708984375, 2.94140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 5.0, 9.0, 7.0, 9.0, 17.0, 20.0, 32.0, 40.0, 49.0, 57.0, 73.0, 85.0, 107.0, 105.0, 81.0, 78.0, 46.0, 42.0, 21.0, 20.0, 10.0, 11.0, 14.0, 5.0, 8.0, 8.0, 7.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.037750244140625, -0.03660297393798828, -0.03545570373535156, -0.034308433532714844, -0.033161163330078125, -0.032013893127441406, -0.030866622924804688, -0.02971935272216797, -0.02857208251953125, -0.02742481231689453, -0.026277542114257812, -0.025130271911621094, -0.023983001708984375, -0.022835731506347656, -0.021688461303710938, -0.02054119110107422, -0.0193939208984375, -0.01824665069580078, -0.017099380493164062, -0.015952110290527344, -0.014804840087890625, -0.013657569885253906, -0.012510299682617188, -0.011363029479980469, -0.01021575927734375, -0.009068489074707031, -0.007921218872070312, -0.006773948669433594, -0.005626678466796875, -0.004479408264160156, -0.0033321380615234375, -0.0021848678588867188, -0.00103759765625, 0.00010967254638671875, 0.0012569427490234375, 0.0024042129516601562, 0.003551483154296875, 0.004698753356933594, 0.0058460235595703125, 0.006993293762207031, 0.00814056396484375, 0.009287834167480469, 0.010435104370117188, 0.011582374572753906, 0.012729644775390625, 0.013876914978027344, 0.015024185180664062, 0.01617145538330078, 0.0173187255859375, 0.01846599578857422, 0.019613265991210938, 0.020760536193847656, 0.021907806396484375, 0.023055076599121094, 0.024202346801757812, 0.02534961700439453, 0.02649688720703125, 0.02764415740966797, 0.028791427612304688, 0.029938697814941406, 0.031085968017578125, 0.032233238220214844, 0.03338050842285156, 0.03452777862548828, 0.035675048828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 7.0, 8.0, 6.0, 16.0, 10.0, 18.0, 23.0, 34.0, 45.0, 68.0, 127.0, 204.0, 652.0, 3981.0, 127735.0, 901279.0, 12316.0, 1226.0, 290.0, 149.0, 104.0, 70.0, 45.0, 34.0, 22.0, 16.0, 15.0, 7.0, 9.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.57373046875, -0.5553512573242188, -0.5369720458984375, -0.5185928344726562, -0.500213623046875, -0.48183441162109375, -0.4634552001953125, -0.44507598876953125, -0.42669677734375, -0.40831756591796875, -0.3899383544921875, -0.37155914306640625, -0.353179931640625, -0.33480072021484375, -0.3164215087890625, -0.29804229736328125, -0.2796630859375, -0.26128387451171875, -0.2429046630859375, -0.22452545166015625, -0.206146240234375, -0.18776702880859375, -0.1693878173828125, -0.15100860595703125, -0.13262939453125, -0.11425018310546875, -0.0958709716796875, -0.07749176025390625, -0.059112548828125, -0.04073333740234375, -0.0223541259765625, -0.00397491455078125, 0.014404296875, 0.03278350830078125, 0.0511627197265625, 0.06954193115234375, 0.087921142578125, 0.10630035400390625, 0.1246795654296875, 0.14305877685546875, 0.16143798828125, 0.17981719970703125, 0.1981964111328125, 0.21657562255859375, 0.234954833984375, 0.25333404541015625, 0.2717132568359375, 0.29009246826171875, 0.3084716796875, 0.32685089111328125, 0.3452301025390625, 0.36360931396484375, 0.381988525390625, 0.40036773681640625, 0.4187469482421875, 0.43712615966796875, 0.45550537109375, 0.47388458251953125, 0.4922637939453125, 0.5106430053710938, 0.529022216796875, 0.5474014282226562, 0.5657806396484375, 0.5841598510742188, 0.6025390625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 15.0, 40.0, 111.0, 302.0, 360.0, 121.0, 31.0, 18.0, 3.0, 0.0, 3.0], "bins": [-0.46202048659324646, -0.4539392292499542, -0.445857971906662, -0.43777668476104736, -0.4296954274177551, -0.4216141700744629, -0.41353291273117065, -0.4054516553878784, -0.3973703980445862, -0.38928914070129395, -0.3812078833580017, -0.3731266260147095, -0.36504533886909485, -0.3569640815258026, -0.3488828241825104, -0.34080156683921814, -0.3327202796936035, -0.3246390223503113, -0.31655776500701904, -0.3084765076637268, -0.3003952205181122, -0.29231396317481995, -0.2842327058315277, -0.2761514484882355, -0.26807019114494324, -0.259988933801651, -0.25190767645835876, -0.24382640421390533, -0.2357451468706131, -0.22766387462615967, -0.21958261728286743, -0.2115013599395752, -0.20342007279396057, -0.19533881545066833, -0.1872575432062149, -0.17917628586292267, -0.17109502851963043, -0.163013756275177, -0.15493249893188477, -0.14685124158859253, -0.1387699842453003, -0.13068872690200806, -0.12260746210813522, -0.11452619731426239, -0.10644493997097015, -0.09836367517709732, -0.09028241038322449, -0.08220115303993225, -0.07411988079547882, -0.06603861600160599, -0.05795735865831375, -0.04987609386444092, -0.04179483279585838, -0.03371357172727585, -0.025632306933403015, -0.01755104586482048, -0.009469788521528244, -0.0013885265216231346, 0.006692735478281975, 0.014773998409509659, 0.022855259478092194, 0.03093652054667473, 0.03901778534054756, 0.047099046409130096, 0.05518030747771263]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 21.0, 15.0, 16.0, 16.0, 22.0, 23.0, 21.0, 40.0, 26.0, 33.0, 33.0, 43.0, 31.0, 47.0, 49.0, 48.0, 42.0, 46.0, 32.0, 42.0, 53.0, 37.0, 34.0, 36.0, 24.0, 22.0, 24.0, 26.0, 11.0, 8.0, 9.0, 7.0, 5.0, 3.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04139822721481323, -0.0399148166179657, -0.038431402295827866, -0.03694798797369003, -0.0354645773768425, -0.033981166779994965, -0.03249775245785713, -0.03101433999836445, -0.029530927538871765, -0.02804751507937908, -0.0265641026198864, -0.025080690160393715, -0.02359727770090103, -0.022113865241408348, -0.020630452781915665, -0.01914704032242298, -0.017663627862930298, -0.016180215403437614, -0.014696802943944931, -0.013213390484452248, -0.011729978024959564, -0.01024656556546688, -0.008763153105974197, -0.007279740646481514, -0.005796328186988831, -0.004312915727496147, -0.0028295032680034637, -0.0013460908085107803, 0.00013732165098190308, 0.0016207341104745865, 0.00310414656996727, 0.004587559029459953, 0.006070971488952637, 0.00755438394844532, 0.009037796407938004, 0.010521208867430687, 0.01200462132692337, 0.013488033786416054, 0.014971446245908737, 0.01645485870540142, 0.017938271164894104, 0.019421683624386787, 0.02090509608387947, 0.022388508543372154, 0.023871921002864838, 0.02535533346235752, 0.026838745921850204, 0.028322158381342888, 0.02980557084083557, 0.031288981437683105, 0.03277239575982094, 0.03425581008195877, 0.035739220678806305, 0.03722263127565384, 0.03870604559779167, 0.040189459919929504, 0.04167287051677704, 0.04315628111362457, 0.044639695435762405, 0.04612310975790024, 0.04760652035474777, 0.049089930951595306, 0.05057334527373314, 0.05205675959587097, 0.053540170192718506]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 9.0, 8.0, 9.0, 13.0, 11.0, 17.0, 21.0, 20.0, 29.0, 17.0, 19.0, 33.0, 23.0, 34.0, 25.0, 22.0, 39.0, 44.0, 39.0, 39.0, 34.0, 38.0, 41.0, 44.0, 33.0, 40.0, 37.0, 33.0, 29.0, 25.0, 19.0, 21.0, 27.0, 15.0, 12.0, 13.0, 13.0, 8.0, 9.0, 9.0, 5.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.87890625, -3.74224853515625, -3.6055908203125, -3.46893310546875, -3.332275390625, -3.19561767578125, -3.0589599609375, -2.92230224609375, -2.78564453125, -2.64898681640625, -2.5123291015625, -2.37567138671875, -2.239013671875, -2.10235595703125, -1.9656982421875, -1.82904052734375, -1.6923828125, -1.55572509765625, -1.4190673828125, -1.28240966796875, -1.145751953125, -1.00909423828125, -0.8724365234375, -0.73577880859375, -0.59912109375, -0.46246337890625, -0.3258056640625, -0.18914794921875, -0.052490234375, 0.08416748046875, 0.2208251953125, 0.35748291015625, 0.494140625, 0.63079833984375, 0.7674560546875, 0.90411376953125, 1.040771484375, 1.17742919921875, 1.3140869140625, 1.45074462890625, 1.58740234375, 1.72406005859375, 1.8607177734375, 1.99737548828125, 2.134033203125, 2.27069091796875, 2.4073486328125, 2.54400634765625, 2.6806640625, 2.81732177734375, 2.9539794921875, 3.09063720703125, 3.227294921875, 3.36395263671875, 3.5006103515625, 3.63726806640625, 3.77392578125, 3.91058349609375, 4.0472412109375, 4.18389892578125, 4.320556640625, 4.45721435546875, 4.5938720703125, 4.73052978515625, 4.8671875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 10.0, 12.0, 32.0, 43.0, 97.0, 180.0, 390.0, 769.0, 1680.0, 3398.0, 7132.0, 14978.0, 31606.0, 63481.0, 127393.0, 237013.0, 263546.0, 149889.0, 75037.0, 37179.0, 18090.0, 8669.0, 4159.0, 1932.0, 896.0, 442.0, 233.0, 139.0, 64.0, 24.0, 18.0, 12.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.4649658203125, -6.269775390625, -6.0745849609375, -5.87939453125, -5.6842041015625, -5.489013671875, -5.2938232421875, -5.0986328125, -4.9034423828125, -4.708251953125, -4.5130615234375, -4.31787109375, -4.1226806640625, -3.927490234375, -3.7322998046875, -3.537109375, -3.3419189453125, -3.146728515625, -2.9515380859375, -2.75634765625, -2.5611572265625, -2.365966796875, -2.1707763671875, -1.9755859375, -1.7803955078125, -1.585205078125, -1.3900146484375, -1.19482421875, -0.9996337890625, -0.804443359375, -0.6092529296875, -0.4140625, -0.2188720703125, -0.023681640625, 0.1715087890625, 0.36669921875, 0.5618896484375, 0.757080078125, 0.9522705078125, 1.1474609375, 1.3426513671875, 1.537841796875, 1.7330322265625, 1.92822265625, 2.1234130859375, 2.318603515625, 2.5137939453125, 2.708984375, 2.9041748046875, 3.099365234375, 3.2945556640625, 3.48974609375, 3.6849365234375, 3.880126953125, 4.0753173828125, 4.2705078125, 4.4656982421875, 4.660888671875, 4.8560791015625, 5.05126953125, 5.2464599609375, 5.441650390625, 5.6368408203125, 5.83203125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 10.0, 9.0, 12.0, 18.0, 14.0, 19.0, 29.0, 32.0, 30.0, 53.0, 46.0, 68.0, 90.0, 146.0, 246.0, 1374.0, 225.0, 154.0, 81.0, 73.0, 35.0, 55.0, 46.0, 35.0, 25.0, 24.0, 16.0, 13.0, 14.0, 6.0, 11.0, 7.0, 7.0, 5.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.822509765625, -20.16064453125, -19.498779296875, -18.8369140625, -18.175048828125, -17.51318359375, -16.851318359375, -16.189453125, -15.527587890625, -14.86572265625, -14.203857421875, -13.5419921875, -12.880126953125, -12.21826171875, -11.556396484375, -10.89453125, -10.232666015625, -9.57080078125, -8.908935546875, -8.2470703125, -7.585205078125, -6.92333984375, -6.261474609375, -5.599609375, -4.937744140625, -4.27587890625, -3.614013671875, -2.9521484375, -2.290283203125, -1.62841796875, -0.966552734375, -0.3046875, 0.357177734375, 1.01904296875, 1.680908203125, 2.3427734375, 3.004638671875, 3.66650390625, 4.328369140625, 4.990234375, 5.652099609375, 6.31396484375, 6.975830078125, 7.6376953125, 8.299560546875, 8.96142578125, 9.623291015625, 10.28515625, 10.947021484375, 11.60888671875, 12.270751953125, 12.9326171875, 13.594482421875, 14.25634765625, 14.918212890625, 15.580078125, 16.241943359375, 16.90380859375, 17.565673828125, 18.2275390625, 18.889404296875, 19.55126953125, 20.213134765625, 20.875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 10.0, 12.0, 7.0, 21.0, 20.0, 34.0, 30.0, 37.0, 55.0, 91.0, 124.0, 169.0, 259.0, 461.0, 910.0, 7613.0, 823477.0, 2291602.0, 18175.0, 1179.0, 487.0, 288.0, 179.0, 125.0, 115.0, 60.0, 39.0, 37.0, 22.0, 14.0, 16.0, 10.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.44287109375, -34.1357421875, -32.82861328125, -31.521484375, -30.21435546875, -28.9072265625, -27.60009765625, -26.29296875, -24.98583984375, -23.6787109375, -22.37158203125, -21.064453125, -19.75732421875, -18.4501953125, -17.14306640625, -15.8359375, -14.52880859375, -13.2216796875, -11.91455078125, -10.607421875, -9.30029296875, -7.9931640625, -6.68603515625, -5.37890625, -4.07177734375, -2.7646484375, -1.45751953125, -0.150390625, 1.15673828125, 2.4638671875, 3.77099609375, 5.078125, 6.38525390625, 7.6923828125, 8.99951171875, 10.306640625, 11.61376953125, 12.9208984375, 14.22802734375, 15.53515625, 16.84228515625, 18.1494140625, 19.45654296875, 20.763671875, 22.07080078125, 23.3779296875, 24.68505859375, 25.9921875, 27.29931640625, 28.6064453125, 29.91357421875, 31.220703125, 32.52783203125, 33.8349609375, 35.14208984375, 36.44921875, 37.75634765625, 39.0634765625, 40.37060546875, 41.677734375, 42.98486328125, 44.2919921875, 45.59912109375, 46.90625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 28.0, 121.0, 241.0, 347.0, 195.0, 65.0, 14.0, 3.0], "bins": [-207.34788513183594, -203.84934997558594, -200.350830078125, -196.852294921875, -193.353759765625, -189.85523986816406, -186.35670471191406, -182.85818481445312, -179.35964965820312, -175.86111450195312, -172.3625946044922, -168.8640594482422, -165.36553955078125, -161.86700439453125, -158.36846923828125, -154.8699493408203, -151.3714141845703, -147.8728790283203, -144.37435913085938, -140.87582397460938, -137.37728881835938, -133.87876892089844, -130.38023376464844, -126.88170623779297, -123.3831787109375, -119.88465118408203, -116.38612365722656, -112.88758850097656, -109.3890609741211, -105.89053344726562, -102.39199829101562, -98.89347076416016, -95.39494323730469, -91.89641571044922, -88.39788818359375, -84.89935302734375, -81.40082550048828, -77.90229797363281, -74.40376281738281, -70.90523529052734, -67.40670776367188, -63.908180236816406, -60.40964889526367, -56.91111755371094, -53.41259002685547, -49.9140625, -46.415531158447266, -42.91699981689453, -39.41847229003906, -35.919944763183594, -32.42141342163086, -28.922883987426758, -25.424354553222656, -21.925825119018555, -18.427295684814453, -14.928766250610352, -11.430238723754883, -7.931709289550781, -4.43317985534668, -0.9346504211425781, 2.5638790130615234, 6.062408447265625, 9.560937881469727, 13.059467315673828, 16.55799674987793]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 12.0, 10.0, 8.0, 13.0, 19.0, 23.0, 20.0, 32.0, 26.0, 32.0, 27.0, 35.0, 29.0, 32.0, 34.0, 33.0, 29.0, 42.0, 37.0, 41.0, 36.0, 36.0, 30.0, 39.0, 38.0, 30.0, 32.0, 26.0, 27.0, 21.0, 15.0, 19.0, 9.0, 11.0, 7.0, 17.0, 8.0, 13.0, 3.0, 8.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-39.865333557128906, -38.57297134399414, -37.280609130859375, -35.98824691772461, -34.695884704589844, -33.40351867675781, -32.11115646362305, -30.81879425048828, -29.526432037353516, -28.23406982421875, -26.941707611083984, -25.649343490600586, -24.35698127746582, -23.064619064331055, -21.772254943847656, -20.47989273071289, -19.187530517578125, -17.89516830444336, -16.602806091308594, -15.310441970825195, -14.01807975769043, -12.725717544555664, -11.433354377746582, -10.1409912109375, -8.848628997802734, -7.5562663078308105, -6.263903617858887, -4.971540927886963, -3.679178237915039, -2.3868155479431152, -1.0944528579711914, 0.19791030883789062, 1.4902687072753906, 2.7826313972473145, 4.074994087219238, 5.367356777191162, 6.659719467163086, 7.95208215713501, 9.244444847106934, 10.536808013916016, 11.829170227050781, 13.121532440185547, 14.413895606994629, 15.706258773803711, 16.998620986938477, 18.290983200073242, 19.58334732055664, 20.875709533691406, 22.168071746826172, 23.460433959960938, 24.752796173095703, 26.0451602935791, 27.337522506713867, 28.629884719848633, 29.92224884033203, 31.214611053466797, 32.50697326660156, 33.79933547973633, 35.091697692871094, 36.38405990600586, 37.676422119140625, 38.968788146972656, 40.26115036010742, 41.55351257324219, 42.84587478637695]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 15.0, 6.0, 13.0, 12.0, 12.0, 22.0, 20.0, 23.0, 26.0, 23.0, 20.0, 30.0, 21.0, 31.0, 38.0, 31.0, 36.0, 37.0, 43.0, 24.0, 32.0, 35.0, 44.0, 31.0, 34.0, 33.0, 24.0, 19.0, 23.0, 23.0, 33.0, 28.0, 15.0, 22.0, 21.0, 10.0, 12.0, 10.0, 8.0, 7.0, 7.0, 7.0, 3.0, 7.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-4.2265625, -4.0892333984375, -3.951904296875, -3.8145751953125, -3.67724609375, -3.5399169921875, -3.402587890625, -3.2652587890625, -3.1279296875, -2.9906005859375, -2.853271484375, -2.7159423828125, -2.57861328125, -2.4412841796875, -2.303955078125, -2.1666259765625, -2.029296875, -1.8919677734375, -1.754638671875, -1.6173095703125, -1.47998046875, -1.3426513671875, -1.205322265625, -1.0679931640625, -0.9306640625, -0.7933349609375, -0.656005859375, -0.5186767578125, -0.38134765625, -0.2440185546875, -0.106689453125, 0.0306396484375, 0.16796875, 0.3052978515625, 0.442626953125, 0.5799560546875, 0.71728515625, 0.8546142578125, 0.991943359375, 1.1292724609375, 1.2666015625, 1.4039306640625, 1.541259765625, 1.6785888671875, 1.81591796875, 1.9532470703125, 2.090576171875, 2.2279052734375, 2.365234375, 2.5025634765625, 2.639892578125, 2.7772216796875, 2.91455078125, 3.0518798828125, 3.189208984375, 3.3265380859375, 3.4638671875, 3.6011962890625, 3.738525390625, 3.8758544921875, 4.01318359375, 4.1505126953125, 4.287841796875, 4.4251708984375, 4.5625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 11.0, 6.0, 8.0, 6.0, 7.0, 12.0, 14.0, 22.0, 20.0, 26.0, 23.0, 31.0, 55.0, 87.0, 125.0, 270.0, 581.0, 1832.0, 7178.0, 40139.0, 264265.0, 1480605.0, 1911293.0, 411441.0, 61748.0, 10515.0, 2428.0, 708.0, 270.0, 139.0, 119.0, 65.0, 57.0, 37.0, 33.0, 17.0, 16.0, 13.0, 8.0, 12.0, 6.0, 6.0, 4.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0], "bins": [-11.6171875, -11.2554931640625, -10.893798828125, -10.5321044921875, -10.17041015625, -9.8087158203125, -9.447021484375, -9.0853271484375, -8.7236328125, -8.3619384765625, -8.000244140625, -7.6385498046875, -7.27685546875, -6.9151611328125, -6.553466796875, -6.1917724609375, -5.830078125, -5.4683837890625, -5.106689453125, -4.7449951171875, -4.38330078125, -4.0216064453125, -3.659912109375, -3.2982177734375, -2.9365234375, -2.5748291015625, -2.213134765625, -1.8514404296875, -1.48974609375, -1.1280517578125, -0.766357421875, -0.4046630859375, -0.04296875, 0.3187255859375, 0.680419921875, 1.0421142578125, 1.40380859375, 1.7655029296875, 2.127197265625, 2.4888916015625, 2.8505859375, 3.2122802734375, 3.573974609375, 3.9356689453125, 4.29736328125, 4.6590576171875, 5.020751953125, 5.3824462890625, 5.744140625, 6.1058349609375, 6.467529296875, 6.8292236328125, 7.19091796875, 7.5526123046875, 7.914306640625, 8.2760009765625, 8.6376953125, 8.9993896484375, 9.361083984375, 9.7227783203125, 10.08447265625, 10.4461669921875, 10.807861328125, 11.1695556640625, 11.53125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 6.0, 5.0, 14.0, 5.0, 6.0, 14.0, 20.0, 19.0, 15.0, 26.0, 36.0, 46.0, 65.0, 65.0, 92.0, 118.0, 122.0, 175.0, 189.0, 258.0, 313.0, 322.0, 315.0, 282.0, 306.0, 265.0, 202.0, 153.0, 123.0, 105.0, 96.0, 74.0, 61.0, 36.0, 26.0, 23.0, 18.0, 14.0, 15.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.88763427734375, -6.6151123046875, -6.34259033203125, -6.070068359375, -5.79754638671875, -5.5250244140625, -5.25250244140625, -4.97998046875, -4.70745849609375, -4.4349365234375, -4.16241455078125, -3.889892578125, -3.61737060546875, -3.3448486328125, -3.07232666015625, -2.7998046875, -2.52728271484375, -2.2547607421875, -1.98223876953125, -1.709716796875, -1.43719482421875, -1.1646728515625, -0.89215087890625, -0.61962890625, -0.34710693359375, -0.0745849609375, 0.19793701171875, 0.470458984375, 0.74298095703125, 1.0155029296875, 1.28802490234375, 1.560546875, 1.83306884765625, 2.1055908203125, 2.37811279296875, 2.650634765625, 2.92315673828125, 3.1956787109375, 3.46820068359375, 3.74072265625, 4.01324462890625, 4.2857666015625, 4.55828857421875, 4.830810546875, 5.10333251953125, 5.3758544921875, 5.64837646484375, 5.9208984375, 6.19342041015625, 6.4659423828125, 6.73846435546875, 7.010986328125, 7.28350830078125, 7.5560302734375, 7.82855224609375, 8.10107421875, 8.37359619140625, 8.6461181640625, 8.91864013671875, 9.191162109375, 9.46368408203125, 9.7362060546875, 10.00872802734375, 10.28125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 6.0, 5.0, 7.0, 10.0, 17.0, 18.0, 23.0, 24.0, 35.0, 47.0, 66.0, 106.0, 137.0, 174.0, 289.0, 492.0, 1341.0, 6302.0, 47288.0, 423589.0, 2336191.0, 1211454.0, 145337.0, 16603.0, 2753.0, 797.0, 338.0, 215.0, 150.0, 104.0, 81.0, 62.0, 51.0, 29.0, 31.0, 19.0, 19.0, 18.0, 14.0, 6.0, 11.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0], "bins": [-20.890625, -20.322265625, -19.75390625, -19.185546875, -18.6171875, -18.048828125, -17.48046875, -16.912109375, -16.34375, -15.775390625, -15.20703125, -14.638671875, -14.0703125, -13.501953125, -12.93359375, -12.365234375, -11.796875, -11.228515625, -10.66015625, -10.091796875, -9.5234375, -8.955078125, -8.38671875, -7.818359375, -7.25, -6.681640625, -6.11328125, -5.544921875, -4.9765625, -4.408203125, -3.83984375, -3.271484375, -2.703125, -2.134765625, -1.56640625, -0.998046875, -0.4296875, 0.138671875, 0.70703125, 1.275390625, 1.84375, 2.412109375, 2.98046875, 3.548828125, 4.1171875, 4.685546875, 5.25390625, 5.822265625, 6.390625, 6.958984375, 7.52734375, 8.095703125, 8.6640625, 9.232421875, 9.80078125, 10.369140625, 10.9375, 11.505859375, 12.07421875, 12.642578125, 13.2109375, 13.779296875, 14.34765625, 14.916015625, 15.484375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 13.0, 30.0, 57.0, 87.0, 123.0, 151.0, 158.0, 151.0, 102.0, 70.0, 30.0, 17.0, 10.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.0468521118164, -81.44014739990234, -78.83345031738281, -76.22674560546875, -73.62004852294922, -71.01334381103516, -68.40664672851562, -65.79994201660156, -63.193241119384766, -60.58654022216797, -57.97983932495117, -55.373138427734375, -52.76643371582031, -50.15973663330078, -47.55303192138672, -44.94633102416992, -42.339630126953125, -39.73292922973633, -37.12622833251953, -34.519527435302734, -31.912824630737305, -29.306123733520508, -26.699420928955078, -24.09272003173828, -21.486019134521484, -18.879318237304688, -16.27261734008789, -13.665914535522461, -11.059213638305664, -8.452512741088867, -5.845810890197754, -3.2391090393066406, -0.632415771484375, 1.97428560256958, 4.580986976623535, 7.18768835067749, 9.794389724731445, 12.401090621948242, 15.007792472839355, 17.61449432373047, 20.221195220947266, 22.827896118164062, 25.43459701538086, 28.04129981994629, 30.648000717163086, 33.25469970703125, 35.86140441894531, 38.46810531616211, 41.074806213378906, 43.6815071105957, 46.2882080078125, 48.8949089050293, 51.501609802246094, 54.108314514160156, 56.71501541137695, 59.32171630859375, 61.92841720581055, 64.53511810302734, 67.1418228149414, 69.74851989746094, 72.355224609375, 74.96192169189453, 77.5686264038086, 80.17532348632812, 82.78202819824219]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 9.0, 4.0, 5.0, 6.0, 6.0, 3.0, 9.0, 11.0, 11.0, 10.0, 11.0, 18.0, 24.0, 22.0, 22.0, 20.0, 31.0, 29.0, 31.0, 36.0, 39.0, 36.0, 42.0, 46.0, 39.0, 37.0, 44.0, 35.0, 33.0, 24.0, 38.0, 34.0, 32.0, 23.0, 15.0, 27.0, 21.0, 18.0, 16.0, 23.0, 10.0, 14.0, 10.0, 16.0, 6.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-34.61216354370117, -33.53287124633789, -32.453582763671875, -31.374290466308594, -30.295000076293945, -29.215709686279297, -28.136417388916016, -27.057126998901367, -25.97783660888672, -24.89854621887207, -23.81925392150879, -22.73996353149414, -21.660673141479492, -20.581382751464844, -19.502090454101562, -18.422800064086914, -17.343507766723633, -16.264217376708984, -15.18492603302002, -14.105634689331055, -13.026344299316406, -11.947052955627441, -10.867761611938477, -9.788471221923828, -8.709179878234863, -7.629889011383057, -6.55059814453125, -5.471306800842285, -4.3920159339904785, -3.312725067138672, -2.233433723449707, -1.1541428565979004, -0.07485198974609375, 1.0044389963150024, 2.0837299823760986, 3.1630210876464844, 4.242311954498291, 5.321602821350098, 6.4008941650390625, 7.480185031890869, 8.559475898742676, 9.63876724243164, 10.718057632446289, 11.797348976135254, 12.876640319824219, 13.955930709838867, 15.035222053527832, 16.114513397216797, 17.193803787231445, 18.273094177246094, 19.352386474609375, 20.431676864624023, 21.510967254638672, 22.590259552001953, 23.6695499420166, 24.74884033203125, 25.82813262939453, 26.90742301940918, 27.98671531677246, 29.06600570678711, 30.145296096801758, 31.224586486816406, 32.30387878417969, 33.38317108154297, 34.462459564208984]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 5.0, 7.0, 7.0, 10.0, 8.0, 11.0, 12.0, 17.0, 20.0, 23.0, 19.0, 28.0, 32.0, 35.0, 37.0, 30.0, 39.0, 48.0, 47.0, 47.0, 39.0, 43.0, 48.0, 36.0, 39.0, 28.0, 28.0, 28.0, 21.0, 30.0, 20.0, 25.0, 21.0, 23.0, 12.0, 15.0, 15.0, 11.0, 6.0, 4.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.0247802734375, -3.873779296875, -3.7227783203125, -3.57177734375, -3.4207763671875, -3.269775390625, -3.1187744140625, -2.9677734375, -2.8167724609375, -2.665771484375, -2.5147705078125, -2.36376953125, -2.2127685546875, -2.061767578125, -1.9107666015625, -1.759765625, -1.6087646484375, -1.457763671875, -1.3067626953125, -1.15576171875, -1.0047607421875, -0.853759765625, -0.7027587890625, -0.5517578125, -0.4007568359375, -0.249755859375, -0.0987548828125, 0.05224609375, 0.2032470703125, 0.354248046875, 0.5052490234375, 0.65625, 0.8072509765625, 0.958251953125, 1.1092529296875, 1.26025390625, 1.4112548828125, 1.562255859375, 1.7132568359375, 1.8642578125, 2.0152587890625, 2.166259765625, 2.3172607421875, 2.46826171875, 2.6192626953125, 2.770263671875, 2.9212646484375, 3.072265625, 3.2232666015625, 3.374267578125, 3.5252685546875, 3.67626953125, 3.8272705078125, 3.978271484375, 4.1292724609375, 4.2802734375, 4.4312744140625, 4.582275390625, 4.7332763671875, 4.88427734375, 5.0352783203125, 5.186279296875, 5.3372802734375, 5.48828125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 11.0, 28.0, 36.0, 54.0, 80.0, 148.0, 262.0, 360.0, 570.0, 989.0, 1620.0, 2598.0, 4227.0, 6716.0, 10878.0, 16983.0, 26142.0, 39157.0, 56136.0, 77007.0, 99901.0, 118873.0, 127278.0, 118785.0, 98288.0, 76518.0, 55257.0, 38404.0, 26134.0, 16718.0, 10655.0, 6760.0, 4129.0, 2677.0, 1563.0, 1015.0, 610.0, 377.0, 244.0, 138.0, 71.0, 54.0, 42.0, 19.0, 13.0, 10.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82421875, -0.7962646484375, -0.768310546875, -0.7403564453125, -0.71240234375, -0.6844482421875, -0.656494140625, -0.6285400390625, -0.6005859375, -0.5726318359375, -0.544677734375, -0.5167236328125, -0.48876953125, -0.4608154296875, -0.432861328125, -0.4049072265625, -0.376953125, -0.3489990234375, -0.321044921875, -0.2930908203125, -0.26513671875, -0.2371826171875, -0.209228515625, -0.1812744140625, -0.1533203125, -0.1253662109375, -0.097412109375, -0.0694580078125, -0.04150390625, -0.0135498046875, 0.014404296875, 0.0423583984375, 0.0703125, 0.0982666015625, 0.126220703125, 0.1541748046875, 0.18212890625, 0.2100830078125, 0.238037109375, 0.2659912109375, 0.2939453125, 0.3218994140625, 0.349853515625, 0.3778076171875, 0.40576171875, 0.4337158203125, 0.461669921875, 0.4896240234375, 0.517578125, 0.5455322265625, 0.573486328125, 0.6014404296875, 0.62939453125, 0.6573486328125, 0.685302734375, 0.7132568359375, 0.7412109375, 0.7691650390625, 0.797119140625, 0.8250732421875, 0.85302734375, 0.8809814453125, 0.908935546875, 0.9368896484375, 0.96484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 10.0, 8.0, 8.0, 15.0, 16.0, 22.0, 25.0, 23.0, 23.0, 24.0, 36.0, 38.0, 37.0, 39.0, 28.0, 49.0, 39.0, 1071.0, 45.0, 53.0, 37.0, 47.0, 34.0, 35.0, 27.0, 31.0, 32.0, 18.0, 25.0, 23.0, 20.0, 11.0, 11.0, 6.0, 10.0, 15.0, 7.0, 11.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.51171875, -4.37469482421875, -4.2376708984375, -4.10064697265625, -3.963623046875, -3.82659912109375, -3.6895751953125, -3.55255126953125, -3.41552734375, -3.27850341796875, -3.1414794921875, -3.00445556640625, -2.867431640625, -2.73040771484375, -2.5933837890625, -2.45635986328125, -2.3193359375, -2.18231201171875, -2.0452880859375, -1.90826416015625, -1.771240234375, -1.63421630859375, -1.4971923828125, -1.36016845703125, -1.22314453125, -1.08612060546875, -0.9490966796875, -0.81207275390625, -0.675048828125, -0.53802490234375, -0.4010009765625, -0.26397705078125, -0.126953125, 0.01007080078125, 0.1470947265625, 0.28411865234375, 0.421142578125, 0.55816650390625, 0.6951904296875, 0.83221435546875, 0.96923828125, 1.10626220703125, 1.2432861328125, 1.38031005859375, 1.517333984375, 1.65435791015625, 1.7913818359375, 1.92840576171875, 2.0654296875, 2.20245361328125, 2.3394775390625, 2.47650146484375, 2.613525390625, 2.75054931640625, 2.8875732421875, 3.02459716796875, 3.16162109375, 3.29864501953125, 3.4356689453125, 3.57269287109375, 3.709716796875, 3.84674072265625, 3.9837646484375, 4.12078857421875, 4.2578125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 14.0, 7.0, 21.0, 39.0, 64.0, 79.0, 105.0, 174.0, 350.0, 552.0, 950.0, 1509.0, 2612.0, 4528.0, 7880.0, 13778.0, 24034.0, 44553.0, 1888848.0, 47245.0, 25443.0, 14606.0, 8300.0, 4822.0, 2713.0, 1565.0, 906.0, 546.0, 342.0, 203.0, 116.0, 67.0, 51.0, 36.0, 21.0, 15.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8525390625, -1.7918853759765625, -1.731231689453125, -1.6705780029296875, -1.60992431640625, -1.5492706298828125, -1.488616943359375, -1.4279632568359375, -1.3673095703125, -1.3066558837890625, -1.246002197265625, -1.1853485107421875, -1.12469482421875, -1.0640411376953125, -1.003387451171875, -0.9427337646484375, -0.882080078125, -0.8214263916015625, -0.760772705078125, -0.7001190185546875, -0.63946533203125, -0.5788116455078125, -0.518157958984375, -0.4575042724609375, -0.3968505859375, -0.3361968994140625, -0.275543212890625, -0.2148895263671875, -0.15423583984375, -0.0935821533203125, -0.032928466796875, 0.0277252197265625, 0.08837890625, 0.1490325927734375, 0.209686279296875, 0.2703399658203125, 0.33099365234375, 0.3916473388671875, 0.452301025390625, 0.5129547119140625, 0.5736083984375, 0.6342620849609375, 0.694915771484375, 0.7555694580078125, 0.81622314453125, 0.8768768310546875, 0.937530517578125, 0.9981842041015625, 1.058837890625, 1.1194915771484375, 1.180145263671875, 1.2407989501953125, 1.30145263671875, 1.3621063232421875, 1.422760009765625, 1.4834136962890625, 1.5440673828125, 1.6047210693359375, 1.665374755859375, 1.7260284423828125, 1.78668212890625, 1.8473358154296875, 1.907989501953125, 1.9686431884765625, 2.029296875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 15.0, 9.0, 8.0, 22.0, 39.0, 59.0, 107.0, 161.0, 172.0, 151.0, 76.0, 54.0, 42.0, 21.0, 15.0, 4.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0709228515625, -0.06866264343261719, -0.06640243530273438, -0.06414222717285156, -0.06188201904296875, -0.05962181091308594, -0.057361602783203125, -0.05510139465332031, -0.0528411865234375, -0.05058097839355469, -0.048320770263671875, -0.04606056213378906, -0.04380035400390625, -0.04154014587402344, -0.039279937744140625, -0.03701972961425781, -0.034759521484375, -0.03249931335449219, -0.030239105224609375, -0.027978897094726562, -0.02571868896484375, -0.023458480834960938, -0.021198272705078125, -0.018938064575195312, -0.0166778564453125, -0.014417648315429688, -0.012157440185546875, -0.009897232055664062, -0.00763702392578125, -0.0053768157958984375, -0.003116607666015625, -0.0008563995361328125, 0.00140380859375, 0.0036640167236328125, 0.005924224853515625, 0.008184432983398438, 0.01044464111328125, 0.012704849243164062, 0.014965057373046875, 0.017225265502929688, 0.0194854736328125, 0.021745681762695312, 0.024005889892578125, 0.026266098022460938, 0.02852630615234375, 0.030786514282226562, 0.033046722412109375, 0.03530693054199219, 0.037567138671875, 0.03982734680175781, 0.042087554931640625, 0.04434776306152344, 0.04660797119140625, 0.04886817932128906, 0.051128387451171875, 0.05338859558105469, 0.0556488037109375, 0.05790901184082031, 0.060169219970703125, 0.06242942810058594, 0.06468963623046875, 0.06694984436035156, 0.06921005249023438, 0.07147026062011719, 0.07373046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 6.0, 17.0, 18.0, 42.0, 83.0, 130.0, 378.0, 1041.0, 4151.0, 124039.0, 910017.0, 6237.0, 1492.0, 467.0, 175.0, 78.0, 41.0, 27.0, 19.0, 13.0, 16.0, 11.0, 4.0, 3.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.9924468994140625, -0.959503173828125, -0.9265594482421875, -0.89361572265625, -0.8606719970703125, -0.827728271484375, -0.7947845458984375, -0.7618408203125, -0.7288970947265625, -0.695953369140625, -0.6630096435546875, -0.63006591796875, -0.5971221923828125, -0.564178466796875, -0.5312347412109375, -0.498291015625, -0.4653472900390625, -0.432403564453125, -0.3994598388671875, -0.36651611328125, -0.3335723876953125, -0.300628662109375, -0.2676849365234375, -0.2347412109375, -0.2017974853515625, -0.168853759765625, -0.1359100341796875, -0.10296630859375, -0.0700225830078125, -0.037078857421875, -0.0041351318359375, 0.02880859375, 0.0617523193359375, 0.094696044921875, 0.1276397705078125, 0.16058349609375, 0.1935272216796875, 0.226470947265625, 0.2594146728515625, 0.2923583984375, 0.3253021240234375, 0.358245849609375, 0.3911895751953125, 0.42413330078125, 0.4570770263671875, 0.490020751953125, 0.5229644775390625, 0.555908203125, 0.5888519287109375, 0.621795654296875, 0.6547393798828125, 0.68768310546875, 0.7206268310546875, 0.753570556640625, 0.7865142822265625, 0.8194580078125, 0.8524017333984375, 0.885345458984375, 0.9182891845703125, 0.95123291015625, 0.9841766357421875, 1.017120361328125, 1.0500640869140625, 1.0830078125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 26.0, 63.0, 228.0, 446.0, 180.0, 34.0, 20.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.7210639119148254, -0.7082905769348145, -0.6955171823501587, -0.6827438473701477, -0.6699704527854919, -0.657197117805481, -0.6444237232208252, -0.6316503882408142, -0.6188770532608032, -0.6061037182807922, -0.5933303236961365, -0.5805569887161255, -0.5677835941314697, -0.5550102591514587, -0.542236864566803, -0.529463529586792, -0.5166901350021362, -0.5039168000221252, -0.4911434054374695, -0.4783700406551361, -0.46559667587280273, -0.45282334089279175, -0.4400499761104584, -0.427276611328125, -0.4145032465457916, -0.40172988176345825, -0.3889565169811249, -0.3761831521987915, -0.3634098172187805, -0.35063642263412476, -0.33786308765411377, -0.3250897228717804, -0.312316358089447, -0.29954299330711365, -0.2867696285247803, -0.2739962637424469, -0.2612228989601135, -0.24844954907894135, -0.23567619919776917, -0.2229028344154358, -0.21012945473194122, -0.19735608994960785, -0.18458274006843567, -0.1718093752861023, -0.15903601050376892, -0.14626264572143555, -0.13348928093910217, -0.12071593105792999, -0.10794256627559662, -0.09516920149326324, -0.08239584416151047, -0.06962248682975769, -0.056849122047424316, -0.04407575726509094, -0.031302399933338165, -0.018529042601585388, -0.005755677819252014, 0.007017683237791061, 0.019791044294834137, 0.03256440535187721, 0.04533776640892029, 0.05811113119125366, 0.07088448852300644, 0.08365784585475922, 0.09643121063709259]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 7.0, 14.0, 4.0, 14.0, 6.0, 7.0, 6.0, 18.0, 16.0, 16.0, 14.0, 25.0, 27.0, 25.0, 17.0, 25.0, 35.0, 60.0, 45.0, 33.0, 32.0, 35.0, 45.0, 37.0, 38.0, 35.0, 34.0, 43.0, 28.0, 29.0, 32.0, 26.0, 28.0, 18.0, 9.0, 15.0, 15.0, 11.0, 10.0, 11.0, 11.0, 5.0, 7.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.060170531272888184, -0.05826113373041153, -0.056351736187934875, -0.05444234237074852, -0.052532944828271866, -0.05062354728579521, -0.048714153468608856, -0.0468047559261322, -0.04489535838365555, -0.042985960841178894, -0.04107656329870224, -0.039167169481515884, -0.03725777193903923, -0.035348374396562576, -0.03343898057937622, -0.03152958303689957, -0.029620185494422913, -0.02771078795194626, -0.025801392272114754, -0.02389199659228325, -0.021982599049806595, -0.02007320150732994, -0.018163805827498436, -0.01625441014766693, -0.014345012605190277, -0.012435615994036198, -0.010526219382882118, -0.008616822771728039, -0.006707426160573959, -0.00479802954941988, -0.0028886329382658005, -0.000979236327111721, 0.0009301602840423584, 0.002839556895196438, 0.004748953506350517, 0.006658350117504597, 0.008567746728658676, 0.010477143339812756, 0.012386539950966835, 0.014295936562120914, 0.016205333173274994, 0.018114730715751648, 0.020024126395583153, 0.021933522075414658, 0.02384291961789131, 0.025752317160367966, 0.02766171284019947, 0.029571108520030975, 0.03148050606250763, 0.03338990360498428, 0.03529930114746094, 0.03720869496464729, 0.03911809250712395, 0.0410274900496006, 0.04293688386678696, 0.04484628140926361, 0.046755678951740265, 0.04866507649421692, 0.05057447403669357, 0.05248386785387993, 0.05439326539635658, 0.05630266293883324, 0.05821205675601959, 0.060121454298496246, 0.0620308518409729]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 10.0, 7.0, 10.0, 16.0, 23.0, 16.0, 24.0, 21.0, 31.0, 25.0, 27.0, 28.0, 39.0, 38.0, 35.0, 55.0, 49.0, 53.0, 42.0, 36.0, 38.0, 32.0, 38.0, 30.0, 33.0, 26.0, 21.0, 25.0, 24.0, 24.0, 25.0, 20.0, 14.0, 13.0, 7.0, 8.0, 4.0, 4.0, 4.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.3746337890625, -4.218017578125, -4.0614013671875, -3.90478515625, -3.7481689453125, -3.591552734375, -3.4349365234375, -3.2783203125, -3.1217041015625, -2.965087890625, -2.8084716796875, -2.65185546875, -2.4952392578125, -2.338623046875, -2.1820068359375, -2.025390625, -1.8687744140625, -1.712158203125, -1.5555419921875, -1.39892578125, -1.2423095703125, -1.085693359375, -0.9290771484375, -0.7724609375, -0.6158447265625, -0.459228515625, -0.3026123046875, -0.14599609375, 0.0106201171875, 0.167236328125, 0.3238525390625, 0.48046875, 0.6370849609375, 0.793701171875, 0.9503173828125, 1.10693359375, 1.2635498046875, 1.420166015625, 1.5767822265625, 1.7333984375, 1.8900146484375, 2.046630859375, 2.2032470703125, 2.35986328125, 2.5164794921875, 2.673095703125, 2.8297119140625, 2.986328125, 3.1429443359375, 3.299560546875, 3.4561767578125, 3.61279296875, 3.7694091796875, 3.926025390625, 4.0826416015625, 4.2392578125, 4.3958740234375, 4.552490234375, 4.7091064453125, 4.86572265625, 5.0223388671875, 5.178955078125, 5.3355712890625, 5.4921875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 10.0, 8.0, 11.0, 17.0, 33.0, 39.0, 65.0, 121.0, 267.0, 556.0, 1019.0, 2196.0, 4543.0, 9986.0, 21894.0, 49518.0, 119805.0, 290505.0, 314822.0, 133536.0, 54773.0, 24135.0, 11011.0, 5088.0, 2305.0, 1167.0, 503.0, 258.0, 154.0, 76.0, 48.0, 29.0, 19.0, 11.0, 9.0, 5.0, 4.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.22216796875, -5.9833984375, -5.74462890625, -5.505859375, -5.26708984375, -5.0283203125, -4.78955078125, -4.55078125, -4.31201171875, -4.0732421875, -3.83447265625, -3.595703125, -3.35693359375, -3.1181640625, -2.87939453125, -2.640625, -2.40185546875, -2.1630859375, -1.92431640625, -1.685546875, -1.44677734375, -1.2080078125, -0.96923828125, -0.73046875, -0.49169921875, -0.2529296875, -0.01416015625, 0.224609375, 0.46337890625, 0.7021484375, 0.94091796875, 1.1796875, 1.41845703125, 1.6572265625, 1.89599609375, 2.134765625, 2.37353515625, 2.6123046875, 2.85107421875, 3.08984375, 3.32861328125, 3.5673828125, 3.80615234375, 4.044921875, 4.28369140625, 4.5224609375, 4.76123046875, 5.0, 5.23876953125, 5.4775390625, 5.71630859375, 5.955078125, 6.19384765625, 6.4326171875, 6.67138671875, 6.91015625, 7.14892578125, 7.3876953125, 7.62646484375, 7.865234375, 8.10400390625, 8.3427734375, 8.58154296875, 8.8203125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 15.0, 14.0, 9.0, 18.0, 22.0, 19.0, 27.0, 26.0, 36.0, 32.0, 40.0, 33.0, 71.0, 86.0, 87.0, 180.0, 1313.0, 292.0, 158.0, 90.0, 72.0, 63.0, 44.0, 37.0, 42.0, 29.0, 42.0, 25.0, 20.0, 15.0, 14.0, 11.0, 10.0, 8.0, 6.0, 7.0, 3.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.5, -15.9658203125, -15.431640625, -14.8974609375, -14.36328125, -13.8291015625, -13.294921875, -12.7607421875, -12.2265625, -11.6923828125, -11.158203125, -10.6240234375, -10.08984375, -9.5556640625, -9.021484375, -8.4873046875, -7.953125, -7.4189453125, -6.884765625, -6.3505859375, -5.81640625, -5.2822265625, -4.748046875, -4.2138671875, -3.6796875, -3.1455078125, -2.611328125, -2.0771484375, -1.54296875, -1.0087890625, -0.474609375, 0.0595703125, 0.59375, 1.1279296875, 1.662109375, 2.1962890625, 2.73046875, 3.2646484375, 3.798828125, 4.3330078125, 4.8671875, 5.4013671875, 5.935546875, 6.4697265625, 7.00390625, 7.5380859375, 8.072265625, 8.6064453125, 9.140625, 9.6748046875, 10.208984375, 10.7431640625, 11.27734375, 11.8115234375, 12.345703125, 12.8798828125, 13.4140625, 13.9482421875, 14.482421875, 15.0166015625, 15.55078125, 16.0849609375, 16.619140625, 17.1533203125, 17.6875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 11.0, 6.0, 17.0, 19.0, 26.0, 33.0, 34.0, 52.0, 75.0, 111.0, 170.0, 251.0, 423.0, 1113.0, 14156.0, 2774879.0, 349239.0, 3404.0, 683.0, 326.0, 190.0, 133.0, 114.0, 89.0, 38.0, 36.0, 24.0, 17.0, 12.0, 9.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.625, -53.05517578125, -51.4853515625, -49.91552734375, -48.345703125, -46.77587890625, -45.2060546875, -43.63623046875, -42.06640625, -40.49658203125, -38.9267578125, -37.35693359375, -35.787109375, -34.21728515625, -32.6474609375, -31.07763671875, -29.5078125, -27.93798828125, -26.3681640625, -24.79833984375, -23.228515625, -21.65869140625, -20.0888671875, -18.51904296875, -16.94921875, -15.37939453125, -13.8095703125, -12.23974609375, -10.669921875, -9.10009765625, -7.5302734375, -5.96044921875, -4.390625, -2.82080078125, -1.2509765625, 0.31884765625, 1.888671875, 3.45849609375, 5.0283203125, 6.59814453125, 8.16796875, 9.73779296875, 11.3076171875, 12.87744140625, 14.447265625, 16.01708984375, 17.5869140625, 19.15673828125, 20.7265625, 22.29638671875, 23.8662109375, 25.43603515625, 27.005859375, 28.57568359375, 30.1455078125, 31.71533203125, 33.28515625, 34.85498046875, 36.4248046875, 37.99462890625, 39.564453125, 41.13427734375, 42.7041015625, 44.27392578125, 45.84375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 13.0, 25.0, 33.0, 61.0, 110.0, 142.0, 138.0, 138.0, 129.0, 85.0, 61.0, 29.0, 27.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09457778930664, -31.645435333251953, -30.196292877197266, -28.747150421142578, -27.29800796508789, -25.848865509033203, -24.399723052978516, -22.950580596923828, -21.50143814086914, -20.052295684814453, -18.603153228759766, -17.154010772705078, -15.70486831665039, -14.255725860595703, -12.806583404541016, -11.357440948486328, -9.90829849243164, -8.459156036376953, -7.010013580322266, -5.560871124267578, -4.111728668212891, -2.662586212158203, -1.2134437561035156, 0.23569869995117188, 1.6848411560058594, 3.133983612060547, 4.583126068115234, 6.032268524169922, 7.481410980224609, 8.930553436279297, 10.379695892333984, 11.828838348388672, 13.277976989746094, 14.727119445800781, 16.17626190185547, 17.625404357910156, 19.074546813964844, 20.52368927001953, 21.97283172607422, 23.421974182128906, 24.871116638183594, 26.32025909423828, 27.76940155029297, 29.218544006347656, 30.667686462402344, 32.11682891845703, 33.56597137451172, 35.015113830566406, 36.464256286621094, 37.91339874267578, 39.36254119873047, 40.811683654785156, 42.260826110839844, 43.70996856689453, 45.15911102294922, 46.608253479003906, 48.057395935058594, 49.50653839111328, 50.95568084716797, 52.404823303222656, 53.853965759277344, 55.30310821533203, 56.75225067138672, 58.201393127441406, 59.650535583496094]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 7.0, 8.0, 13.0, 16.0, 18.0, 17.0, 21.0, 22.0, 15.0, 23.0, 22.0, 29.0, 29.0, 44.0, 24.0, 39.0, 38.0, 33.0, 41.0, 37.0, 35.0, 34.0, 50.0, 36.0, 35.0, 36.0, 26.0, 25.0, 30.0, 19.0, 22.0, 22.0, 16.0, 19.0, 22.0, 8.0, 8.0, 10.0, 10.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-50.956722259521484, -49.449100494384766, -47.94148254394531, -46.433860778808594, -44.926239013671875, -43.418617248535156, -41.9109992980957, -40.403377532958984, -38.89575958251953, -37.38813781738281, -35.88051986694336, -34.37289810180664, -32.86527633666992, -31.357656478881836, -29.85003662109375, -28.34241485595703, -26.834793090820312, -25.327173233032227, -23.819551467895508, -22.311931610107422, -20.804309844970703, -19.296689987182617, -17.78907012939453, -16.281448364257812, -14.773828506469727, -13.266207695007324, -11.758586883544922, -10.250967025756836, -8.743346214294434, -7.235725402832031, -5.728105545043945, -4.220484733581543, -2.7128677368164062, -1.205247163772583, 0.30237340927124023, 1.8099937438964844, 3.3176145553588867, 4.825235366821289, 6.332855224609375, 7.840476036071777, 9.34809684753418, 10.855717658996582, 12.363338470458984, 13.87095832824707, 15.378579139709473, 16.886199951171875, 18.39381980895996, 19.901439666748047, 21.409061431884766, 22.91668128967285, 24.42430305480957, 25.931922912597656, 27.439544677734375, 28.94716453552246, 30.454784393310547, 31.962406158447266, 33.47002410888672, 34.97764587402344, 36.48526382446289, 37.99288558959961, 39.50050735473633, 41.00812530517578, 42.5157470703125, 44.02336883544922, 45.53099060058594]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 6.0, 4.0, 10.0, 8.0, 11.0, 11.0, 14.0, 25.0, 20.0, 24.0, 32.0, 29.0, 34.0, 23.0, 32.0, 29.0, 36.0, 26.0, 42.0, 46.0, 46.0, 41.0, 34.0, 38.0, 37.0, 34.0, 22.0, 21.0, 28.0, 27.0, 29.0, 20.0, 13.0, 20.0, 11.0, 26.0, 11.0, 8.0, 11.0, 12.0, 5.0, 4.0, 6.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.1171875, -4.960205078125, -4.80322265625, -4.646240234375, -4.4892578125, -4.332275390625, -4.17529296875, -4.018310546875, -3.861328125, -3.704345703125, -3.54736328125, -3.390380859375, -3.2333984375, -3.076416015625, -2.91943359375, -2.762451171875, -2.60546875, -2.448486328125, -2.29150390625, -2.134521484375, -1.9775390625, -1.820556640625, -1.66357421875, -1.506591796875, -1.349609375, -1.192626953125, -1.03564453125, -0.878662109375, -0.7216796875, -0.564697265625, -0.40771484375, -0.250732421875, -0.09375, 0.063232421875, 0.22021484375, 0.377197265625, 0.5341796875, 0.691162109375, 0.84814453125, 1.005126953125, 1.162109375, 1.319091796875, 1.47607421875, 1.633056640625, 1.7900390625, 1.947021484375, 2.10400390625, 2.260986328125, 2.41796875, 2.574951171875, 2.73193359375, 2.888916015625, 3.0458984375, 3.202880859375, 3.35986328125, 3.516845703125, 3.673828125, 3.830810546875, 3.98779296875, 4.144775390625, 4.3017578125, 4.458740234375, 4.61572265625, 4.772705078125, 4.9296875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 7.0, 5.0, 9.0, 7.0, 10.0, 10.0, 14.0, 14.0, 21.0, 29.0, 36.0, 48.0, 60.0, 99.0, 143.0, 228.0, 399.0, 1087.0, 3879.0, 18673.0, 107965.0, 632305.0, 2005547.0, 1156888.0, 220316.0, 36769.0, 6793.0, 1598.0, 553.0, 263.0, 127.0, 72.0, 74.0, 46.0, 34.0, 31.0, 21.0, 23.0, 19.0, 17.0, 8.0, 8.0, 5.0, 6.0, 4.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.9609375, -10.6038818359375, -10.246826171875, -9.8897705078125, -9.53271484375, -9.1756591796875, -8.818603515625, -8.4615478515625, -8.1044921875, -7.7474365234375, -7.390380859375, -7.0333251953125, -6.67626953125, -6.3192138671875, -5.962158203125, -5.6051025390625, -5.248046875, -4.8909912109375, -4.533935546875, -4.1768798828125, -3.81982421875, -3.4627685546875, -3.105712890625, -2.7486572265625, -2.3916015625, -2.0345458984375, -1.677490234375, -1.3204345703125, -0.96337890625, -0.6063232421875, -0.249267578125, 0.1077880859375, 0.46484375, 0.8218994140625, 1.178955078125, 1.5360107421875, 1.89306640625, 2.2501220703125, 2.607177734375, 2.9642333984375, 3.3212890625, 3.6783447265625, 4.035400390625, 4.3924560546875, 4.74951171875, 5.1065673828125, 5.463623046875, 5.8206787109375, 6.177734375, 6.5347900390625, 6.891845703125, 7.2489013671875, 7.60595703125, 7.9630126953125, 8.320068359375, 8.6771240234375, 9.0341796875, 9.3912353515625, 9.748291015625, 10.1053466796875, 10.46240234375, 10.8194580078125, 11.176513671875, 11.5335693359375, 11.890625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 10.0, 15.0, 14.0, 34.0, 26.0, 40.0, 55.0, 71.0, 116.0, 138.0, 190.0, 219.0, 296.0, 330.0, 394.0, 388.0, 406.0, 303.0, 261.0, 198.0, 135.0, 105.0, 76.0, 64.0, 45.0, 31.0, 18.0, 24.0, 14.0, 15.0, 7.0, 5.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.720458984375, -9.36279296875, -9.005126953125, -8.6474609375, -8.289794921875, -7.93212890625, -7.574462890625, -7.216796875, -6.859130859375, -6.50146484375, -6.143798828125, -5.7861328125, -5.428466796875, -5.07080078125, -4.713134765625, -4.35546875, -3.997802734375, -3.64013671875, -3.282470703125, -2.9248046875, -2.567138671875, -2.20947265625, -1.851806640625, -1.494140625, -1.136474609375, -0.77880859375, -0.421142578125, -0.0634765625, 0.294189453125, 0.65185546875, 1.009521484375, 1.3671875, 1.724853515625, 2.08251953125, 2.440185546875, 2.7978515625, 3.155517578125, 3.51318359375, 3.870849609375, 4.228515625, 4.586181640625, 4.94384765625, 5.301513671875, 5.6591796875, 6.016845703125, 6.37451171875, 6.732177734375, 7.08984375, 7.447509765625, 7.80517578125, 8.162841796875, 8.5205078125, 8.878173828125, 9.23583984375, 9.593505859375, 9.951171875, 10.308837890625, 10.66650390625, 11.024169921875, 11.3818359375, 11.739501953125, 12.09716796875, 12.454833984375, 12.8125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 6.0, 8.0, 10.0, 19.0, 15.0, 29.0, 38.0, 44.0, 64.0, 68.0, 121.0, 169.0, 266.0, 475.0, 2055.0, 64075.0, 2968538.0, 1139471.0, 16487.0, 1093.0, 379.0, 225.0, 196.0, 128.0, 64.0, 58.0, 47.0, 25.0, 28.0, 20.0, 11.0, 14.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.34375, -39.185546875, -38.02734375, -36.869140625, -35.7109375, -34.552734375, -33.39453125, -32.236328125, -31.078125, -29.919921875, -28.76171875, -27.603515625, -26.4453125, -25.287109375, -24.12890625, -22.970703125, -21.8125, -20.654296875, -19.49609375, -18.337890625, -17.1796875, -16.021484375, -14.86328125, -13.705078125, -12.546875, -11.388671875, -10.23046875, -9.072265625, -7.9140625, -6.755859375, -5.59765625, -4.439453125, -3.28125, -2.123046875, -0.96484375, 0.193359375, 1.3515625, 2.509765625, 3.66796875, 4.826171875, 5.984375, 7.142578125, 8.30078125, 9.458984375, 10.6171875, 11.775390625, 12.93359375, 14.091796875, 15.25, 16.408203125, 17.56640625, 18.724609375, 19.8828125, 21.041015625, 22.19921875, 23.357421875, 24.515625, 25.673828125, 26.83203125, 27.990234375, 29.1484375, 30.306640625, 31.46484375, 32.623046875, 33.78125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 9.0, 18.0, 32.0, 38.0, 69.0, 97.0, 129.0, 157.0, 138.0, 108.0, 80.0, 57.0, 43.0, 24.0, 13.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.25884246826172, -84.75608825683594, -82.25334167480469, -79.7505874633789, -77.24783325195312, -74.74508666992188, -72.2423324584961, -69.73957824707031, -67.23683166503906, -64.73407745361328, -62.23133087158203, -59.72857666015625, -57.225826263427734, -54.72307586669922, -52.22032165527344, -49.71757125854492, -47.214820861816406, -44.71207046508789, -42.209320068359375, -39.706565856933594, -37.20381546020508, -34.70106506347656, -32.19831085205078, -29.695560455322266, -27.19281005859375, -24.690059661865234, -22.187307357788086, -19.684555053710938, -17.181804656982422, -14.67905330657959, -12.176301956176758, -9.67354965209961, -7.1707916259765625, -4.6680402755737305, -2.1652889251708984, 0.3374624252319336, 2.8402137756347656, 5.342965126037598, 7.84571647644043, 10.348468780517578, 12.851219177246094, 15.353970527648926, 17.856721878051758, 20.359474182128906, 22.862224578857422, 25.364974975585938, 27.867727279663086, 30.370479583740234, 32.87322998046875, 35.375980377197266, 37.87873077392578, 40.38148498535156, 42.88423538208008, 45.386985778808594, 47.889739990234375, 50.39249038696289, 52.895240783691406, 55.39799118041992, 57.90074157714844, 60.40349578857422, 62.906246185302734, 65.40899658203125, 67.91175079345703, 70.41450500488281, 72.91725158691406]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 11.0, 10.0, 13.0, 12.0, 17.0, 19.0, 26.0, 24.0, 33.0, 39.0, 39.0, 43.0, 42.0, 40.0, 44.0, 41.0, 41.0, 63.0, 43.0, 46.0, 37.0, 33.0, 45.0, 29.0, 27.0, 28.0, 23.0, 29.0, 14.0, 17.0, 8.0, 12.0, 6.0, 8.0, 9.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.82818603515625, -46.40855026245117, -44.98891067504883, -43.56927490234375, -42.149635314941406, -40.72999954223633, -39.31036376953125, -37.890724182128906, -36.47108840942383, -35.05145263671875, -33.631813049316406, -32.21217727661133, -30.792539596557617, -29.372901916503906, -27.953266143798828, -26.533628463745117, -25.113990783691406, -23.694353103637695, -22.274715423583984, -20.855079650878906, -19.435441970825195, -18.015804290771484, -16.596168518066406, -15.176530838012695, -13.756893157958984, -12.337255477905273, -10.917618751525879, -9.497982025146484, -8.078344345092773, -6.658707141876221, -5.239069938659668, -3.8194332122802734, -2.3997955322265625, -0.9801583290100098, 0.43947887420654297, 1.8591160774230957, 3.2787532806396484, 4.698390483856201, 6.118027687072754, 7.537664413452148, 8.95730209350586, 10.37693977355957, 11.796576499938965, 13.21621322631836, 14.63585090637207, 16.05548858642578, 17.47512435913086, 18.89476203918457, 20.31439971923828, 21.734037399291992, 23.153675079345703, 24.57331085205078, 25.992948532104492, 27.412586212158203, 28.83222198486328, 30.251859664916992, 31.671497344970703, 33.09113311767578, 34.510772705078125, 35.9304084777832, 37.35004425048828, 38.769683837890625, 40.1893196105957, 41.60895538330078, 43.028594970703125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 8.0, 3.0, 10.0, 5.0, 11.0, 8.0, 7.0, 20.0, 12.0, 23.0, 20.0, 30.0, 30.0, 27.0, 30.0, 32.0, 43.0, 29.0, 27.0, 35.0, 34.0, 44.0, 44.0, 29.0, 31.0, 30.0, 43.0, 25.0, 33.0, 28.0, 27.0, 24.0, 22.0, 27.0, 28.0, 15.0, 18.0, 12.0, 12.0, 7.0, 16.0, 9.0, 7.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.31683349609375, -4.1649169921875, -4.01300048828125, -3.861083984375, -3.70916748046875, -3.5572509765625, -3.40533447265625, -3.25341796875, -3.10150146484375, -2.9495849609375, -2.79766845703125, -2.645751953125, -2.49383544921875, -2.3419189453125, -2.19000244140625, -2.0380859375, -1.88616943359375, -1.7342529296875, -1.58233642578125, -1.430419921875, -1.27850341796875, -1.1265869140625, -0.97467041015625, -0.82275390625, -0.67083740234375, -0.5189208984375, -0.36700439453125, -0.215087890625, -0.06317138671875, 0.0887451171875, 0.24066162109375, 0.392578125, 0.54449462890625, 0.6964111328125, 0.84832763671875, 1.000244140625, 1.15216064453125, 1.3040771484375, 1.45599365234375, 1.60791015625, 1.75982666015625, 1.9117431640625, 2.06365966796875, 2.215576171875, 2.36749267578125, 2.5194091796875, 2.67132568359375, 2.8232421875, 2.97515869140625, 3.1270751953125, 3.27899169921875, 3.430908203125, 3.58282470703125, 3.7347412109375, 3.88665771484375, 4.03857421875, 4.19049072265625, 4.3424072265625, 4.49432373046875, 4.646240234375, 4.79815673828125, 4.9500732421875, 5.10198974609375, 5.25390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 6.0, 17.0, 28.0, 23.0, 53.0, 66.0, 119.0, 156.0, 257.0, 371.0, 612.0, 941.0, 1580.0, 2540.0, 4246.0, 6957.0, 11336.0, 17831.0, 28419.0, 43846.0, 65187.0, 91033.0, 116940.0, 135993.0, 135315.0, 115490.0, 89475.0, 63428.0, 42704.0, 27517.0, 17627.0, 10924.0, 6679.0, 4143.0, 2577.0, 1507.0, 904.0, 602.0, 392.0, 228.0, 167.0, 99.0, 66.0, 50.0, 26.0, 22.0, 12.0, 5.0, 14.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-1.009765625, -0.978179931640625, -0.94659423828125, -0.915008544921875, -0.8834228515625, -0.851837158203125, -0.82025146484375, -0.788665771484375, -0.757080078125, -0.725494384765625, -0.69390869140625, -0.662322998046875, -0.6307373046875, -0.599151611328125, -0.56756591796875, -0.535980224609375, -0.50439453125, -0.472808837890625, -0.44122314453125, -0.409637451171875, -0.3780517578125, -0.346466064453125, -0.31488037109375, -0.283294677734375, -0.251708984375, -0.220123291015625, -0.18853759765625, -0.156951904296875, -0.1253662109375, -0.093780517578125, -0.06219482421875, -0.030609130859375, 0.0009765625, 0.032562255859375, 0.06414794921875, 0.095733642578125, 0.1273193359375, 0.158905029296875, 0.19049072265625, 0.222076416015625, 0.253662109375, 0.285247802734375, 0.31683349609375, 0.348419189453125, 0.3800048828125, 0.411590576171875, 0.44317626953125, 0.474761962890625, 0.50634765625, 0.537933349609375, 0.56951904296875, 0.601104736328125, 0.6326904296875, 0.664276123046875, 0.69586181640625, 0.727447509765625, 0.759033203125, 0.790618896484375, 0.82220458984375, 0.853790283203125, 0.8853759765625, 0.916961669921875, 0.94854736328125, 0.980133056640625, 1.01171875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 7.0, 8.0, 4.0, 4.0, 13.0, 8.0, 6.0, 14.0, 18.0, 10.0, 14.0, 24.0, 19.0, 18.0, 27.0, 24.0, 28.0, 29.0, 33.0, 27.0, 31.0, 38.0, 29.0, 30.0, 1071.0, 29.0, 36.0, 37.0, 42.0, 28.0, 35.0, 26.0, 32.0, 24.0, 24.0, 23.0, 22.0, 23.0, 13.0, 18.0, 13.0, 14.0, 7.0, 10.0, 4.0, 8.0, 3.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-3.97265625, -3.85357666015625, -3.7344970703125, -3.61541748046875, -3.496337890625, -3.37725830078125, -3.2581787109375, -3.13909912109375, -3.02001953125, -2.90093994140625, -2.7818603515625, -2.66278076171875, -2.543701171875, -2.42462158203125, -2.3055419921875, -2.18646240234375, -2.0673828125, -1.94830322265625, -1.8292236328125, -1.71014404296875, -1.591064453125, -1.47198486328125, -1.3529052734375, -1.23382568359375, -1.11474609375, -0.99566650390625, -0.8765869140625, -0.75750732421875, -0.638427734375, -0.51934814453125, -0.4002685546875, -0.28118896484375, -0.162109375, -0.04302978515625, 0.0760498046875, 0.19512939453125, 0.314208984375, 0.43328857421875, 0.5523681640625, 0.67144775390625, 0.79052734375, 0.90960693359375, 1.0286865234375, 1.14776611328125, 1.266845703125, 1.38592529296875, 1.5050048828125, 1.62408447265625, 1.7431640625, 1.86224365234375, 1.9813232421875, 2.10040283203125, 2.219482421875, 2.33856201171875, 2.4576416015625, 2.57672119140625, 2.69580078125, 2.81488037109375, 2.9339599609375, 3.05303955078125, 3.172119140625, 3.29119873046875, 3.4102783203125, 3.52935791015625, 3.6484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 5.0, 11.0, 8.0, 26.0, 28.0, 43.0, 53.0, 76.0, 141.0, 217.0, 347.0, 577.0, 903.0, 1581.0, 2494.0, 3884.0, 6688.0, 10920.0, 18369.0, 31042.0, 78481.0, 1849749.0, 37255.0, 21482.0, 12753.0, 7657.0, 4671.0, 2817.0, 1791.0, 1136.0, 669.0, 470.0, 289.0, 143.0, 130.0, 78.0, 43.0, 31.0, 29.0, 13.0, 11.0, 12.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.955078125, -1.89947509765625, -1.8438720703125, -1.78826904296875, -1.732666015625, -1.67706298828125, -1.6214599609375, -1.56585693359375, -1.51025390625, -1.45465087890625, -1.3990478515625, -1.34344482421875, -1.287841796875, -1.23223876953125, -1.1766357421875, -1.12103271484375, -1.0654296875, -1.00982666015625, -0.9542236328125, -0.89862060546875, -0.843017578125, -0.78741455078125, -0.7318115234375, -0.67620849609375, -0.62060546875, -0.56500244140625, -0.5093994140625, -0.45379638671875, -0.398193359375, -0.34259033203125, -0.2869873046875, -0.23138427734375, -0.17578125, -0.12017822265625, -0.0645751953125, -0.00897216796875, 0.046630859375, 0.10223388671875, 0.1578369140625, 0.21343994140625, 0.26904296875, 0.32464599609375, 0.3802490234375, 0.43585205078125, 0.491455078125, 0.54705810546875, 0.6026611328125, 0.65826416015625, 0.7138671875, 0.76947021484375, 0.8250732421875, 0.88067626953125, 0.936279296875, 0.99188232421875, 1.0474853515625, 1.10308837890625, 1.15869140625, 1.21429443359375, 1.2698974609375, 1.32550048828125, 1.381103515625, 1.43670654296875, 1.4923095703125, 1.54791259765625, 1.603515625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 7.0, 13.0, 12.0, 14.0, 20.0, 26.0, 39.0, 118.0, 341.0, 238.0, 57.0, 30.0, 23.0, 14.0, 11.0, 9.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2724609375, -0.2626304626464844, -0.25279998779296875, -0.24296951293945312, -0.2331390380859375, -0.22330856323242188, -0.21347808837890625, -0.20364761352539062, -0.193817138671875, -0.18398666381835938, -0.17415618896484375, -0.16432571411132812, -0.1544952392578125, -0.14466476440429688, -0.13483428955078125, -0.12500381469726562, -0.11517333984375, -0.10534286499023438, -0.09551239013671875, -0.08568191528320312, -0.0758514404296875, -0.06602096557617188, -0.05619049072265625, -0.046360015869140625, -0.036529541015625, -0.026699066162109375, -0.01686859130859375, -0.007038116455078125, 0.0027923583984375, 0.012622833251953125, 0.02245330810546875, 0.032283782958984375, 0.0421142578125, 0.051944732666015625, 0.06177520751953125, 0.07160568237304688, 0.0814361572265625, 0.09126663208007812, 0.10109710693359375, 0.11092758178710938, 0.120758056640625, 0.13058853149414062, 0.14041900634765625, 0.15024948120117188, 0.1600799560546875, 0.16991043090820312, 0.17974090576171875, 0.18957138061523438, 0.19940185546875, 0.20923233032226562, 0.21906280517578125, 0.22889328002929688, 0.2387237548828125, 0.24855422973632812, 0.25838470458984375, 0.2682151794433594, 0.278045654296875, 0.2878761291503906, 0.29770660400390625, 0.3075370788574219, 0.3173675537109375, 0.3271980285644531, 0.33702850341796875, 0.3468589782714844, 0.356689453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 12.0, 22.0, 21.0, 34.0, 80.0, 242.0, 1732.0, 48819.0, 992790.0, 4110.0, 419.0, 109.0, 45.0, 32.0, 19.0, 16.0, 13.0, 3.0, 1.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.1015625, -5.932861328125, -5.76416015625, -5.595458984375, -5.4267578125, -5.258056640625, -5.08935546875, -4.920654296875, -4.751953125, -4.583251953125, -4.41455078125, -4.245849609375, -4.0771484375, -3.908447265625, -3.73974609375, -3.571044921875, -3.40234375, -3.233642578125, -3.06494140625, -2.896240234375, -2.7275390625, -2.558837890625, -2.39013671875, -2.221435546875, -2.052734375, -1.884033203125, -1.71533203125, -1.546630859375, -1.3779296875, -1.209228515625, -1.04052734375, -0.871826171875, -0.703125, -0.534423828125, -0.36572265625, -0.197021484375, -0.0283203125, 0.140380859375, 0.30908203125, 0.477783203125, 0.646484375, 0.815185546875, 0.98388671875, 1.152587890625, 1.3212890625, 1.489990234375, 1.65869140625, 1.827392578125, 1.99609375, 2.164794921875, 2.33349609375, 2.502197265625, 2.6708984375, 2.839599609375, 3.00830078125, 3.177001953125, 3.345703125, 3.514404296875, 3.68310546875, 3.851806640625, 4.0205078125, 4.189208984375, 4.35791015625, 4.526611328125, 4.6953125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 27.0, 53.0, 110.0, 305.0, 271.0, 119.0, 49.0, 19.0, 20.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1162141561508179, -1.0777323246002197, -1.039250373840332, -1.0007685422897339, -0.9622867107391357, -0.9238048195838928, -0.8853229284286499, -0.8468410968780518, -0.8083592057228088, -0.7698773145675659, -0.7313954830169678, -0.6929135918617249, -0.6544317007064819, -0.6159498691558838, -0.5774679780006409, -0.538986086845398, -0.5005042552947998, -0.4620223939418793, -0.42354053258895874, -0.3850586414337158, -0.3465767800807953, -0.30809491872787476, -0.26961302757263184, -0.2311311662197113, -0.19264930486679077, -0.15416744351387024, -0.11568556725978851, -0.07720369845628738, -0.038721829652786255, -0.00023996829986572266, 0.038241907954216, 0.07672378420829773, 0.11520576477050781, 0.15368762612342834, 0.19216950237751007, 0.2306513786315918, 0.26913323998451233, 0.30761510133743286, 0.3460969924926758, 0.3845788538455963, 0.42306071519851685, 0.4615425765514374, 0.5000244379043579, 0.5385063290596008, 0.5769882202148438, 0.6154700517654419, 0.6539519429206848, 0.6924338340759277, 0.7309156656265259, 0.7693975567817688, 0.8078793883323669, 0.8463612794876099, 0.884843111038208, 0.9233250021934509, 0.9618068933486938, 1.000288724899292, 1.0387706756591797, 1.0772525072097778, 1.1157344579696655, 1.1542162895202637, 1.1926981210708618, 1.23117995262146, 1.2696619033813477, 1.3081437349319458, 1.346625566482544]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 4.0, 12.0, 11.0, 14.0, 11.0, 19.0, 19.0, 18.0, 15.0, 28.0, 25.0, 27.0, 34.0, 50.0, 40.0, 41.0, 42.0, 42.0, 50.0, 47.0, 39.0, 46.0, 41.0, 37.0, 37.0, 39.0, 22.0, 34.0, 23.0, 19.0, 18.0, 19.0, 13.0, 7.0, 9.0, 10.0, 9.0, 4.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.44784456491470337, -0.4333411753177643, -0.4188377857208252, -0.4043343961238861, -0.389831006526947, -0.37532761693000793, -0.36082422733306885, -0.34632083773612976, -0.3318174481391907, -0.3173140585422516, -0.3028106689453125, -0.2883072793483734, -0.2738038897514343, -0.25930050015449524, -0.24479711055755615, -0.23029372096061707, -0.21579033136367798, -0.2012869417667389, -0.1867835521697998, -0.17228016257286072, -0.15777677297592163, -0.14327338337898254, -0.12876999378204346, -0.11426660418510437, -0.09976321458816528, -0.0852598249912262, -0.07075643539428711, -0.05625304579734802, -0.041749656200408936, -0.02724626660346985, -0.012742877006530762, 0.0017605125904083252, 0.016263902187347412, 0.0307672917842865, 0.045270681381225586, 0.05977407097816467, 0.07427746057510376, 0.08878085017204285, 0.10328423976898193, 0.11778762936592102, 0.1322910189628601, 0.1467944085597992, 0.16129779815673828, 0.17580118775367737, 0.19030457735061646, 0.20480796694755554, 0.21931135654449463, 0.23381474614143372, 0.2483181357383728, 0.2628215253353119, 0.277324914932251, 0.29182830452919006, 0.30633169412612915, 0.32083508372306824, 0.3353384733200073, 0.3498418629169464, 0.3643452525138855, 0.3788486421108246, 0.39335203170776367, 0.40785542130470276, 0.42235881090164185, 0.43686220049858093, 0.45136559009552, 0.4658689796924591, 0.4803723692893982]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 5.0, 2.0, 2.0, 6.0, 6.0, 7.0, 12.0, 11.0, 15.0, 8.0, 12.0, 25.0, 17.0, 20.0, 29.0, 32.0, 32.0, 38.0, 43.0, 31.0, 39.0, 34.0, 32.0, 38.0, 40.0, 38.0, 29.0, 31.0, 41.0, 35.0, 40.0, 26.0, 28.0, 29.0, 18.0, 24.0, 18.0, 14.0, 16.0, 17.0, 10.0, 11.0, 9.0, 5.0, 8.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.83203125, -4.67755126953125, -4.5230712890625, -4.36859130859375, -4.214111328125, -4.05963134765625, -3.9051513671875, -3.75067138671875, -3.59619140625, -3.44171142578125, -3.2872314453125, -3.13275146484375, -2.978271484375, -2.82379150390625, -2.6693115234375, -2.51483154296875, -2.3603515625, -2.20587158203125, -2.0513916015625, -1.89691162109375, -1.742431640625, -1.58795166015625, -1.4334716796875, -1.27899169921875, -1.12451171875, -0.97003173828125, -0.8155517578125, -0.66107177734375, -0.506591796875, -0.35211181640625, -0.1976318359375, -0.04315185546875, 0.111328125, 0.26580810546875, 0.4202880859375, 0.57476806640625, 0.729248046875, 0.88372802734375, 1.0382080078125, 1.19268798828125, 1.34716796875, 1.50164794921875, 1.6561279296875, 1.81060791015625, 1.965087890625, 2.11956787109375, 2.2740478515625, 2.42852783203125, 2.5830078125, 2.73748779296875, 2.8919677734375, 3.04644775390625, 3.200927734375, 3.35540771484375, 3.5098876953125, 3.66436767578125, 3.81884765625, 3.97332763671875, 4.1278076171875, 4.28228759765625, 4.436767578125, 4.59124755859375, 4.7457275390625, 4.90020751953125, 5.0546875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 16.0, 23.0, 26.0, 85.0, 176.0, 377.0, 933.0, 2378.0, 5771.0, 15886.0, 44267.0, 135622.0, 422445.0, 282808.0, 89725.0, 29978.0, 10987.0, 4218.0, 1639.0, 660.0, 270.0, 126.0, 64.0, 22.0, 13.0, 11.0, 6.0, 7.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9140625, -6.59716796875, -6.2802734375, -5.96337890625, -5.646484375, -5.32958984375, -5.0126953125, -4.69580078125, -4.37890625, -4.06201171875, -3.7451171875, -3.42822265625, -3.111328125, -2.79443359375, -2.4775390625, -2.16064453125, -1.84375, -1.52685546875, -1.2099609375, -0.89306640625, -0.576171875, -0.25927734375, 0.0576171875, 0.37451171875, 0.69140625, 1.00830078125, 1.3251953125, 1.64208984375, 1.958984375, 2.27587890625, 2.5927734375, 2.90966796875, 3.2265625, 3.54345703125, 3.8603515625, 4.17724609375, 4.494140625, 4.81103515625, 5.1279296875, 5.44482421875, 5.76171875, 6.07861328125, 6.3955078125, 6.71240234375, 7.029296875, 7.34619140625, 7.6630859375, 7.97998046875, 8.296875, 8.61376953125, 8.9306640625, 9.24755859375, 9.564453125, 9.88134765625, 10.1982421875, 10.51513671875, 10.83203125, 11.14892578125, 11.4658203125, 11.78271484375, 12.099609375, 12.41650390625, 12.7333984375, 13.05029296875, 13.3671875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 8.0, 10.0, 8.0, 10.0, 14.0, 17.0, 19.0, 21.0, 34.0, 35.0, 36.0, 39.0, 50.0, 62.0, 80.0, 177.0, 341.0, 1390.0, 201.0, 90.0, 66.0, 69.0, 43.0, 38.0, 31.0, 34.0, 18.0, 22.0, 18.0, 12.0, 13.0, 7.0, 6.0, 8.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.140625, -18.458984375, -17.77734375, -17.095703125, -16.4140625, -15.732421875, -15.05078125, -14.369140625, -13.6875, -13.005859375, -12.32421875, -11.642578125, -10.9609375, -10.279296875, -9.59765625, -8.916015625, -8.234375, -7.552734375, -6.87109375, -6.189453125, -5.5078125, -4.826171875, -4.14453125, -3.462890625, -2.78125, -2.099609375, -1.41796875, -0.736328125, -0.0546875, 0.626953125, 1.30859375, 1.990234375, 2.671875, 3.353515625, 4.03515625, 4.716796875, 5.3984375, 6.080078125, 6.76171875, 7.443359375, 8.125, 8.806640625, 9.48828125, 10.169921875, 10.8515625, 11.533203125, 12.21484375, 12.896484375, 13.578125, 14.259765625, 14.94140625, 15.623046875, 16.3046875, 16.986328125, 17.66796875, 18.349609375, 19.03125, 19.712890625, 20.39453125, 21.076171875, 21.7578125, 22.439453125, 23.12109375, 23.802734375, 24.484375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 6.0, 7.0, 15.0, 25.0, 31.0, 40.0, 49.0, 58.0, 100.0, 137.0, 207.0, 309.0, 591.0, 2482.0, 242882.0, 2885905.0, 10698.0, 936.0, 409.0, 252.0, 163.0, 111.0, 68.0, 58.0, 37.0, 19.0, 28.0, 11.0, 12.0, 14.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.0, -60.18798828125, -58.3759765625, -56.56396484375, -54.751953125, -52.93994140625, -51.1279296875, -49.31591796875, -47.50390625, -45.69189453125, -43.8798828125, -42.06787109375, -40.255859375, -38.44384765625, -36.6318359375, -34.81982421875, -33.0078125, -31.19580078125, -29.3837890625, -27.57177734375, -25.759765625, -23.94775390625, -22.1357421875, -20.32373046875, -18.51171875, -16.69970703125, -14.8876953125, -13.07568359375, -11.263671875, -9.45166015625, -7.6396484375, -5.82763671875, -4.015625, -2.20361328125, -0.3916015625, 1.42041015625, 3.232421875, 5.04443359375, 6.8564453125, 8.66845703125, 10.48046875, 12.29248046875, 14.1044921875, 15.91650390625, 17.728515625, 19.54052734375, 21.3525390625, 23.16455078125, 24.9765625, 26.78857421875, 28.6005859375, 30.41259765625, 32.224609375, 34.03662109375, 35.8486328125, 37.66064453125, 39.47265625, 41.28466796875, 43.0966796875, 44.90869140625, 46.720703125, 48.53271484375, 50.3447265625, 52.15673828125, 53.96875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 196.0, 802.0, 20.0], "bins": [-741.6276245117188, -729.7186889648438, -717.809814453125, -705.90087890625, -693.991943359375, -682.0830078125, -670.1741333007812, -658.2651977539062, -646.3562622070312, -634.4473266601562, -622.5384521484375, -610.6295166015625, -598.7205810546875, -586.8116455078125, -574.9027709960938, -562.9938354492188, -551.0849609375, -539.176025390625, -527.2671508789062, -515.3582153320312, -503.44927978515625, -491.5403747558594, -479.6314697265625, -467.7225341796875, -455.8135986328125, -443.9046936035156, -431.9957580566406, -420.08685302734375, -408.17791748046875, -396.2690124511719, -384.360107421875, -372.451171875, -360.542236328125, -348.6333312988281, -336.7243957519531, -324.81549072265625, -312.90655517578125, -300.9976501464844, -289.0887451171875, -277.1798095703125, -265.2709045410156, -253.3619842529297, -241.45306396484375, -229.54415893554688, -217.63523864746094, -205.726318359375, -193.81739807128906, -181.90847778320312, -169.9995574951172, -158.09063720703125, -146.1817169189453, -134.27279663085938, -122.3638916015625, -110.45497131347656, -98.54605102539062, -86.63713836669922, -74.72822570800781, -62.81930923461914, -50.91039276123047, -39.00147247314453, -27.09255599975586, -15.183639526367188, -3.27471923828125, 8.634193420410156, 20.54311752319336]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 9.0, 7.0, 13.0, 15.0, 19.0, 14.0, 11.0, 22.0, 16.0, 27.0, 21.0, 25.0, 24.0, 29.0, 31.0, 32.0, 35.0, 39.0, 53.0, 36.0, 37.0, 37.0, 50.0, 26.0, 32.0, 39.0, 29.0, 27.0, 29.0, 27.0, 25.0, 30.0, 14.0, 14.0, 18.0, 12.0, 11.0, 11.0, 7.0, 6.0, 9.0, 7.0, 4.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-40.99949645996094, -39.665733337402344, -38.331974029541016, -36.99821090698242, -35.66444778442383, -34.3306884765625, -32.996925354003906, -31.663162231445312, -30.32940101623535, -28.99563980102539, -27.661876678466797, -26.328115463256836, -24.994354248046875, -23.66059112548828, -22.32682991027832, -20.99306869506836, -19.659305572509766, -18.325544357299805, -16.99178123474121, -15.65802001953125, -14.324257850646973, -12.990495681762695, -11.656734466552734, -10.322972297668457, -8.98921012878418, -7.655447959899902, -6.321686267852783, -4.987924575805664, -3.6541624069213867, -2.3204002380371094, -0.9866390228271484, 0.3471231460571289, 1.6808853149414062, 3.0146472454071045, 4.348409175872803, 5.682170867919922, 7.015933036804199, 8.349695205688477, 9.683456420898438, 11.017218589782715, 12.350980758666992, 13.68474292755127, 15.018505096435547, 16.352266311645508, 17.68602752685547, 19.019790649414062, 20.353551864624023, 21.687313079833984, 23.021076202392578, 24.35483741760254, 25.688600540161133, 27.022361755371094, 28.356124877929688, 29.68988609313965, 31.02364730834961, 32.3574104309082, 33.69116973876953, 35.024932861328125, 36.35869216918945, 37.69245529174805, 39.02621841430664, 40.35997772216797, 41.69374084472656, 43.027503967285156, 44.36126708984375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 5.0, 8.0, 8.0, 10.0, 9.0, 20.0, 19.0, 15.0, 22.0, 27.0, 27.0, 32.0, 34.0, 18.0, 44.0, 28.0, 36.0, 32.0, 41.0, 48.0, 41.0, 36.0, 35.0, 30.0, 32.0, 31.0, 31.0, 31.0, 17.0, 30.0, 28.0, 24.0, 20.0, 23.0, 15.0, 16.0, 8.0, 6.0, 10.0, 3.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.25390625, -5.0821533203125, -4.910400390625, -4.7386474609375, -4.56689453125, -4.3951416015625, -4.223388671875, -4.0516357421875, -3.8798828125, -3.7081298828125, -3.536376953125, -3.3646240234375, -3.19287109375, -3.0211181640625, -2.849365234375, -2.6776123046875, -2.505859375, -2.3341064453125, -2.162353515625, -1.9906005859375, -1.81884765625, -1.6470947265625, -1.475341796875, -1.3035888671875, -1.1318359375, -0.9600830078125, -0.788330078125, -0.6165771484375, -0.44482421875, -0.2730712890625, -0.101318359375, 0.0704345703125, 0.2421875, 0.4139404296875, 0.585693359375, 0.7574462890625, 0.92919921875, 1.1009521484375, 1.272705078125, 1.4444580078125, 1.6162109375, 1.7879638671875, 1.959716796875, 2.1314697265625, 2.30322265625, 2.4749755859375, 2.646728515625, 2.8184814453125, 2.990234375, 3.1619873046875, 3.333740234375, 3.5054931640625, 3.67724609375, 3.8489990234375, 4.020751953125, 4.1925048828125, 4.3642578125, 4.5360107421875, 4.707763671875, 4.8795166015625, 5.05126953125, 5.2230224609375, 5.394775390625, 5.5665283203125, 5.73828125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 12.0, 6.0, 16.0, 8.0, 32.0, 31.0, 40.0, 51.0, 77.0, 117.0, 191.0, 290.0, 549.0, 1339.0, 3549.0, 10743.0, 35153.0, 119056.0, 400490.0, 1082205.0, 1470781.0, 736448.0, 233456.0, 68495.0, 20327.0, 6508.0, 2234.0, 897.0, 424.0, 235.0, 151.0, 81.0, 72.0, 55.0, 43.0, 34.0, 23.0, 13.0, 5.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37109375, -7.11932373046875, -6.8675537109375, -6.61578369140625, -6.364013671875, -6.11224365234375, -5.8604736328125, -5.60870361328125, -5.35693359375, -5.10516357421875, -4.8533935546875, -4.60162353515625, -4.349853515625, -4.09808349609375, -3.8463134765625, -3.59454345703125, -3.3427734375, -3.09100341796875, -2.8392333984375, -2.58746337890625, -2.335693359375, -2.08392333984375, -1.8321533203125, -1.58038330078125, -1.32861328125, -1.07684326171875, -0.8250732421875, -0.57330322265625, -0.321533203125, -0.06976318359375, 0.1820068359375, 0.43377685546875, 0.685546875, 0.93731689453125, 1.1890869140625, 1.44085693359375, 1.692626953125, 1.94439697265625, 2.1961669921875, 2.44793701171875, 2.69970703125, 2.95147705078125, 3.2032470703125, 3.45501708984375, 3.706787109375, 3.95855712890625, 4.2103271484375, 4.46209716796875, 4.7138671875, 4.96563720703125, 5.2174072265625, 5.46917724609375, 5.720947265625, 5.97271728515625, 6.2244873046875, 6.47625732421875, 6.72802734375, 6.97979736328125, 7.2315673828125, 7.48333740234375, 7.735107421875, 7.98687744140625, 8.2386474609375, 8.49041748046875, 8.7421875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 10.0, 10.0, 8.0, 12.0, 32.0, 30.0, 50.0, 60.0, 88.0, 126.0, 138.0, 175.0, 260.0, 307.0, 346.0, 414.0, 394.0, 369.0, 279.0, 241.0, 187.0, 138.0, 101.0, 71.0, 43.0, 43.0, 32.0, 29.0, 22.0, 13.0, 14.0, 8.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.37841796875, -9.0146484375, -8.65087890625, -8.287109375, -7.92333984375, -7.5595703125, -7.19580078125, -6.83203125, -6.46826171875, -6.1044921875, -5.74072265625, -5.376953125, -5.01318359375, -4.6494140625, -4.28564453125, -3.921875, -3.55810546875, -3.1943359375, -2.83056640625, -2.466796875, -2.10302734375, -1.7392578125, -1.37548828125, -1.01171875, -0.64794921875, -0.2841796875, 0.07958984375, 0.443359375, 0.80712890625, 1.1708984375, 1.53466796875, 1.8984375, 2.26220703125, 2.6259765625, 2.98974609375, 3.353515625, 3.71728515625, 4.0810546875, 4.44482421875, 4.80859375, 5.17236328125, 5.5361328125, 5.89990234375, 6.263671875, 6.62744140625, 6.9912109375, 7.35498046875, 7.71875, 8.08251953125, 8.4462890625, 8.81005859375, 9.173828125, 9.53759765625, 9.9013671875, 10.26513671875, 10.62890625, 10.99267578125, 11.3564453125, 11.72021484375, 12.083984375, 12.44775390625, 12.8115234375, 13.17529296875, 13.5390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 10.0, 8.0, 12.0, 17.0, 24.0, 25.0, 40.0, 45.0, 61.0, 86.0, 106.0, 163.0, 267.0, 386.0, 920.0, 16847.0, 1098197.0, 3000606.0, 73144.0, 1944.0, 442.0, 252.0, 169.0, 149.0, 96.0, 76.0, 59.0, 45.0, 21.0, 14.0, 9.0, 9.0, 10.0, 4.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-42.34375, -41.17333984375, -40.0029296875, -38.83251953125, -37.662109375, -36.49169921875, -35.3212890625, -34.15087890625, -32.98046875, -31.81005859375, -30.6396484375, -29.46923828125, -28.298828125, -27.12841796875, -25.9580078125, -24.78759765625, -23.6171875, -22.44677734375, -21.2763671875, -20.10595703125, -18.935546875, -17.76513671875, -16.5947265625, -15.42431640625, -14.25390625, -13.08349609375, -11.9130859375, -10.74267578125, -9.572265625, -8.40185546875, -7.2314453125, -6.06103515625, -4.890625, -3.72021484375, -2.5498046875, -1.37939453125, -0.208984375, 0.96142578125, 2.1318359375, 3.30224609375, 4.47265625, 5.64306640625, 6.8134765625, 7.98388671875, 9.154296875, 10.32470703125, 11.4951171875, 12.66552734375, 13.8359375, 15.00634765625, 16.1767578125, 17.34716796875, 18.517578125, 19.68798828125, 20.8583984375, 22.02880859375, 23.19921875, 24.36962890625, 25.5400390625, 26.71044921875, 27.880859375, 29.05126953125, 30.2216796875, 31.39208984375, 32.5625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 15.0, 18.0, 30.0, 28.0, 43.0, 46.0, 49.0, 59.0, 70.0, 63.0, 71.0, 78.0, 69.0, 69.0, 63.0, 47.0, 38.0, 35.0, 17.0, 22.0, 19.0, 11.0, 9.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.73601150512695, -36.53300094604492, -35.329994201660156, -34.126983642578125, -32.92397689819336, -31.720966339111328, -30.51795768737793, -29.31494903564453, -28.1119384765625, -26.9089298248291, -25.705921173095703, -24.502910614013672, -23.299901962280273, -22.096893310546875, -20.893884658813477, -19.690876007080078, -18.48786735534668, -17.28485870361328, -16.081850051879883, -14.878840446472168, -13.675830841064453, -12.472822189331055, -11.269813537597656, -10.066803932189941, -8.863795280456543, -7.660786151885986, -6.45777702331543, -5.254768371582031, -4.051759243011475, -2.848750114440918, -1.6457414627075195, -0.4427318572998047, 0.7602767944335938, 1.9632858037948608, 3.166294813156128, 4.3693037033081055, 5.572312831878662, 6.775321960449219, 7.978330612182617, 9.181340217590332, 10.38434886932373, 11.587357521057129, 12.790367126464844, 13.993375778198242, 15.19638442993164, 16.399394989013672, 17.602401733398438, 18.80541229248047, 20.008420944213867, 21.211429595947266, 22.414438247680664, 23.617446899414062, 24.820457458496094, 26.023466110229492, 27.22647476196289, 28.429485321044922, 29.632492065429688, 30.835500717163086, 32.038509368896484, 33.241519927978516, 34.44452667236328, 35.64753723144531, 36.850547790527344, 38.05355453491211, 39.25656509399414]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 10.0, 11.0, 10.0, 15.0, 17.0, 20.0, 24.0, 29.0, 32.0, 26.0, 31.0, 31.0, 34.0, 41.0, 42.0, 35.0, 37.0, 45.0, 40.0, 44.0, 35.0, 32.0, 42.0, 29.0, 29.0, 24.0, 34.0, 29.0, 29.0, 26.0, 11.0, 21.0, 12.0, 16.0, 12.0, 6.0, 8.0, 2.0, 3.0, 5.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.173336029052734, -36.96659851074219, -35.759857177734375, -34.55311965942383, -33.34638214111328, -32.13964080810547, -30.932903289794922, -29.726163864135742, -28.519424438476562, -27.312685012817383, -26.105947494506836, -24.899208068847656, -23.692468643188477, -22.485729217529297, -21.27899169921875, -20.07225227355957, -18.865514755249023, -17.658775329589844, -16.452037811279297, -15.245298385620117, -14.038558959960938, -12.831820487976074, -11.625082015991211, -10.418342590332031, -9.211604118347168, -8.004865646362305, -6.798126220703125, -5.591387748718262, -4.38464879989624, -3.1779098510742188, -1.9711713790893555, -0.7644319534301758, 0.4423065185546875, 1.6490453481674194, 2.8557841777801514, 4.062522888183594, 5.269261837005615, 6.476000785827637, 7.6827392578125, 8.88947868347168, 10.096217155456543, 11.302955627441406, 12.509695053100586, 13.71643352508545, 14.923171997070312, 16.129911422729492, 17.336650848388672, 18.54338836669922, 19.7501277923584, 20.956867218017578, 22.163604736328125, 23.370344161987305, 24.577083587646484, 25.78382110595703, 26.99056053161621, 28.19729995727539, 29.404037475585938, 30.610776901245117, 31.817514419555664, 33.024253845214844, 34.23099136352539, 35.4377326965332, 36.64447021484375, 37.85121154785156, 39.05794906616211]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 13.0, 10.0, 14.0, 7.0, 13.0, 13.0, 23.0, 26.0, 36.0, 25.0, 34.0, 35.0, 32.0, 52.0, 42.0, 35.0, 35.0, 38.0, 38.0, 29.0, 42.0, 29.0, 34.0, 41.0, 28.0, 42.0, 26.0, 26.0, 18.0, 18.0, 17.0, 25.0, 12.0, 7.0, 7.0, 10.0, 10.0, 8.0, 7.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.0726318359375, -4.903076171875, -4.7335205078125, -4.56396484375, -4.3944091796875, -4.224853515625, -4.0552978515625, -3.8857421875, -3.7161865234375, -3.546630859375, -3.3770751953125, -3.20751953125, -3.0379638671875, -2.868408203125, -2.6988525390625, -2.529296875, -2.3597412109375, -2.190185546875, -2.0206298828125, -1.85107421875, -1.6815185546875, -1.511962890625, -1.3424072265625, -1.1728515625, -1.0032958984375, -0.833740234375, -0.6641845703125, -0.49462890625, -0.3250732421875, -0.155517578125, 0.0140380859375, 0.18359375, 0.3531494140625, 0.522705078125, 0.6922607421875, 0.86181640625, 1.0313720703125, 1.200927734375, 1.3704833984375, 1.5400390625, 1.7095947265625, 1.879150390625, 2.0487060546875, 2.21826171875, 2.3878173828125, 2.557373046875, 2.7269287109375, 2.896484375, 3.0660400390625, 3.235595703125, 3.4051513671875, 3.57470703125, 3.7442626953125, 3.913818359375, 4.0833740234375, 4.2529296875, 4.4224853515625, 4.592041015625, 4.7615966796875, 4.93115234375, 5.1007080078125, 5.270263671875, 5.4398193359375, 5.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 18.0, 21.0, 54.0, 123.0, 299.0, 903.0, 2602.0, 7171.0, 19202.0, 48034.0, 109813.0, 203741.0, 261448.0, 204860.0, 110514.0, 48812.0, 19508.0, 7328.0, 2658.0, 901.0, 325.0, 112.0, 58.0, 12.0, 12.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.94140625, -1.881683349609375, -1.82196044921875, -1.762237548828125, -1.7025146484375, -1.642791748046875, -1.58306884765625, -1.523345947265625, -1.463623046875, -1.403900146484375, -1.34417724609375, -1.284454345703125, -1.2247314453125, -1.165008544921875, -1.10528564453125, -1.045562744140625, -0.98583984375, -0.926116943359375, -0.86639404296875, -0.806671142578125, -0.7469482421875, -0.687225341796875, -0.62750244140625, -0.567779541015625, -0.508056640625, -0.448333740234375, -0.38861083984375, -0.328887939453125, -0.2691650390625, -0.209442138671875, -0.14971923828125, -0.089996337890625, -0.0302734375, 0.029449462890625, 0.08917236328125, 0.148895263671875, 0.2086181640625, 0.268341064453125, 0.32806396484375, 0.387786865234375, 0.447509765625, 0.507232666015625, 0.56695556640625, 0.626678466796875, 0.6864013671875, 0.746124267578125, 0.80584716796875, 0.865570068359375, 0.92529296875, 0.985015869140625, 1.04473876953125, 1.104461669921875, 1.1641845703125, 1.223907470703125, 1.28363037109375, 1.343353271484375, 1.403076171875, 1.462799072265625, 1.52252197265625, 1.582244873046875, 1.6419677734375, 1.701690673828125, 1.76141357421875, 1.821136474609375, 1.880859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 6.0, 7.0, 8.0, 13.0, 9.0, 9.0, 18.0, 14.0, 12.0, 10.0, 22.0, 22.0, 17.0, 24.0, 26.0, 36.0, 27.0, 30.0, 32.0, 44.0, 31.0, 25.0, 40.0, 1052.0, 39.0, 38.0, 32.0, 24.0, 36.0, 33.0, 28.0, 27.0, 31.0, 27.0, 29.0, 19.0, 11.0, 16.0, 15.0, 18.0, 10.0, 6.0, 8.0, 8.0, 7.0, 3.0, 6.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-4.12890625, -4.0068359375, -3.884765625, -3.7626953125, -3.640625, -3.5185546875, -3.396484375, -3.2744140625, -3.15234375, -3.0302734375, -2.908203125, -2.7861328125, -2.6640625, -2.5419921875, -2.419921875, -2.2978515625, -2.17578125, -2.0537109375, -1.931640625, -1.8095703125, -1.6875, -1.5654296875, -1.443359375, -1.3212890625, -1.19921875, -1.0771484375, -0.955078125, -0.8330078125, -0.7109375, -0.5888671875, -0.466796875, -0.3447265625, -0.22265625, -0.1005859375, 0.021484375, 0.1435546875, 0.265625, 0.3876953125, 0.509765625, 0.6318359375, 0.75390625, 0.8759765625, 0.998046875, 1.1201171875, 1.2421875, 1.3642578125, 1.486328125, 1.6083984375, 1.73046875, 1.8525390625, 1.974609375, 2.0966796875, 2.21875, 2.3408203125, 2.462890625, 2.5849609375, 2.70703125, 2.8291015625, 2.951171875, 3.0732421875, 3.1953125, 3.3173828125, 3.439453125, 3.5615234375, 3.68359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 7.0, 4.0, 4.0, 12.0, 20.0, 26.0, 41.0, 80.0, 130.0, 202.0, 380.0, 585.0, 1012.0, 1716.0, 2777.0, 4805.0, 8208.0, 14065.0, 23961.0, 43182.0, 1881922.0, 49798.0, 26582.0, 15285.0, 9179.0, 5305.0, 3140.0, 1885.0, 1114.0, 698.0, 408.0, 234.0, 146.0, 92.0, 43.0, 37.0, 19.0, 14.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.9859619140625, -1.925048828125, -1.8641357421875, -1.80322265625, -1.7423095703125, -1.681396484375, -1.6204833984375, -1.5595703125, -1.4986572265625, -1.437744140625, -1.3768310546875, -1.31591796875, -1.2550048828125, -1.194091796875, -1.1331787109375, -1.072265625, -1.0113525390625, -0.950439453125, -0.8895263671875, -0.82861328125, -0.7677001953125, -0.706787109375, -0.6458740234375, -0.5849609375, -0.5240478515625, -0.463134765625, -0.4022216796875, -0.34130859375, -0.2803955078125, -0.219482421875, -0.1585693359375, -0.09765625, -0.0367431640625, 0.024169921875, 0.0850830078125, 0.14599609375, 0.2069091796875, 0.267822265625, 0.3287353515625, 0.3896484375, 0.4505615234375, 0.511474609375, 0.5723876953125, 0.63330078125, 0.6942138671875, 0.755126953125, 0.8160400390625, 0.876953125, 0.9378662109375, 0.998779296875, 1.0596923828125, 1.12060546875, 1.1815185546875, 1.242431640625, 1.3033447265625, 1.3642578125, 1.4251708984375, 1.486083984375, 1.5469970703125, 1.60791015625, 1.6688232421875, 1.729736328125, 1.7906494140625, 1.8515625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 3.0, 8.0, 8.0, 3.0, 17.0, 19.0, 57.0, 109.0, 222.0, 261.0, 137.0, 49.0, 24.0, 16.0, 8.0, 10.0, 9.0, 10.0, 0.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.172607421875, -0.1679515838623047, -0.16329574584960938, -0.15863990783691406, -0.15398406982421875, -0.14932823181152344, -0.14467239379882812, -0.1400165557861328, -0.1353607177734375, -0.1307048797607422, -0.12604904174804688, -0.12139320373535156, -0.11673736572265625, -0.11208152770996094, -0.10742568969726562, -0.10276985168457031, -0.098114013671875, -0.09345817565917969, -0.08880233764648438, -0.08414649963378906, -0.07949066162109375, -0.07483482360839844, -0.07017898559570312, -0.06552314758300781, -0.0608673095703125, -0.05621147155761719, -0.051555633544921875, -0.04689979553222656, -0.04224395751953125, -0.03758811950683594, -0.032932281494140625, -0.028276443481445312, -0.02362060546875, -0.018964767456054688, -0.014308929443359375, -0.009653091430664062, -0.00499725341796875, -0.0003414154052734375, 0.004314422607421875, 0.008970260620117188, 0.0136260986328125, 0.018281936645507812, 0.022937774658203125, 0.027593612670898438, 0.03224945068359375, 0.03690528869628906, 0.041561126708984375, 0.04621696472167969, 0.050872802734375, 0.05552864074707031, 0.060184478759765625, 0.06484031677246094, 0.06949615478515625, 0.07415199279785156, 0.07880783081054688, 0.08346366882324219, 0.0881195068359375, 0.09277534484863281, 0.09743118286132812, 0.10208702087402344, 0.10674285888671875, 0.11139869689941406, 0.11605453491210938, 0.12071037292480469, 0.1253662109375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 2.0, 6.0, 8.0, 13.0, 14.0, 20.0, 58.0, 115.0, 383.0, 1247.0, 5296.0, 403184.0, 631054.0, 5216.0, 1273.0, 400.0, 122.0, 43.0, 20.0, 13.0, 12.0, 9.0, 8.0, 5.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9638671875, -1.8911590576171875, -1.818450927734375, -1.7457427978515625, -1.67303466796875, -1.6003265380859375, -1.527618408203125, -1.4549102783203125, -1.3822021484375, -1.3094940185546875, -1.236785888671875, -1.1640777587890625, -1.09136962890625, -1.0186614990234375, -0.945953369140625, -0.8732452392578125, -0.800537109375, -0.7278289794921875, -0.655120849609375, -0.5824127197265625, -0.50970458984375, -0.4369964599609375, -0.364288330078125, -0.2915802001953125, -0.2188720703125, -0.1461639404296875, -0.073455810546875, -0.0007476806640625, 0.07196044921875, 0.1446685791015625, 0.217376708984375, 0.2900848388671875, 0.36279296875, 0.4355010986328125, 0.508209228515625, 0.5809173583984375, 0.65362548828125, 0.7263336181640625, 0.799041748046875, 0.8717498779296875, 0.9444580078125, 1.0171661376953125, 1.089874267578125, 1.1625823974609375, 1.23529052734375, 1.3079986572265625, 1.380706787109375, 1.4534149169921875, 1.526123046875, 1.5988311767578125, 1.671539306640625, 1.7442474365234375, 1.81695556640625, 1.8896636962890625, 1.962371826171875, 2.0350799560546875, 2.1077880859375, 2.1804962158203125, 2.253204345703125, 2.3259124755859375, 2.39862060546875, 2.4713287353515625, 2.544036865234375, 2.6167449951171875, 2.689453125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 3.0, 14.0, 32.0, 69.0, 130.0, 246.0, 255.0, 108.0, 62.0, 34.0, 13.0, 8.0, 9.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3813701868057251, -0.3655206263065338, -0.34967106580734253, -0.33382150530815125, -0.31797194480895996, -0.3021223843097687, -0.2862728238105774, -0.2704232633113861, -0.2545737028121948, -0.23872414231300354, -0.22287458181381226, -0.20702502131462097, -0.1911754608154297, -0.1753259003162384, -0.15947633981704712, -0.14362677931785583, -0.12777721881866455, -0.11192765831947327, -0.09607809782028198, -0.0802285373210907, -0.06437897682189941, -0.04852941632270813, -0.032679855823516846, -0.01683029532432556, -0.0009807348251342773, 0.014868825674057007, 0.03071838617324829, 0.046567946672439575, 0.06241750717163086, 0.07826706767082214, 0.09411662817001343, 0.10996618866920471, 0.12581580877304077, 0.14166536927223206, 0.15751492977142334, 0.17336449027061462, 0.1892140507698059, 0.2050636112689972, 0.22091317176818848, 0.23676273226737976, 0.25261229276657104, 0.26846185326576233, 0.2843114137649536, 0.3001609742641449, 0.3160105347633362, 0.33186009526252747, 0.34770965576171875, 0.36355921626091003, 0.3794087767601013, 0.3952583372592926, 0.4111078977584839, 0.42695745825767517, 0.44280701875686646, 0.45865657925605774, 0.474506139755249, 0.4903557002544403, 0.5062052607536316, 0.5220547914505005, 0.5379043817520142, 0.5537539720535278, 0.5696035027503967, 0.5854530334472656, 0.6013026237487793, 0.617152214050293, 0.6330017447471619]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 3.0, 5.0, 7.0, 11.0, 18.0, 13.0, 18.0, 18.0, 17.0, 23.0, 19.0, 34.0, 30.0, 35.0, 46.0, 46.0, 29.0, 40.0, 46.0, 48.0, 43.0, 36.0, 38.0, 35.0, 42.0, 31.0, 35.0, 36.0, 28.0, 24.0, 22.0, 18.0, 12.0, 8.0, 18.0, 12.0, 11.0, 8.0, 5.0, 3.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1923372745513916, -0.1863102912902832, -0.1802832931280136, -0.1742563098669052, -0.16822931170463562, -0.16220232844352722, -0.15617534518241882, -0.15014834702014923, -0.14412134885787964, -0.13809436559677124, -0.13206736743450165, -0.12604038417339325, -0.12001338601112366, -0.11398640275001526, -0.10795941203832626, -0.10193242132663727, -0.09590543806552887, -0.08987844735383987, -0.08385145664215088, -0.07782447338104248, -0.07179747521877289, -0.06577049195766449, -0.059743501245975494, -0.0537165105342865, -0.047689519822597504, -0.04166252911090851, -0.03563553839921951, -0.029608551412820816, -0.02358156070113182, -0.017554569989442825, -0.011527583003044128, -0.005500592291355133, 0.0005263984203338623, 0.006553388200700283, 0.012580377981066704, 0.01860736683011055, 0.024634357541799545, 0.03066134825348854, 0.03668833523988724, 0.04271532595157623, 0.04874231666326523, 0.054769307374954224, 0.06079629808664322, 0.06682328879833221, 0.07285027205944061, 0.0788772702217102, 0.0849042534828186, 0.0909312441945076, 0.0969582349061966, 0.10298522561788559, 0.10901221632957458, 0.11503919959068298, 0.12106619775295258, 0.12709318101406097, 0.13312017917633057, 0.13914716243743896, 0.14517414569854736, 0.15120112895965576, 0.15722812712192535, 0.16325511038303375, 0.16928210854530334, 0.17530909180641174, 0.18133607506752014, 0.18736307322978973, 0.19339007139205933]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 3.0, 8.0, 6.0, 10.0, 6.0, 14.0, 11.0, 15.0, 22.0, 17.0, 23.0, 19.0, 31.0, 31.0, 38.0, 39.0, 32.0, 41.0, 36.0, 40.0, 38.0, 37.0, 47.0, 36.0, 29.0, 37.0, 33.0, 24.0, 29.0, 33.0, 30.0, 27.0, 25.0, 17.0, 13.0, 19.0, 18.0, 11.0, 7.0, 8.0, 10.0, 3.0, 11.0, 5.0, 8.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.23046875, -5.06439208984375, -4.8983154296875, -4.73223876953125, -4.566162109375, -4.40008544921875, -4.2340087890625, -4.06793212890625, -3.90185546875, -3.73577880859375, -3.5697021484375, -3.40362548828125, -3.237548828125, -3.07147216796875, -2.9053955078125, -2.73931884765625, -2.5732421875, -2.40716552734375, -2.2410888671875, -2.07501220703125, -1.908935546875, -1.74285888671875, -1.5767822265625, -1.41070556640625, -1.24462890625, -1.07855224609375, -0.9124755859375, -0.74639892578125, -0.580322265625, -0.41424560546875, -0.2481689453125, -0.08209228515625, 0.083984375, 0.25006103515625, 0.4161376953125, 0.58221435546875, 0.748291015625, 0.91436767578125, 1.0804443359375, 1.24652099609375, 1.41259765625, 1.57867431640625, 1.7447509765625, 1.91082763671875, 2.076904296875, 2.24298095703125, 2.4090576171875, 2.57513427734375, 2.7412109375, 2.90728759765625, 3.0733642578125, 3.23944091796875, 3.405517578125, 3.57159423828125, 3.7376708984375, 3.90374755859375, 4.06982421875, 4.23590087890625, 4.4019775390625, 4.56805419921875, 4.734130859375, 4.90020751953125, 5.0662841796875, 5.23236083984375, 5.3984375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 12.0, 15.0, 20.0, 41.0, 53.0, 67.0, 117.0, 182.0, 283.0, 509.0, 820.0, 1511.0, 2660.0, 5160.0, 10397.0, 21955.0, 46232.0, 92325.0, 174639.0, 303635.0, 189693.0, 99706.0, 50641.0, 23990.0, 11450.0, 5704.0, 2867.0, 1526.0, 939.0, 480.0, 328.0, 221.0, 127.0, 73.0, 43.0, 38.0, 27.0, 16.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.578125, -5.3828125, -5.1875, -4.9921875, -4.796875, -4.6015625, -4.40625, -4.2109375, -4.015625, -3.8203125, -3.625, -3.4296875, -3.234375, -3.0390625, -2.84375, -2.6484375, -2.453125, -2.2578125, -2.0625, -1.8671875, -1.671875, -1.4765625, -1.28125, -1.0859375, -0.890625, -0.6953125, -0.5, -0.3046875, -0.109375, 0.0859375, 0.28125, 0.4765625, 0.671875, 0.8671875, 1.0625, 1.2578125, 1.453125, 1.6484375, 1.84375, 2.0390625, 2.234375, 2.4296875, 2.625, 2.8203125, 3.015625, 3.2109375, 3.40625, 3.6015625, 3.796875, 3.9921875, 4.1875, 4.3828125, 4.578125, 4.7734375, 4.96875, 5.1640625, 5.359375, 5.5546875, 5.75, 5.9453125, 6.140625, 6.3359375, 6.53125, 6.7265625, 6.921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 13.0, 9.0, 6.0, 11.0, 6.0, 10.0, 10.0, 14.0, 23.0, 25.0, 17.0, 23.0, 20.0, 26.0, 46.0, 28.0, 36.0, 53.0, 96.0, 147.0, 274.0, 1383.0, 221.0, 108.0, 66.0, 40.0, 35.0, 34.0, 34.0, 28.0, 37.0, 18.0, 24.0, 17.0, 12.0, 12.0, 10.0, 9.0, 11.0, 11.0, 11.0, 7.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-18.875, -18.308349609375, -17.74169921875, -17.175048828125, -16.6083984375, -16.041748046875, -15.47509765625, -14.908447265625, -14.341796875, -13.775146484375, -13.20849609375, -12.641845703125, -12.0751953125, -11.508544921875, -10.94189453125, -10.375244140625, -9.80859375, -9.241943359375, -8.67529296875, -8.108642578125, -7.5419921875, -6.975341796875, -6.40869140625, -5.842041015625, -5.275390625, -4.708740234375, -4.14208984375, -3.575439453125, -3.0087890625, -2.442138671875, -1.87548828125, -1.308837890625, -0.7421875, -0.175537109375, 0.39111328125, 0.957763671875, 1.5244140625, 2.091064453125, 2.65771484375, 3.224365234375, 3.791015625, 4.357666015625, 4.92431640625, 5.490966796875, 6.0576171875, 6.624267578125, 7.19091796875, 7.757568359375, 8.32421875, 8.890869140625, 9.45751953125, 10.024169921875, 10.5908203125, 11.157470703125, 11.72412109375, 12.290771484375, 12.857421875, 13.424072265625, 13.99072265625, 14.557373046875, 15.1240234375, 15.690673828125, 16.25732421875, 16.823974609375, 17.390625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 10.0, 7.0, 18.0, 12.0, 16.0, 21.0, 35.0, 36.0, 55.0, 49.0, 92.0, 132.0, 190.0, 335.0, 660.0, 1563.0, 10612.0, 2713261.0, 411914.0, 4215.0, 1106.0, 508.0, 267.0, 156.0, 119.0, 81.0, 46.0, 39.0, 37.0, 26.0, 27.0, 23.0, 10.0, 8.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.125, -55.43603515625, -53.7470703125, -52.05810546875, -50.369140625, -48.68017578125, -46.9912109375, -45.30224609375, -43.61328125, -41.92431640625, -40.2353515625, -38.54638671875, -36.857421875, -35.16845703125, -33.4794921875, -31.79052734375, -30.1015625, -28.41259765625, -26.7236328125, -25.03466796875, -23.345703125, -21.65673828125, -19.9677734375, -18.27880859375, -16.58984375, -14.90087890625, -13.2119140625, -11.52294921875, -9.833984375, -8.14501953125, -6.4560546875, -4.76708984375, -3.078125, -1.38916015625, 0.2998046875, 1.98876953125, 3.677734375, 5.36669921875, 7.0556640625, 8.74462890625, 10.43359375, 12.12255859375, 13.8115234375, 15.50048828125, 17.189453125, 18.87841796875, 20.5673828125, 22.25634765625, 23.9453125, 25.63427734375, 27.3232421875, 29.01220703125, 30.701171875, 32.39013671875, 34.0791015625, 35.76806640625, 37.45703125, 39.14599609375, 40.8349609375, 42.52392578125, 44.212890625, 45.90185546875, 47.5908203125, 49.27978515625, 50.96875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 44.0, 132.0, 320.0, 318.0, 150.0, 38.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.1971893310547, -170.90866088867188, -167.62014770507812, -164.3316192626953, -161.0430908203125, -157.7545623779297, -154.46603393554688, -151.17752075195312, -147.8889923095703, -144.6004638671875, -141.31195068359375, -138.02342224121094, -134.73489379882812, -131.4463653564453, -128.1578369140625, -124.86932373046875, -121.58079528808594, -118.29226684570312, -115.00374603271484, -111.71522521972656, -108.42669677734375, -105.13816833496094, -101.84964752197266, -98.56112670898438, -95.27259826660156, -91.98406982421875, -88.69554901123047, -85.40702819824219, -82.11849975585938, -78.82997131347656, -75.54145050048828, -72.2529296875, -68.96440124511719, -65.67587280273438, -62.387351989746094, -59.09882736206055, -55.810302734375, -52.52177810668945, -49.233253479003906, -45.94472885131836, -42.65620422363281, -39.367679595947266, -36.07915496826172, -32.79063034057617, -29.502105712890625, -26.213581085205078, -22.92505645751953, -19.636531829833984, -16.348007202148438, -13.05948257446289, -9.770957946777344, -6.482433319091797, -3.19390869140625, 0.09461593627929688, 3.3831405639648438, 6.671665191650391, 9.960189819335938, 13.248714447021484, 16.53723907470703, 19.825763702392578, 23.114288330078125, 26.402812957763672, 29.69133758544922, 32.979862213134766, 36.26838684082031]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 9.0, 4.0, 6.0, 11.0, 14.0, 10.0, 24.0, 17.0, 19.0, 22.0, 25.0, 24.0, 37.0, 33.0, 40.0, 36.0, 42.0, 41.0, 54.0, 31.0, 38.0, 50.0, 30.0, 39.0, 52.0, 29.0, 32.0, 32.0, 24.0, 24.0, 20.0, 25.0, 16.0, 13.0, 17.0, 14.0, 8.0, 6.0, 11.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-57.29645919799805, -55.64466094970703, -53.992862701416016, -52.341064453125, -50.689266204833984, -49.03746795654297, -47.38566970825195, -45.73387145996094, -44.08207321166992, -42.430274963378906, -40.77847671508789, -39.126678466796875, -37.47488021850586, -35.823081970214844, -34.17128372192383, -32.51948547363281, -30.867687225341797, -29.21588897705078, -27.564090728759766, -25.91229248046875, -24.260494232177734, -22.60869598388672, -20.956897735595703, -19.305099487304688, -17.653301239013672, -16.001502990722656, -14.34970474243164, -12.697906494140625, -11.04610824584961, -9.394309997558594, -7.742511749267578, -6.0907135009765625, -4.438915252685547, -2.7871170043945312, -1.1353187561035156, 0.5164794921875, 2.1682777404785156, 3.8200759887695312, 5.471874237060547, 7.1236724853515625, 8.775470733642578, 10.427268981933594, 12.07906723022461, 13.730865478515625, 15.38266372680664, 17.034461975097656, 18.686260223388672, 20.338058471679688, 21.989856719970703, 23.64165496826172, 25.293453216552734, 26.94525146484375, 28.597049713134766, 30.24884796142578, 31.900646209716797, 33.55244445800781, 35.20424270629883, 36.856040954589844, 38.50783920288086, 40.159637451171875, 41.81143569946289, 43.463233947753906, 45.11503219604492, 46.76683044433594, 48.41862869262695]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 7.0, 9.0, 10.0, 17.0, 8.0, 17.0, 16.0, 30.0, 24.0, 24.0, 39.0, 36.0, 25.0, 32.0, 34.0, 33.0, 26.0, 47.0, 33.0, 38.0, 40.0, 30.0, 40.0, 40.0, 38.0, 30.0, 23.0, 25.0, 23.0, 29.0, 19.0, 30.0, 19.0, 14.0, 10.0, 11.0, 8.0, 12.0, 6.0, 6.0, 8.0, 3.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-5.8046875, -5.630126953125, -5.45556640625, -5.281005859375, -5.1064453125, -4.931884765625, -4.75732421875, -4.582763671875, -4.408203125, -4.233642578125, -4.05908203125, -3.884521484375, -3.7099609375, -3.535400390625, -3.36083984375, -3.186279296875, -3.01171875, -2.837158203125, -2.66259765625, -2.488037109375, -2.3134765625, -2.138916015625, -1.96435546875, -1.789794921875, -1.615234375, -1.440673828125, -1.26611328125, -1.091552734375, -0.9169921875, -0.742431640625, -0.56787109375, -0.393310546875, -0.21875, -0.044189453125, 0.13037109375, 0.304931640625, 0.4794921875, 0.654052734375, 0.82861328125, 1.003173828125, 1.177734375, 1.352294921875, 1.52685546875, 1.701416015625, 1.8759765625, 2.050537109375, 2.22509765625, 2.399658203125, 2.57421875, 2.748779296875, 2.92333984375, 3.097900390625, 3.2724609375, 3.447021484375, 3.62158203125, 3.796142578125, 3.970703125, 4.145263671875, 4.31982421875, 4.494384765625, 4.6689453125, 4.843505859375, 5.01806640625, 5.192626953125, 5.3671875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 9.0, 11.0, 6.0, 13.0, 22.0, 17.0, 21.0, 33.0, 52.0, 48.0, 71.0, 121.0, 214.0, 389.0, 972.0, 3002.0, 10871.0, 44136.0, 184033.0, 705256.0, 1648624.0, 1142514.0, 341971.0, 83466.0, 20087.0, 5267.0, 1602.0, 577.0, 256.0, 159.0, 112.0, 81.0, 45.0, 38.0, 27.0, 34.0, 28.0, 25.0, 14.0, 18.0, 5.0, 11.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8204345703125, -8.523681640625, -8.2269287109375, -7.93017578125, -7.6334228515625, -7.336669921875, -7.0399169921875, -6.7431640625, -6.4464111328125, -6.149658203125, -5.8529052734375, -5.55615234375, -5.2593994140625, -4.962646484375, -4.6658935546875, -4.369140625, -4.0723876953125, -3.775634765625, -3.4788818359375, -3.18212890625, -2.8853759765625, -2.588623046875, -2.2918701171875, -1.9951171875, -1.6983642578125, -1.401611328125, -1.1048583984375, -0.80810546875, -0.5113525390625, -0.214599609375, 0.0821533203125, 0.37890625, 0.6756591796875, 0.972412109375, 1.2691650390625, 1.56591796875, 1.8626708984375, 2.159423828125, 2.4561767578125, 2.7529296875, 3.0496826171875, 3.346435546875, 3.6431884765625, 3.93994140625, 4.2366943359375, 4.533447265625, 4.8302001953125, 5.126953125, 5.4237060546875, 5.720458984375, 6.0172119140625, 6.31396484375, 6.6107177734375, 6.907470703125, 7.2042236328125, 7.5009765625, 7.7977294921875, 8.094482421875, 8.3912353515625, 8.68798828125, 8.9847412109375, 9.281494140625, 9.5782470703125, 9.875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 8.0, 11.0, 13.0, 15.0, 22.0, 33.0, 30.0, 44.0, 56.0, 76.0, 83.0, 138.0, 187.0, 226.0, 316.0, 313.0, 396.0, 382.0, 351.0, 287.0, 223.0, 196.0, 167.0, 107.0, 87.0, 71.0, 60.0, 36.0, 27.0, 29.0, 21.0, 17.0, 11.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.953125, -11.611572265625, -11.27001953125, -10.928466796875, -10.5869140625, -10.245361328125, -9.90380859375, -9.562255859375, -9.220703125, -8.879150390625, -8.53759765625, -8.196044921875, -7.8544921875, -7.512939453125, -7.17138671875, -6.829833984375, -6.48828125, -6.146728515625, -5.80517578125, -5.463623046875, -5.1220703125, -4.780517578125, -4.43896484375, -4.097412109375, -3.755859375, -3.414306640625, -3.07275390625, -2.731201171875, -2.3896484375, -2.048095703125, -1.70654296875, -1.364990234375, -1.0234375, -0.681884765625, -0.34033203125, 0.001220703125, 0.3427734375, 0.684326171875, 1.02587890625, 1.367431640625, 1.708984375, 2.050537109375, 2.39208984375, 2.733642578125, 3.0751953125, 3.416748046875, 3.75830078125, 4.099853515625, 4.44140625, 4.782958984375, 5.12451171875, 5.466064453125, 5.8076171875, 6.149169921875, 6.49072265625, 6.832275390625, 7.173828125, 7.515380859375, 7.85693359375, 8.198486328125, 8.5400390625, 8.881591796875, 9.22314453125, 9.564697265625, 9.90625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 13.0, 17.0, 24.0, 23.0, 37.0, 61.0, 45.0, 74.0, 111.0, 131.0, 205.0, 274.0, 432.0, 1853.0, 191457.0, 3871984.0, 124739.0, 1490.0, 405.0, 240.0, 175.0, 101.0, 91.0, 57.0, 55.0, 32.0, 34.0, 28.0, 18.0, 12.0, 12.0, 9.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.46875, -41.94140625, -40.4140625, -38.88671875, -37.359375, -35.83203125, -34.3046875, -32.77734375, -31.25, -29.72265625, -28.1953125, -26.66796875, -25.140625, -23.61328125, -22.0859375, -20.55859375, -19.03125, -17.50390625, -15.9765625, -14.44921875, -12.921875, -11.39453125, -9.8671875, -8.33984375, -6.8125, -5.28515625, -3.7578125, -2.23046875, -0.703125, 0.82421875, 2.3515625, 3.87890625, 5.40625, 6.93359375, 8.4609375, 9.98828125, 11.515625, 13.04296875, 14.5703125, 16.09765625, 17.625, 19.15234375, 20.6796875, 22.20703125, 23.734375, 25.26171875, 26.7890625, 28.31640625, 29.84375, 31.37109375, 32.8984375, 34.42578125, 35.953125, 37.48046875, 39.0078125, 40.53515625, 42.0625, 43.58984375, 45.1171875, 46.64453125, 48.171875, 49.69921875, 51.2265625, 52.75390625, 54.28125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 29.0, 116.0, 276.0, 337.0, 190.0, 57.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.87823486328125, -312.1028137207031, -306.327392578125, -300.5519714355469, -294.77655029296875, -289.0011291503906, -283.2257080078125, -277.4503173828125, -271.67486572265625, -265.8994445800781, -260.1240234375, -254.34860229492188, -248.57318115234375, -242.7977752685547, -237.02235412597656, -231.24693298339844, -225.47152709960938, -219.69610595703125, -213.92068481445312, -208.145263671875, -202.36984252929688, -196.5944366455078, -190.8190155029297, -185.04359436035156, -179.26817321777344, -173.4927520751953, -167.7173309326172, -161.94190979003906, -156.16650390625, -150.39108276367188, -144.61566162109375, -138.84024047851562, -133.06480407714844, -127.28938293457031, -121.51396179199219, -115.7385482788086, -109.96312713623047, -104.18770599365234, -98.41229248046875, -92.63687133789062, -86.8614501953125, -81.08602905273438, -75.31060791015625, -69.53519439697266, -63.75977325439453, -57.984352111816406, -52.20893478393555, -46.43351745605469, -40.65809631347656, -34.88267517089844, -29.107257843017578, -23.331838607788086, -17.556419372558594, -11.781000137329102, -6.005580902099609, -0.23016357421875, 5.545257568359375, 11.320676803588867, 17.09609603881836, 22.87151527404785, 28.646934509277344, 34.42235565185547, 40.19777297973633, 45.97319030761719, 51.74861145019531]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 5.0, 8.0, 9.0, 9.0, 8.0, 23.0, 26.0, 25.0, 26.0, 32.0, 28.0, 36.0, 32.0, 41.0, 49.0, 41.0, 46.0, 51.0, 45.0, 36.0, 32.0, 36.0, 36.0, 46.0, 36.0, 34.0, 33.0, 22.0, 18.0, 28.0, 13.0, 16.0, 14.0, 10.0, 8.0, 11.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.1520881652832, -44.73635482788086, -43.320621490478516, -41.90488815307617, -40.48915481567383, -39.073421478271484, -37.657691955566406, -36.24195861816406, -34.82622528076172, -33.410491943359375, -31.99475860595703, -30.579025268554688, -29.163291931152344, -27.74755859375, -26.33182716369629, -24.916093826293945, -23.50035858154297, -22.084625244140625, -20.66889190673828, -19.253158569335938, -17.837425231933594, -16.42169189453125, -15.005960464477539, -13.590227127075195, -12.174493789672852, -10.758760452270508, -9.343027114868164, -7.927294731140137, -6.511561393737793, -5.095828056335449, -3.680095672607422, -2.264362335205078, -0.8486328125, 0.5671002864837646, 1.9828333854675293, 3.398566246032715, 4.814299583435059, 6.230032920837402, 7.64576530456543, 9.061498641967773, 10.477231979370117, 11.892965316772461, 13.308698654174805, 14.724431037902832, 16.14016342163086, 17.555896759033203, 18.971630096435547, 20.38736343383789, 21.803096771240234, 23.218830108642578, 24.634563446044922, 26.050296783447266, 27.46603012084961, 28.881763458251953, 30.297494888305664, 31.713228225708008, 33.12895965576172, 34.54469299316406, 35.960426330566406, 37.37615966796875, 38.791893005371094, 40.20762634277344, 41.62335968017578, 43.039093017578125, 44.45482635498047]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 5.0, 8.0, 7.0, 10.0, 21.0, 15.0, 18.0, 14.0, 20.0, 27.0, 35.0, 22.0, 30.0, 33.0, 38.0, 27.0, 34.0, 36.0, 42.0, 30.0, 38.0, 34.0, 45.0, 36.0, 34.0, 26.0, 27.0, 31.0, 29.0, 20.0, 23.0, 23.0, 20.0, 26.0, 23.0, 14.0, 15.0, 8.0, 8.0, 5.0, 7.0, 8.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.7596435546875, -4.597412109375, -4.4351806640625, -4.27294921875, -4.1107177734375, -3.948486328125, -3.7862548828125, -3.6240234375, -3.4617919921875, -3.299560546875, -3.1373291015625, -2.97509765625, -2.8128662109375, -2.650634765625, -2.4884033203125, -2.326171875, -2.1639404296875, -2.001708984375, -1.8394775390625, -1.67724609375, -1.5150146484375, -1.352783203125, -1.1905517578125, -1.0283203125, -0.8660888671875, -0.703857421875, -0.5416259765625, -0.37939453125, -0.2171630859375, -0.054931640625, 0.1072998046875, 0.26953125, 0.4317626953125, 0.593994140625, 0.7562255859375, 0.91845703125, 1.0806884765625, 1.242919921875, 1.4051513671875, 1.5673828125, 1.7296142578125, 1.891845703125, 2.0540771484375, 2.21630859375, 2.3785400390625, 2.540771484375, 2.7030029296875, 2.865234375, 3.0274658203125, 3.189697265625, 3.3519287109375, 3.51416015625, 3.6763916015625, 3.838623046875, 4.0008544921875, 4.1630859375, 4.3253173828125, 4.487548828125, 4.6497802734375, 4.81201171875, 4.9742431640625, 5.136474609375, 5.2987060546875, 5.4609375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 9.0, 10.0, 20.0, 36.0, 38.0, 68.0, 129.0, 157.0, 258.0, 426.0, 605.0, 977.0, 1447.0, 2190.0, 3442.0, 5009.0, 7740.0, 11286.0, 16674.0, 23319.0, 33546.0, 46281.0, 61262.0, 78844.0, 95281.0, 108105.0, 110801.0, 102474.0, 86755.0, 69788.0, 53173.0, 39036.0, 28444.0, 19613.0, 13620.0, 9259.0, 6289.0, 4146.0, 2738.0, 1857.0, 1227.0, 753.0, 524.0, 311.0, 213.0, 131.0, 89.0, 55.0, 40.0, 24.0, 17.0, 9.0, 4.0, 6.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.71240234375, -0.6880416870117188, -0.6636810302734375, -0.6393203735351562, -0.614959716796875, -0.5905990600585938, -0.5662384033203125, -0.5418777465820312, -0.51751708984375, -0.49315643310546875, -0.4687957763671875, -0.44443511962890625, -0.420074462890625, -0.39571380615234375, -0.3713531494140625, -0.34699249267578125, -0.3226318359375, -0.29827117919921875, -0.2739105224609375, -0.24954986572265625, -0.225189208984375, -0.20082855224609375, -0.1764678955078125, -0.15210723876953125, -0.12774658203125, -0.10338592529296875, -0.0790252685546875, -0.05466461181640625, -0.030303955078125, -0.00594329833984375, 0.0184173583984375, 0.04277801513671875, 0.067138671875, 0.09149932861328125, 0.1158599853515625, 0.14022064208984375, 0.164581298828125, 0.18894195556640625, 0.2133026123046875, 0.23766326904296875, 0.26202392578125, 0.28638458251953125, 0.3107452392578125, 0.33510589599609375, 0.359466552734375, 0.38382720947265625, 0.4081878662109375, 0.43254852294921875, 0.4569091796875, 0.48126983642578125, 0.5056304931640625, 0.5299911499023438, 0.554351806640625, 0.5787124633789062, 0.6030731201171875, 0.6274337768554688, 0.65179443359375, 0.6761550903320312, 0.7005157470703125, 0.7248764038085938, 0.749237060546875, 0.7735977172851562, 0.7979583740234375, 0.8223190307617188, 0.8466796875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 10.0, 4.0, 4.0, 9.0, 10.0, 10.0, 17.0, 16.0, 19.0, 26.0, 34.0, 38.0, 36.0, 23.0, 29.0, 30.0, 38.0, 50.0, 46.0, 41.0, 1067.0, 40.0, 39.0, 41.0, 32.0, 41.0, 27.0, 42.0, 39.0, 30.0, 15.0, 27.0, 24.0, 16.0, 10.0, 14.0, 8.0, 6.0, 5.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.65234375, -4.50738525390625, -4.3624267578125, -4.21746826171875, -4.072509765625, -3.92755126953125, -3.7825927734375, -3.63763427734375, -3.49267578125, -3.34771728515625, -3.2027587890625, -3.05780029296875, -2.912841796875, -2.76788330078125, -2.6229248046875, -2.47796630859375, -2.3330078125, -2.18804931640625, -2.0430908203125, -1.89813232421875, -1.753173828125, -1.60821533203125, -1.4632568359375, -1.31829833984375, -1.17333984375, -1.02838134765625, -0.8834228515625, -0.73846435546875, -0.593505859375, -0.44854736328125, -0.3035888671875, -0.15863037109375, -0.013671875, 0.13128662109375, 0.2762451171875, 0.42120361328125, 0.566162109375, 0.71112060546875, 0.8560791015625, 1.00103759765625, 1.14599609375, 1.29095458984375, 1.4359130859375, 1.58087158203125, 1.725830078125, 1.87078857421875, 2.0157470703125, 2.16070556640625, 2.3056640625, 2.45062255859375, 2.5955810546875, 2.74053955078125, 2.885498046875, 3.03045654296875, 3.1754150390625, 3.32037353515625, 3.46533203125, 3.61029052734375, 3.7552490234375, 3.90020751953125, 4.045166015625, 4.19012451171875, 4.3350830078125, 4.48004150390625, 4.625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 7.0, 17.0, 22.0, 36.0, 35.0, 71.0, 92.0, 141.0, 208.0, 384.0, 545.0, 892.0, 1424.0, 2267.0, 3783.0, 6166.0, 10269.0, 17289.0, 29147.0, 56581.0, 1871926.0, 38117.0, 22700.0, 13775.0, 8147.0, 4935.0, 3103.0, 1899.0, 1156.0, 736.0, 440.0, 275.0, 186.0, 118.0, 68.0, 54.0, 35.0, 26.0, 19.0, 10.0, 6.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.84375, -1.788330078125, -1.73291015625, -1.677490234375, -1.6220703125, -1.566650390625, -1.51123046875, -1.455810546875, -1.400390625, -1.344970703125, -1.28955078125, -1.234130859375, -1.1787109375, -1.123291015625, -1.06787109375, -1.012451171875, -0.95703125, -0.901611328125, -0.84619140625, -0.790771484375, -0.7353515625, -0.679931640625, -0.62451171875, -0.569091796875, -0.513671875, -0.458251953125, -0.40283203125, -0.347412109375, -0.2919921875, -0.236572265625, -0.18115234375, -0.125732421875, -0.0703125, -0.014892578125, 0.04052734375, 0.095947265625, 0.1513671875, 0.206787109375, 0.26220703125, 0.317626953125, 0.373046875, 0.428466796875, 0.48388671875, 0.539306640625, 0.5947265625, 0.650146484375, 0.70556640625, 0.760986328125, 0.81640625, 0.871826171875, 0.92724609375, 0.982666015625, 1.0380859375, 1.093505859375, 1.14892578125, 1.204345703125, 1.259765625, 1.315185546875, 1.37060546875, 1.426025390625, 1.4814453125, 1.536865234375, 1.59228515625, 1.647705078125, 1.703125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 12.0, 8.0, 19.0, 12.0, 15.0, 16.0, 21.0, 43.0, 43.0, 69.0, 83.0, 113.0, 140.0, 88.0, 63.0, 54.0, 38.0, 39.0, 23.0, 22.0, 12.0, 10.0, 7.0, 11.0, 8.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050872802734375, -0.0488591194152832, -0.046845436096191406, -0.04483175277709961, -0.04281806945800781, -0.040804386138916016, -0.03879070281982422, -0.03677701950073242, -0.034763336181640625, -0.03274965286254883, -0.03073596954345703, -0.028722286224365234, -0.026708602905273438, -0.02469491958618164, -0.022681236267089844, -0.020667552947998047, -0.01865386962890625, -0.016640186309814453, -0.014626502990722656, -0.01261281967163086, -0.010599136352539062, -0.008585453033447266, -0.006571769714355469, -0.004558086395263672, -0.002544403076171875, -0.0005307197570800781, 0.0014829635620117188, 0.0034966468811035156, 0.0055103302001953125, 0.007524013519287109, 0.009537696838378906, 0.011551380157470703, 0.0135650634765625, 0.015578746795654297, 0.017592430114746094, 0.01960611343383789, 0.021619796752929688, 0.023633480072021484, 0.02564716339111328, 0.027660846710205078, 0.029674530029296875, 0.03168821334838867, 0.03370189666748047, 0.035715579986572266, 0.03772926330566406, 0.03974294662475586, 0.041756629943847656, 0.04377031326293945, 0.04578399658203125, 0.04779767990112305, 0.049811363220214844, 0.05182504653930664, 0.05383872985839844, 0.055852413177490234, 0.05786609649658203, 0.05987977981567383, 0.061893463134765625, 0.06390714645385742, 0.06592082977294922, 0.06793451309204102, 0.06994819641113281, 0.07196187973022461, 0.0739755630493164, 0.0759892463684082, 0.0780029296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 14.0, 14.0, 18.0, 27.0, 38.0, 66.0, 89.0, 191.0, 384.0, 2488.0, 1023419.0, 20513.0, 645.0, 245.0, 131.0, 71.0, 44.0, 31.0, 16.0, 19.0, 17.0, 10.0, 15.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.578125, -1.537353515625, -1.49658203125, -1.455810546875, -1.4150390625, -1.374267578125, -1.33349609375, -1.292724609375, -1.251953125, -1.211181640625, -1.17041015625, -1.129638671875, -1.0888671875, -1.048095703125, -1.00732421875, -0.966552734375, -0.92578125, -0.885009765625, -0.84423828125, -0.803466796875, -0.7626953125, -0.721923828125, -0.68115234375, -0.640380859375, -0.599609375, -0.558837890625, -0.51806640625, -0.477294921875, -0.4365234375, -0.395751953125, -0.35498046875, -0.314208984375, -0.2734375, -0.232666015625, -0.19189453125, -0.151123046875, -0.1103515625, -0.069580078125, -0.02880859375, 0.011962890625, 0.052734375, 0.093505859375, 0.13427734375, 0.175048828125, 0.2158203125, 0.256591796875, 0.29736328125, 0.338134765625, 0.37890625, 0.419677734375, 0.46044921875, 0.501220703125, 0.5419921875, 0.582763671875, 0.62353515625, 0.664306640625, 0.705078125, 0.745849609375, 0.78662109375, 0.827392578125, 0.8681640625, 0.908935546875, 0.94970703125, 0.990478515625, 1.03125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 58.0, 641.0, 287.0, 22.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3244344890117645, -0.30396637320518494, -0.28349825739860535, -0.26303011178970337, -0.24256199598312378, -0.2220938801765442, -0.2016257643699646, -0.18115763366222382, -0.16068951785564423, -0.14022140204906464, -0.11975327134132385, -0.09928515553474426, -0.07881703227758408, -0.05834890902042389, -0.0378807932138443, -0.017412662506103516, 0.0030554533004760742, 0.023523574694991112, 0.04399169608950615, 0.06445981562137604, 0.08492793887853622, 0.10539606213569641, 0.125864177942276, 0.14633230865001678, 0.16680042445659637, 0.18726854026317596, 0.20773667097091675, 0.22820478677749634, 0.24867290258407593, 0.2691410183906555, 0.2896091341972351, 0.3100772798061371, 0.3305453658103943, 0.3510134816169739, 0.37148159742355347, 0.39194971323013306, 0.41241785883903503, 0.4328859746456146, 0.4533540904521942, 0.4738222360610962, 0.4942903518676758, 0.5147584676742554, 0.535226583480835, 0.5556946992874146, 0.5761628150939941, 0.5966309309005737, 0.6170990467071533, 0.6375672221183777, 0.6580352783203125, 0.6785033941268921, 0.6989715099334717, 0.7194396257400513, 0.7399077415466309, 0.7603758573532104, 0.78084397315979, 0.8013121485710144, 0.821780264377594, 0.8422483801841736, 0.8627164959907532, 0.8831846117973328, 0.9036527276039124, 0.9241209030151367, 0.9445890188217163, 0.9650571346282959, 0.9855252504348755]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 0.0, 4.0, 6.0, 5.0, 6.0, 12.0, 12.0, 12.0, 12.0, 15.0, 16.0, 15.0, 17.0, 26.0, 25.0, 26.0, 21.0, 40.0, 28.0, 44.0, 30.0, 40.0, 43.0, 36.0, 23.0, 37.0, 39.0, 33.0, 32.0, 32.0, 25.0, 32.0, 28.0, 21.0, 22.0, 32.0, 21.0, 27.0, 15.0, 11.0, 16.0, 8.0, 7.0, 8.0, 7.0, 9.0, 6.0, 7.0, 5.0, 2.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08650553226470947, -0.08369187265634537, -0.08087821304798126, -0.07806454598903656, -0.07525088638067245, -0.07243722677230835, -0.06962355971336365, -0.06680990010499954, -0.06399624049663544, -0.06118258088827133, -0.05836891755461693, -0.055555254220962524, -0.05274159461259842, -0.049927935004234314, -0.04711427167057991, -0.04430060833692551, -0.0414869487285614, -0.038673289120197296, -0.03585962578654289, -0.03304596245288849, -0.030232302844524384, -0.02741864137351513, -0.024604979902505875, -0.02179131843149662, -0.018977656960487366, -0.01616399548947811, -0.013350334018468857, -0.010536672547459602, -0.007723011076450348, -0.0049093496054410934, -0.002095688134431839, 0.0007179733365774155, 0.00353163480758667, 0.006345296278595924, 0.009158957749605179, 0.011972619220614433, 0.014786280691623688, 0.017599942162632942, 0.020413603633642197, 0.02322726510465145, 0.026040926575660706, 0.02885458804666996, 0.031668249517679214, 0.03448191285133362, 0.03729557245969772, 0.04010923206806183, 0.04292289540171623, 0.045736558735370636, 0.04855021834373474, 0.051363877952098846, 0.05417754128575325, 0.056991204619407654, 0.05980486422777176, 0.06261852383613586, 0.06543219089508057, 0.06824585050344467, 0.07105951011180878, 0.07387316972017288, 0.07668682932853699, 0.07950049638748169, 0.0823141559958458, 0.0851278156042099, 0.0879414826631546, 0.09075514227151871, 0.09356880187988281]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 8.0, 8.0, 10.0, 12.0, 6.0, 14.0, 15.0, 18.0, 23.0, 20.0, 20.0, 22.0, 29.0, 39.0, 30.0, 28.0, 30.0, 40.0, 52.0, 42.0, 37.0, 47.0, 44.0, 35.0, 29.0, 30.0, 34.0, 23.0, 28.0, 33.0, 29.0, 31.0, 19.0, 16.0, 20.0, 18.0, 13.0, 8.0, 5.0, 10.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.36328125, -5.1910400390625, -5.018798828125, -4.8465576171875, -4.67431640625, -4.5020751953125, -4.329833984375, -4.1575927734375, -3.9853515625, -3.8131103515625, -3.640869140625, -3.4686279296875, -3.29638671875, -3.1241455078125, -2.951904296875, -2.7796630859375, -2.607421875, -2.4351806640625, -2.262939453125, -2.0906982421875, -1.91845703125, -1.7462158203125, -1.573974609375, -1.4017333984375, -1.2294921875, -1.0572509765625, -0.885009765625, -0.7127685546875, -0.54052734375, -0.3682861328125, -0.196044921875, -0.0238037109375, 0.1484375, 0.3206787109375, 0.492919921875, 0.6651611328125, 0.83740234375, 1.0096435546875, 1.181884765625, 1.3541259765625, 1.5263671875, 1.6986083984375, 1.870849609375, 2.0430908203125, 2.21533203125, 2.3875732421875, 2.559814453125, 2.7320556640625, 2.904296875, 3.0765380859375, 3.248779296875, 3.4210205078125, 3.59326171875, 3.7655029296875, 3.937744140625, 4.1099853515625, 4.2822265625, 4.4544677734375, 4.626708984375, 4.7989501953125, 4.97119140625, 5.1434326171875, 5.315673828125, 5.4879150390625, 5.66015625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 8.0, 6.0, 18.0, 21.0, 24.0, 55.0, 74.0, 158.0, 334.0, 603.0, 1168.0, 2230.0, 4358.0, 8222.0, 16013.0, 32970.0, 72681.0, 171246.0, 358472.0, 212027.0, 89413.0, 39423.0, 18788.0, 9717.0, 5143.0, 2569.0, 1335.0, 713.0, 344.0, 166.0, 103.0, 56.0, 27.0, 28.0, 14.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.48828125, -6.25335693359375, -6.0184326171875, -5.78350830078125, -5.548583984375, -5.31365966796875, -5.0787353515625, -4.84381103515625, -4.60888671875, -4.37396240234375, -4.1390380859375, -3.90411376953125, -3.669189453125, -3.43426513671875, -3.1993408203125, -2.96441650390625, -2.7294921875, -2.49456787109375, -2.2596435546875, -2.02471923828125, -1.789794921875, -1.55487060546875, -1.3199462890625, -1.08502197265625, -0.85009765625, -0.61517333984375, -0.3802490234375, -0.14532470703125, 0.089599609375, 0.32452392578125, 0.5594482421875, 0.79437255859375, 1.029296875, 1.26422119140625, 1.4991455078125, 1.73406982421875, 1.968994140625, 2.20391845703125, 2.4388427734375, 2.67376708984375, 2.90869140625, 3.14361572265625, 3.3785400390625, 3.61346435546875, 3.848388671875, 4.08331298828125, 4.3182373046875, 4.55316162109375, 4.7880859375, 5.02301025390625, 5.2579345703125, 5.49285888671875, 5.727783203125, 5.96270751953125, 6.1976318359375, 6.43255615234375, 6.66748046875, 6.90240478515625, 7.1373291015625, 7.37225341796875, 7.607177734375, 7.84210205078125, 8.0770263671875, 8.31195068359375, 8.546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 8.0, 12.0, 11.0, 19.0, 13.0, 27.0, 29.0, 28.0, 35.0, 32.0, 52.0, 49.0, 68.0, 104.0, 183.0, 339.0, 1354.0, 169.0, 97.0, 74.0, 50.0, 35.0, 47.0, 20.0, 31.0, 23.0, 26.0, 17.0, 13.0, 14.0, 12.0, 7.0, 11.0, 7.0, 6.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.234375, -23.562744140625, -22.89111328125, -22.219482421875, -21.5478515625, -20.876220703125, -20.20458984375, -19.532958984375, -18.861328125, -18.189697265625, -17.51806640625, -16.846435546875, -16.1748046875, -15.503173828125, -14.83154296875, -14.159912109375, -13.48828125, -12.816650390625, -12.14501953125, -11.473388671875, -10.8017578125, -10.130126953125, -9.45849609375, -8.786865234375, -8.115234375, -7.443603515625, -6.77197265625, -6.100341796875, -5.4287109375, -4.757080078125, -4.08544921875, -3.413818359375, -2.7421875, -2.070556640625, -1.39892578125, -0.727294921875, -0.0556640625, 0.615966796875, 1.28759765625, 1.959228515625, 2.630859375, 3.302490234375, 3.97412109375, 4.645751953125, 5.3173828125, 5.989013671875, 6.66064453125, 7.332275390625, 8.00390625, 8.675537109375, 9.34716796875, 10.018798828125, 10.6904296875, 11.362060546875, 12.03369140625, 12.705322265625, 13.376953125, 14.048583984375, 14.72021484375, 15.391845703125, 16.0634765625, 16.735107421875, 17.40673828125, 18.078369140625, 18.75]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 14.0, 15.0, 15.0, 11.0, 19.0, 21.0, 26.0, 33.0, 55.0, 73.0, 81.0, 100.0, 164.0, 236.0, 396.0, 977.0, 10128.0, 1387938.0, 1731365.0, 11643.0, 1010.0, 423.0, 258.0, 162.0, 125.0, 96.0, 71.0, 51.0, 47.0, 28.0, 25.0, 21.0, 21.0, 10.0, 8.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.69287109375, -37.2607421875, -35.82861328125, -34.396484375, -32.96435546875, -31.5322265625, -30.10009765625, -28.66796875, -27.23583984375, -25.8037109375, -24.37158203125, -22.939453125, -21.50732421875, -20.0751953125, -18.64306640625, -17.2109375, -15.77880859375, -14.3466796875, -12.91455078125, -11.482421875, -10.05029296875, -8.6181640625, -7.18603515625, -5.75390625, -4.32177734375, -2.8896484375, -1.45751953125, -0.025390625, 1.40673828125, 2.8388671875, 4.27099609375, 5.703125, 7.13525390625, 8.5673828125, 9.99951171875, 11.431640625, 12.86376953125, 14.2958984375, 15.72802734375, 17.16015625, 18.59228515625, 20.0244140625, 21.45654296875, 22.888671875, 24.32080078125, 25.7529296875, 27.18505859375, 28.6171875, 30.04931640625, 31.4814453125, 32.91357421875, 34.345703125, 35.77783203125, 37.2099609375, 38.64208984375, 40.07421875, 41.50634765625, 42.9384765625, 44.37060546875, 45.802734375, 47.23486328125, 48.6669921875, 50.09912109375, 51.53125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 20.0, 33.0, 67.0, 121.0, 147.0, 170.0, 173.0, 113.0, 71.0, 39.0, 31.0, 8.0, 9.0, 2.0, 1.0, 2.0, 1.0], "bins": [-77.54837036132812, -76.0772705078125, -74.60617065429688, -73.13507080078125, -71.66397094726562, -70.19287109375, -68.72177124023438, -67.25067901611328, -65.77957916259766, -64.30847930908203, -62.837379455566406, -61.36627960205078, -59.89518356323242, -58.4240837097168, -56.95298385620117, -55.48188400268555, -54.01078414916992, -52.5396842956543, -51.06858444213867, -49.59748840332031, -48.12638854980469, -46.65528869628906, -45.18418884277344, -43.71308898925781, -42.24198913574219, -40.77088928222656, -39.29978942871094, -37.82868957519531, -36.35759353637695, -34.88649368286133, -33.4153938293457, -31.944293975830078, -30.47319984436035, -29.002099990844727, -27.531002044677734, -26.05990219116211, -24.588802337646484, -23.117704391479492, -21.646604537963867, -20.175506591796875, -18.70440673828125, -17.233306884765625, -15.762208938598633, -14.291109085083008, -12.8200101852417, -11.34891128540039, -9.877811431884766, -8.406712532043457, -6.935613632202148, -5.46451473236084, -3.993415355682373, -2.5223159790039062, -1.0512170791625977, 0.41988182067871094, 1.890981674194336, 3.3620805740356445, 4.833179473876953, 6.304278373718262, 7.7753777503967285, 9.246477127075195, 10.717576026916504, 12.188674926757812, 13.659774780273438, 15.130873680114746, 16.601972579956055]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 7.0, 12.0, 16.0, 21.0, 12.0, 17.0, 21.0, 28.0, 26.0, 22.0, 25.0, 37.0, 39.0, 33.0, 29.0, 38.0, 34.0, 41.0, 38.0, 39.0, 34.0, 39.0, 53.0, 36.0, 38.0, 29.0, 23.0, 24.0, 18.0, 23.0, 23.0, 15.0, 17.0, 13.0, 11.0, 8.0, 4.0, 7.0, 8.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-42.895843505859375, -41.54581069946289, -40.195777893066406, -38.84574508666992, -37.49571228027344, -36.14567565917969, -34.79564666748047, -33.44561004638672, -32.095577239990234, -30.74554443359375, -29.395511627197266, -28.04547882080078, -26.695444107055664, -25.34541130065918, -23.995378494262695, -22.645343780517578, -21.295312881469727, -19.945280075073242, -18.595247268676758, -17.24521255493164, -15.895179748535156, -14.545146942138672, -13.195114135742188, -11.845080375671387, -10.495047569274902, -9.145014762878418, -7.794981002807617, -6.444948196411133, -5.09491491317749, -3.7448816299438477, -2.3948488235473633, -1.0448150634765625, 0.3052177429199219, 1.655250906944275, 3.005284070968628, 4.355317115783691, 5.705350399017334, 7.055383682250977, 8.405416488647461, 9.755450248718262, 11.105483055114746, 12.45551586151123, 13.805549621582031, 15.155582427978516, 16.505615234375, 17.855648040771484, 19.20568084716797, 20.555715560913086, 21.90574836730957, 23.255781173706055, 24.60581398010254, 25.955848693847656, 27.30588150024414, 28.655914306640625, 30.00594711303711, 31.355979919433594, 32.70601272583008, 34.05604553222656, 35.40607833862305, 36.75611114501953, 38.106143951416016, 39.4561767578125, 40.80621337890625, 42.156246185302734, 43.50627899169922]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 7.0, 7.0, 5.0, 16.0, 12.0, 17.0, 21.0, 25.0, 30.0, 41.0, 28.0, 40.0, 39.0, 49.0, 51.0, 43.0, 41.0, 37.0, 49.0, 37.0, 42.0, 32.0, 49.0, 37.0, 42.0, 33.0, 27.0, 24.0, 30.0, 22.0, 19.0, 10.0, 10.0, 8.0, 4.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8671875, -5.64697265625, -5.4267578125, -5.20654296875, -4.986328125, -4.76611328125, -4.5458984375, -4.32568359375, -4.10546875, -3.88525390625, -3.6650390625, -3.44482421875, -3.224609375, -3.00439453125, -2.7841796875, -2.56396484375, -2.34375, -2.12353515625, -1.9033203125, -1.68310546875, -1.462890625, -1.24267578125, -1.0224609375, -0.80224609375, -0.58203125, -0.36181640625, -0.1416015625, 0.07861328125, 0.298828125, 0.51904296875, 0.7392578125, 0.95947265625, 1.1796875, 1.39990234375, 1.6201171875, 1.84033203125, 2.060546875, 2.28076171875, 2.5009765625, 2.72119140625, 2.94140625, 3.16162109375, 3.3818359375, 3.60205078125, 3.822265625, 4.04248046875, 4.2626953125, 4.48291015625, 4.703125, 4.92333984375, 5.1435546875, 5.36376953125, 5.583984375, 5.80419921875, 6.0244140625, 6.24462890625, 6.46484375, 6.68505859375, 6.9052734375, 7.12548828125, 7.345703125, 7.56591796875, 7.7861328125, 8.00634765625, 8.2265625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 8.0, 10.0, 5.0, 8.0, 9.0, 12.0, 16.0, 15.0, 26.0, 31.0, 54.0, 59.0, 124.0, 228.0, 528.0, 1801.0, 9070.0, 65181.0, 494348.0, 2161219.0, 1243675.0, 188057.0, 24210.0, 3848.0, 934.0, 314.0, 164.0, 86.0, 56.0, 42.0, 43.0, 29.0, 19.0, 14.0, 16.0, 6.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.3033447265625, -10.864501953125, -10.4256591796875, -9.98681640625, -9.5479736328125, -9.109130859375, -8.6702880859375, -8.2314453125, -7.7926025390625, -7.353759765625, -6.9149169921875, -6.47607421875, -6.0372314453125, -5.598388671875, -5.1595458984375, -4.720703125, -4.2818603515625, -3.843017578125, -3.4041748046875, -2.96533203125, -2.5264892578125, -2.087646484375, -1.6488037109375, -1.2099609375, -0.7711181640625, -0.332275390625, 0.1065673828125, 0.54541015625, 0.9842529296875, 1.423095703125, 1.8619384765625, 2.30078125, 2.7396240234375, 3.178466796875, 3.6173095703125, 4.05615234375, 4.4949951171875, 4.933837890625, 5.3726806640625, 5.8115234375, 6.2503662109375, 6.689208984375, 7.1280517578125, 7.56689453125, 8.0057373046875, 8.444580078125, 8.8834228515625, 9.322265625, 9.7611083984375, 10.199951171875, 10.6387939453125, 11.07763671875, 11.5164794921875, 11.955322265625, 12.3941650390625, 12.8330078125, 13.2718505859375, 13.710693359375, 14.1495361328125, 14.58837890625, 15.0272216796875, 15.466064453125, 15.9049072265625, 16.34375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 5.0, 8.0, 11.0, 8.0, 16.0, 30.0, 32.0, 51.0, 47.0, 60.0, 83.0, 103.0, 150.0, 153.0, 200.0, 246.0, 276.0, 258.0, 355.0, 329.0, 330.0, 261.0, 212.0, 174.0, 142.0, 119.0, 91.0, 73.0, 43.0, 55.0, 39.0, 34.0, 22.0, 10.0, 9.0, 11.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9296875, -8.6309814453125, -8.332275390625, -8.0335693359375, -7.73486328125, -7.4361572265625, -7.137451171875, -6.8387451171875, -6.5400390625, -6.2413330078125, -5.942626953125, -5.6439208984375, -5.34521484375, -5.0465087890625, -4.747802734375, -4.4490966796875, -4.150390625, -3.8516845703125, -3.552978515625, -3.2542724609375, -2.95556640625, -2.6568603515625, -2.358154296875, -2.0594482421875, -1.7607421875, -1.4620361328125, -1.163330078125, -0.8646240234375, -0.56591796875, -0.2672119140625, 0.031494140625, 0.3302001953125, 0.62890625, 0.9276123046875, 1.226318359375, 1.5250244140625, 1.82373046875, 2.1224365234375, 2.421142578125, 2.7198486328125, 3.0185546875, 3.3172607421875, 3.615966796875, 3.9146728515625, 4.21337890625, 4.5120849609375, 4.810791015625, 5.1094970703125, 5.408203125, 5.7069091796875, 6.005615234375, 6.3043212890625, 6.60302734375, 6.9017333984375, 7.200439453125, 7.4991455078125, 7.7978515625, 8.0965576171875, 8.395263671875, 8.6939697265625, 8.99267578125, 9.2913818359375, 9.590087890625, 9.8887939453125, 10.1875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 7.0, 11.0, 7.0, 11.0, 16.0, 34.0, 30.0, 52.0, 51.0, 48.0, 91.0, 120.0, 157.0, 165.0, 256.0, 425.0, 1889.0, 130240.0, 3658051.0, 396419.0, 4362.0, 581.0, 319.0, 197.0, 181.0, 132.0, 96.0, 69.0, 52.0, 46.0, 48.0, 28.0, 24.0, 14.0, 9.0, 9.0, 6.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.4375, -44.125, -42.8125, -41.5, -40.1875, -38.875, -37.5625, -36.25, -34.9375, -33.625, -32.3125, -31.0, -29.6875, -28.375, -27.0625, -25.75, -24.4375, -23.125, -21.8125, -20.5, -19.1875, -17.875, -16.5625, -15.25, -13.9375, -12.625, -11.3125, -10.0, -8.6875, -7.375, -6.0625, -4.75, -3.4375, -2.125, -0.8125, 0.5, 1.8125, 3.125, 4.4375, 5.75, 7.0625, 8.375, 9.6875, 11.0, 12.3125, 13.625, 14.9375, 16.25, 17.5625, 18.875, 20.1875, 21.5, 22.8125, 24.125, 25.4375, 26.75, 28.0625, 29.375, 30.6875, 32.0, 33.3125, 34.625, 35.9375, 37.25, 38.5625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 9.0, 11.0, 42.0, 80.0, 159.0, 194.0, 197.0, 153.0, 103.0, 50.0, 13.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.73069763183594, -138.37290954589844, -135.01512145996094, -131.65733337402344, -128.29954528808594, -124.94176483154297, -121.58397674560547, -118.22618865966797, -114.868408203125, -111.5106201171875, -108.15283203125, -104.7950439453125, -101.43726348876953, -98.07947540283203, -94.72168731689453, -91.36389923095703, -88.00611114501953, -84.64832305908203, -81.29053497314453, -77.93275451660156, -74.57496643066406, -71.21717834472656, -67.85939025878906, -64.50160217285156, -61.14381790161133, -57.78602981567383, -54.428245544433594, -51.070457458496094, -47.712669372558594, -44.35488510131836, -40.99709701538086, -37.639312744140625, -34.281524658203125, -30.923738479614258, -27.56595230102539, -24.20816421508789, -20.850378036499023, -17.492591857910156, -14.134803771972656, -10.777017593383789, -7.419231414794922, -4.0614447593688965, -0.7036581039428711, 2.6541290283203125, 6.01191520690918, 9.369701385498047, 12.727489471435547, 16.085275650024414, 19.44306182861328, 22.80084800720215, 26.158634185791016, 29.516422271728516, 32.87420654296875, 36.23199462890625, 39.58978271484375, 42.94757080078125, 46.305355072021484, 49.663143157958984, 53.02092742919922, 56.37871551513672, 59.73650360107422, 63.09428787231445, 66.45207214355469, 69.80986022949219, 73.16764831542969]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 5.0, 4.0, 8.0, 8.0, 12.0, 10.0, 15.0, 11.0, 17.0, 17.0, 26.0, 29.0, 24.0, 36.0, 36.0, 33.0, 36.0, 45.0, 39.0, 35.0, 45.0, 43.0, 46.0, 32.0, 27.0, 34.0, 28.0, 43.0, 27.0, 27.0, 29.0, 23.0, 23.0, 19.0, 14.0, 10.0, 11.0, 19.0, 16.0, 7.0, 7.0, 5.0, 9.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.78966522216797, -40.536075592041016, -39.2824821472168, -38.028892517089844, -36.775299072265625, -35.52170944213867, -34.26811981201172, -33.0145263671875, -31.760936737060547, -30.50734519958496, -29.253753662109375, -28.000164031982422, -26.746572494506836, -25.49298095703125, -24.239389419555664, -22.985797882080078, -21.732206344604492, -20.478614807128906, -19.22502326965332, -17.971431732177734, -16.71784210205078, -15.464250564575195, -14.21065902709961, -12.95706844329834, -11.703476905822754, -10.449885368347168, -9.196294784545898, -7.9427032470703125, -6.689112186431885, -5.435521125793457, -4.181929588317871, -2.9283390045166016, -1.6747474670410156, -0.42115628719329834, 0.832434892654419, 2.086026191711426, 3.3396172523498535, 4.593208312988281, 5.846799850463867, 7.100390434265137, 8.353981971740723, 9.607573509216309, 10.861164093017578, 12.114755630493164, 13.36834716796875, 14.62193775177002, 15.875529289245605, 17.129119873046875, 18.38271141052246, 19.636302947998047, 20.889894485473633, 22.14348602294922, 23.397075653076172, 24.650667190551758, 25.904258728027344, 27.157848358154297, 28.411441802978516, 29.6650333404541, 30.918624877929688, 32.17221450805664, 33.42580795288086, 34.67939758300781, 35.93299102783203, 37.186580657958984, 38.44017028808594]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 7.0, 5.0, 7.0, 10.0, 5.0, 16.0, 12.0, 13.0, 18.0, 35.0, 23.0, 37.0, 34.0, 38.0, 39.0, 34.0, 42.0, 35.0, 42.0, 49.0, 47.0, 46.0, 44.0, 38.0, 36.0, 35.0, 31.0, 37.0, 25.0, 17.0, 24.0, 23.0, 18.0, 23.0, 14.0, 10.0, 13.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.137939453125, -4.93994140625, -4.741943359375, -4.5439453125, -4.345947265625, -4.14794921875, -3.949951171875, -3.751953125, -3.553955078125, -3.35595703125, -3.157958984375, -2.9599609375, -2.761962890625, -2.56396484375, -2.365966796875, -2.16796875, -1.969970703125, -1.77197265625, -1.573974609375, -1.3759765625, -1.177978515625, -0.97998046875, -0.781982421875, -0.583984375, -0.385986328125, -0.18798828125, 0.010009765625, 0.2080078125, 0.406005859375, 0.60400390625, 0.802001953125, 1.0, 1.197998046875, 1.39599609375, 1.593994140625, 1.7919921875, 1.989990234375, 2.18798828125, 2.385986328125, 2.583984375, 2.781982421875, 2.97998046875, 3.177978515625, 3.3759765625, 3.573974609375, 3.77197265625, 3.969970703125, 4.16796875, 4.365966796875, 4.56396484375, 4.761962890625, 4.9599609375, 5.157958984375, 5.35595703125, 5.553955078125, 5.751953125, 5.949951171875, 6.14794921875, 6.345947265625, 6.5439453125, 6.741943359375, 6.93994140625, 7.137939453125, 7.3359375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 11.0, 18.0, 34.0, 43.0, 55.0, 107.0, 171.0, 303.0, 477.0, 889.0, 1517.0, 2477.0, 4249.0, 7177.0, 11738.0, 18825.0, 29530.0, 44870.0, 66065.0, 91027.0, 117041.0, 136143.0, 133910.0, 113488.0, 87957.0, 63477.0, 43582.0, 28156.0, 17789.0, 10930.0, 6601.0, 3990.0, 2479.0, 1335.0, 894.0, 469.0, 286.0, 179.0, 100.0, 57.0, 39.0, 25.0, 16.0, 5.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.0234375, -0.994964599609375, -0.96649169921875, -0.938018798828125, -0.9095458984375, -0.881072998046875, -0.85260009765625, -0.824127197265625, -0.795654296875, -0.767181396484375, -0.73870849609375, -0.710235595703125, -0.6817626953125, -0.653289794921875, -0.62481689453125, -0.596343994140625, -0.56787109375, -0.539398193359375, -0.51092529296875, -0.482452392578125, -0.4539794921875, -0.425506591796875, -0.39703369140625, -0.368560791015625, -0.340087890625, -0.311614990234375, -0.28314208984375, -0.254669189453125, -0.2261962890625, -0.197723388671875, -0.16925048828125, -0.140777587890625, -0.1123046875, -0.083831787109375, -0.05535888671875, -0.026885986328125, 0.0015869140625, 0.030059814453125, 0.05853271484375, 0.087005615234375, 0.115478515625, 0.143951416015625, 0.17242431640625, 0.200897216796875, 0.2293701171875, 0.257843017578125, 0.28631591796875, 0.314788818359375, 0.34326171875, 0.371734619140625, 0.40020751953125, 0.428680419921875, 0.4571533203125, 0.485626220703125, 0.51409912109375, 0.542572021484375, 0.571044921875, 0.599517822265625, 0.62799072265625, 0.656463623046875, 0.6849365234375, 0.713409423828125, 0.74188232421875, 0.770355224609375, 0.798828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 6.0, 10.0, 18.0, 20.0, 21.0, 23.0, 25.0, 16.0, 29.0, 24.0, 41.0, 36.0, 36.0, 36.0, 41.0, 44.0, 32.0, 1070.0, 27.0, 41.0, 31.0, 45.0, 41.0, 28.0, 33.0, 34.0, 22.0, 23.0, 26.0, 17.0, 12.0, 17.0, 17.0, 14.0, 11.0, 12.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0859375, -3.945556640625, -3.80517578125, -3.664794921875, -3.5244140625, -3.384033203125, -3.24365234375, -3.103271484375, -2.962890625, -2.822509765625, -2.68212890625, -2.541748046875, -2.4013671875, -2.260986328125, -2.12060546875, -1.980224609375, -1.83984375, -1.699462890625, -1.55908203125, -1.418701171875, -1.2783203125, -1.137939453125, -0.99755859375, -0.857177734375, -0.716796875, -0.576416015625, -0.43603515625, -0.295654296875, -0.1552734375, -0.014892578125, 0.12548828125, 0.265869140625, 0.40625, 0.546630859375, 0.68701171875, 0.827392578125, 0.9677734375, 1.108154296875, 1.24853515625, 1.388916015625, 1.529296875, 1.669677734375, 1.81005859375, 1.950439453125, 2.0908203125, 2.231201171875, 2.37158203125, 2.511962890625, 2.65234375, 2.792724609375, 2.93310546875, 3.073486328125, 3.2138671875, 3.354248046875, 3.49462890625, 3.635009765625, 3.775390625, 3.915771484375, 4.05615234375, 4.196533203125, 4.3369140625, 4.477294921875, 4.61767578125, 4.758056640625, 4.8984375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 13.0, 8.0, 17.0, 34.0, 55.0, 67.0, 137.0, 176.0, 326.0, 536.0, 987.0, 1615.0, 2925.0, 5143.0, 9618.0, 16948.0, 31134.0, 74985.0, 1870205.0, 36783.0, 20254.0, 11010.0, 6140.0, 3284.0, 1953.0, 1158.0, 691.0, 375.0, 204.0, 150.0, 73.0, 54.0, 29.0, 13.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9697265625, -1.9043731689453125, -1.839019775390625, -1.7736663818359375, -1.70831298828125, -1.6429595947265625, -1.577606201171875, -1.5122528076171875, -1.4468994140625, -1.3815460205078125, -1.316192626953125, -1.2508392333984375, -1.18548583984375, -1.1201324462890625, -1.054779052734375, -0.9894256591796875, -0.924072265625, -0.8587188720703125, -0.793365478515625, -0.7280120849609375, -0.66265869140625, -0.5973052978515625, -0.531951904296875, -0.4665985107421875, -0.4012451171875, -0.3358917236328125, -0.270538330078125, -0.2051849365234375, -0.13983154296875, -0.0744781494140625, -0.009124755859375, 0.0562286376953125, 0.12158203125, 0.1869354248046875, 0.252288818359375, 0.3176422119140625, 0.38299560546875, 0.4483489990234375, 0.513702392578125, 0.5790557861328125, 0.6444091796875, 0.7097625732421875, 0.775115966796875, 0.8404693603515625, 0.90582275390625, 0.9711761474609375, 1.036529541015625, 1.1018829345703125, 1.167236328125, 1.2325897216796875, 1.297943115234375, 1.3632965087890625, 1.42864990234375, 1.4940032958984375, 1.559356689453125, 1.6247100830078125, 1.6900634765625, 1.7554168701171875, 1.820770263671875, 1.8861236572265625, 1.95147705078125, 2.0168304443359375, 2.082183837890625, 2.1475372314453125, 2.212890625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 4.0, 10.0, 12.0, 18.0, 25.0, 40.0, 86.0, 158.0, 176.0, 182.0, 107.0, 61.0, 32.0, 24.0, 12.0, 12.0, 6.0, 1.0, 5.0, 7.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.079345703125, -0.07685375213623047, -0.07436180114746094, -0.0718698501586914, -0.06937789916992188, -0.06688594818115234, -0.06439399719238281, -0.06190204620361328, -0.05941009521484375, -0.05691814422607422, -0.05442619323730469, -0.051934242248535156, -0.049442291259765625, -0.046950340270996094, -0.04445838928222656, -0.04196643829345703, -0.0394744873046875, -0.03698253631591797, -0.03449058532714844, -0.031998634338378906, -0.029506683349609375, -0.027014732360839844, -0.024522781372070312, -0.02203083038330078, -0.01953887939453125, -0.01704692840576172, -0.014554977416992188, -0.012063026428222656, -0.009571075439453125, -0.007079124450683594, -0.0045871734619140625, -0.0020952224731445312, 0.000396728515625, 0.0028886795043945312, 0.0053806304931640625, 0.007872581481933594, 0.010364532470703125, 0.012856483459472656, 0.015348434448242188, 0.01784038543701172, 0.02033233642578125, 0.02282428741455078, 0.025316238403320312, 0.027808189392089844, 0.030300140380859375, 0.032792091369628906, 0.03528404235839844, 0.03777599334716797, 0.0402679443359375, 0.04275989532470703, 0.04525184631347656, 0.047743797302246094, 0.050235748291015625, 0.052727699279785156, 0.05521965026855469, 0.05771160125732422, 0.06020355224609375, 0.06269550323486328, 0.06518745422363281, 0.06767940521240234, 0.07017135620117188, 0.0726633071899414, 0.07515525817871094, 0.07764720916748047, 0.08013916015625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 11.0, 17.0, 20.0, 40.0, 62.0, 139.0, 300.0, 6021.0, 1040501.0, 936.0, 230.0, 89.0, 60.0, 25.0, 28.0, 15.0, 6.0, 6.0, 10.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.625, -1.574676513671875, -1.52435302734375, -1.474029541015625, -1.4237060546875, -1.373382568359375, -1.32305908203125, -1.272735595703125, -1.222412109375, -1.172088623046875, -1.12176513671875, -1.071441650390625, -1.0211181640625, -0.970794677734375, -0.92047119140625, -0.870147705078125, -0.81982421875, -0.769500732421875, -0.71917724609375, -0.668853759765625, -0.6185302734375, -0.568206787109375, -0.51788330078125, -0.467559814453125, -0.417236328125, -0.366912841796875, -0.31658935546875, -0.266265869140625, -0.2159423828125, -0.165618896484375, -0.11529541015625, -0.064971923828125, -0.0146484375, 0.035675048828125, 0.08599853515625, 0.136322021484375, 0.1866455078125, 0.236968994140625, 0.28729248046875, 0.337615966796875, 0.387939453125, 0.438262939453125, 0.48858642578125, 0.538909912109375, 0.5892333984375, 0.639556884765625, 0.68988037109375, 0.740203857421875, 0.79052734375, 0.840850830078125, 0.89117431640625, 0.941497802734375, 0.9918212890625, 1.042144775390625, 1.09246826171875, 1.142791748046875, 1.193115234375, 1.243438720703125, 1.29376220703125, 1.344085693359375, 1.3944091796875, 1.444732666015625, 1.49505615234375, 1.545379638671875, 1.595703125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 233.0, 764.0, 15.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261430948972702, -0.2415895313024521, -0.22174811363220215, -0.2019067108631134, -0.18206527829170227, -0.16222387552261353, -0.1423824578523636, -0.12254104018211365, -0.10269962251186371, -0.08285820484161377, -0.06301678717136383, -0.04317537695169449, -0.02333395928144455, -0.0034925416111946106, 0.01634886860847473, 0.03619028627872467, 0.05603170394897461, 0.07587312161922455, 0.09571453928947449, 0.11555594950914383, 0.13539737462997437, 0.1552387773990631, 0.17508019506931305, 0.194921612739563, 0.21476303040981293, 0.23460444808006287, 0.2544458508491516, 0.27428728342056274, 0.2941286861896515, 0.3139701187610626, 0.33381152153015137, 0.3536529541015625, 0.37349432706832886, 0.3933357298374176, 0.41317716240882874, 0.4330185651779175, 0.4528599977493286, 0.47270140051841736, 0.4925428032875061, 0.5123842358589172, 0.5322256684303284, 0.5520671010017395, 0.5719084739685059, 0.591749906539917, 0.6115913391113281, 0.6314327716827393, 0.6512741446495056, 0.6711155772209167, 0.6909569501876831, 0.7107983827590942, 0.7306397557258606, 0.7504811882972717, 0.7703226208686829, 0.790164053440094, 0.8100054264068604, 0.8298468589782715, 0.8496882915496826, 0.8695297241210938, 0.8893710970878601, 0.9092125296592712, 0.9290539622306824, 0.9488953948020935, 0.9687367677688599, 0.988578200340271, 1.0084196329116821]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 2.0, 6.0, 9.0, 12.0, 15.0, 18.0, 13.0, 15.0, 22.0, 21.0, 26.0, 34.0, 28.0, 26.0, 29.0, 30.0, 30.0, 36.0, 39.0, 40.0, 27.0, 32.0, 38.0, 31.0, 36.0, 38.0, 36.0, 32.0, 26.0, 35.0, 39.0, 22.0, 18.0, 19.0, 19.0, 13.0, 15.0, 9.0, 15.0, 12.0, 11.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.06620246171951294, -0.06408698856830597, -0.0619715191423893, -0.059856049716472626, -0.057740576565265656, -0.055625103414058685, -0.053509633988142014, -0.05139416456222534, -0.04927869141101837, -0.0471632182598114, -0.04504774883389473, -0.04293227940797806, -0.04081680625677109, -0.03870133310556412, -0.036585863679647446, -0.034470394253730774, -0.032354921102523804, -0.030239449813961983, -0.028123978525400162, -0.02600850723683834, -0.02389303594827652, -0.0217775646597147, -0.019662093371152878, -0.017546622082591057, -0.015431150794029236, -0.013315679505467415, -0.011200208216905594, -0.009084736928343773, -0.006969265639781952, -0.004853794351220131, -0.00273832306265831, -0.000622851774096489, 0.001492619514465332, 0.003608090803027153, 0.005723562091588974, 0.007839033380150795, 0.009954504668712616, 0.012069975957274437, 0.014185447245836258, 0.01630091853439808, 0.0184163898229599, 0.02053186111152172, 0.022647332400083542, 0.024762803688645363, 0.026878274977207184, 0.028993746265769005, 0.031109217554330826, 0.0332246869802475, 0.03534016013145447, 0.03745563328266144, 0.03957110270857811, 0.04168657213449478, 0.04380204528570175, 0.04591751843690872, 0.048032987862825394, 0.050148457288742065, 0.052263930439949036, 0.054379403591156006, 0.05649487301707268, 0.05861034244298935, 0.06072581559419632, 0.06284128874540329, 0.06495675444602966, 0.06707222759723663, 0.0691877007484436]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 7.0, 3.0, 6.0, 3.0, 9.0, 6.0, 10.0, 14.0, 19.0, 23.0, 15.0, 20.0, 25.0, 26.0, 29.0, 33.0, 35.0, 36.0, 43.0, 51.0, 43.0, 48.0, 47.0, 35.0, 37.0, 39.0, 37.0, 36.0, 35.0, 32.0, 28.0, 27.0, 28.0, 21.0, 19.0, 12.0, 16.0, 12.0, 9.0, 11.0, 9.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.6058349609375, -5.414794921875, -5.2237548828125, -5.03271484375, -4.8416748046875, -4.650634765625, -4.4595947265625, -4.2685546875, -4.0775146484375, -3.886474609375, -3.6954345703125, -3.50439453125, -3.3133544921875, -3.122314453125, -2.9312744140625, -2.740234375, -2.5491943359375, -2.358154296875, -2.1671142578125, -1.97607421875, -1.7850341796875, -1.593994140625, -1.4029541015625, -1.2119140625, -1.0208740234375, -0.829833984375, -0.6387939453125, -0.44775390625, -0.2567138671875, -0.065673828125, 0.1253662109375, 0.31640625, 0.5074462890625, 0.698486328125, 0.8895263671875, 1.08056640625, 1.2716064453125, 1.462646484375, 1.6536865234375, 1.8447265625, 2.0357666015625, 2.226806640625, 2.4178466796875, 2.60888671875, 2.7999267578125, 2.990966796875, 3.1820068359375, 3.373046875, 3.5640869140625, 3.755126953125, 3.9461669921875, 4.13720703125, 4.3282470703125, 4.519287109375, 4.7103271484375, 4.9013671875, 5.0924072265625, 5.283447265625, 5.4744873046875, 5.66552734375, 5.8565673828125, 6.047607421875, 6.2386474609375, 6.4296875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 1.0, 8.0, 12.0, 8.0, 15.0, 14.0, 18.0, 28.0, 57.0, 83.0, 126.0, 202.0, 402.0, 716.0, 1315.0, 2398.0, 4641.0, 8927.0, 18072.0, 35858.0, 75693.0, 159331.0, 316508.0, 221244.0, 104659.0, 48902.0, 23946.0, 11997.0, 6203.0, 3202.0, 1724.0, 977.0, 524.0, 245.0, 172.0, 98.0, 65.0, 38.0, 43.0, 25.0, 9.0, 14.0, 9.0, 6.0, 2.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.5546875, -6.3341064453125, -6.113525390625, -5.8929443359375, -5.67236328125, -5.4517822265625, -5.231201171875, -5.0106201171875, -4.7900390625, -4.5694580078125, -4.348876953125, -4.1282958984375, -3.90771484375, -3.6871337890625, -3.466552734375, -3.2459716796875, -3.025390625, -2.8048095703125, -2.584228515625, -2.3636474609375, -2.14306640625, -1.9224853515625, -1.701904296875, -1.4813232421875, -1.2607421875, -1.0401611328125, -0.819580078125, -0.5989990234375, -0.37841796875, -0.1578369140625, 0.062744140625, 0.2833251953125, 0.50390625, 0.7244873046875, 0.945068359375, 1.1656494140625, 1.38623046875, 1.6068115234375, 1.827392578125, 2.0479736328125, 2.2685546875, 2.4891357421875, 2.709716796875, 2.9302978515625, 3.15087890625, 3.3714599609375, 3.592041015625, 3.8126220703125, 4.033203125, 4.2537841796875, 4.474365234375, 4.6949462890625, 4.91552734375, 5.1361083984375, 5.356689453125, 5.5772705078125, 5.7978515625, 6.0184326171875, 6.239013671875, 6.4595947265625, 6.68017578125, 6.9007568359375, 7.121337890625, 7.3419189453125, 7.5625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 3.0, 7.0, 12.0, 12.0, 12.0, 13.0, 20.0, 16.0, 27.0, 23.0, 26.0, 28.0, 35.0, 31.0, 45.0, 53.0, 55.0, 90.0, 144.0, 318.0, 1348.0, 214.0, 98.0, 54.0, 50.0, 44.0, 30.0, 38.0, 28.0, 26.0, 17.0, 23.0, 24.0, 18.0, 14.0, 13.0, 8.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.015625, -18.44091796875, -17.8662109375, -17.29150390625, -16.716796875, -16.14208984375, -15.5673828125, -14.99267578125, -14.41796875, -13.84326171875, -13.2685546875, -12.69384765625, -12.119140625, -11.54443359375, -10.9697265625, -10.39501953125, -9.8203125, -9.24560546875, -8.6708984375, -8.09619140625, -7.521484375, -6.94677734375, -6.3720703125, -5.79736328125, -5.22265625, -4.64794921875, -4.0732421875, -3.49853515625, -2.923828125, -2.34912109375, -1.7744140625, -1.19970703125, -0.625, -0.05029296875, 0.5244140625, 1.09912109375, 1.673828125, 2.24853515625, 2.8232421875, 3.39794921875, 3.97265625, 4.54736328125, 5.1220703125, 5.69677734375, 6.271484375, 6.84619140625, 7.4208984375, 7.99560546875, 8.5703125, 9.14501953125, 9.7197265625, 10.29443359375, 10.869140625, 11.44384765625, 12.0185546875, 12.59326171875, 13.16796875, 13.74267578125, 14.3173828125, 14.89208984375, 15.466796875, 16.04150390625, 16.6162109375, 17.19091796875, 17.765625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 14.0, 18.0, 21.0, 24.0, 49.0, 43.0, 82.0, 118.0, 148.0, 267.0, 560.0, 1768.0, 45567.0, 3066305.0, 27848.0, 1543.0, 487.0, 280.0, 140.0, 106.0, 83.0, 59.0, 36.0, 30.0, 11.0, 18.0, 17.0, 17.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.03125, -55.02685546875, -53.0224609375, -51.01806640625, -49.013671875, -47.00927734375, -45.0048828125, -43.00048828125, -40.99609375, -38.99169921875, -36.9873046875, -34.98291015625, -32.978515625, -30.97412109375, -28.9697265625, -26.96533203125, -24.9609375, -22.95654296875, -20.9521484375, -18.94775390625, -16.943359375, -14.93896484375, -12.9345703125, -10.93017578125, -8.92578125, -6.92138671875, -4.9169921875, -2.91259765625, -0.908203125, 1.09619140625, 3.1005859375, 5.10498046875, 7.109375, 9.11376953125, 11.1181640625, 13.12255859375, 15.126953125, 17.13134765625, 19.1357421875, 21.14013671875, 23.14453125, 25.14892578125, 27.1533203125, 29.15771484375, 31.162109375, 33.16650390625, 35.1708984375, 37.17529296875, 39.1796875, 41.18408203125, 43.1884765625, 45.19287109375, 47.197265625, 49.20166015625, 51.2060546875, 53.21044921875, 55.21484375, 57.21923828125, 59.2236328125, 61.22802734375, 63.232421875, 65.23681640625, 67.2412109375, 69.24560546875, 71.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 82.0, 470.0, 384.0, 76.0, 2.0, 0.0, 1.0, 1.0], "bins": [-290.2415466308594, -285.2328796386719, -280.22418212890625, -275.21551513671875, -270.20684814453125, -265.1981506347656, -260.1894836425781, -255.18080139160156, -250.172119140625, -245.16343688964844, -240.15475463867188, -235.14608764648438, -230.1374053955078, -225.12872314453125, -220.12005615234375, -215.1113739013672, -210.10269165039062, -205.09400939941406, -200.0853271484375, -195.07666015625, -190.06797790527344, -185.05929565429688, -180.05062866210938, -175.0419464111328, -170.03326416015625, -165.0245819091797, -160.01589965820312, -155.00723266601562, -149.99855041503906, -144.9898681640625, -139.981201171875, -134.97251892089844, -129.9638214111328, -124.95513916015625, -119.94646453857422, -114.93778991699219, -109.92910766601562, -104.92042541503906, -99.91175079345703, -94.903076171875, -89.89439392089844, -84.88571166992188, -79.87703704833984, -74.86836242675781, -69.85968017578125, -64.85099792480469, -59.842323303222656, -54.83364486694336, -49.82496643066406, -44.816287994384766, -39.80760955810547, -34.79893112182617, -29.790252685546875, -24.781574249267578, -19.77289581298828, -14.764217376708984, -9.755538940429688, -4.746860504150391, 0.26181793212890625, 5.270496368408203, 10.2791748046875, 15.287853240966797, 20.296531677246094, 25.30521011352539, 30.313888549804688]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 7.0, 8.0, 5.0, 12.0, 20.0, 29.0, 19.0, 31.0, 21.0, 28.0, 30.0, 45.0, 40.0, 36.0, 42.0, 34.0, 42.0, 48.0, 51.0, 43.0, 37.0, 45.0, 31.0, 43.0, 37.0, 27.0, 26.0, 25.0, 23.0, 21.0, 20.0, 22.0, 14.0, 10.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.346309661865234, -45.65230941772461, -43.95831298828125, -42.264312744140625, -40.5703125, -38.876312255859375, -37.18231201171875, -35.48831558227539, -33.794315338134766, -32.10031509399414, -30.40631675720215, -28.712318420410156, -27.01831817626953, -25.324317932128906, -23.630319595336914, -21.936321258544922, -20.242321014404297, -18.548320770263672, -16.85432243347168, -15.160323143005371, -13.466323852539062, -11.772324562072754, -10.078325271606445, -8.384325981140137, -6.690326690673828, -4.9963274002075195, -3.302328109741211, -1.6083288192749023, 0.08567047119140625, 1.7796697616577148, 3.4736690521240234, 5.167668342590332, 6.861671447753906, 8.555670738220215, 10.249670028686523, 11.943669319152832, 13.63766860961914, 15.33166790008545, 17.025667190551758, 18.71966552734375, 20.413665771484375, 22.107666015625, 23.801664352416992, 25.495662689208984, 27.18966293334961, 28.883663177490234, 30.577661514282227, 32.27165985107422, 33.965660095214844, 35.65966033935547, 37.353660583496094, 39.04765701293945, 40.74165725708008, 42.4356575012207, 44.12965393066406, 45.82365417480469, 47.51765441894531, 49.21165466308594, 50.90565490722656, 52.59965133666992, 54.29365158081055, 55.98765182495117, 57.68164825439453, 59.375648498535156, 61.06964874267578]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 8.0, 10.0, 13.0, 19.0, 21.0, 25.0, 19.0, 31.0, 23.0, 37.0, 39.0, 27.0, 55.0, 42.0, 45.0, 51.0, 42.0, 49.0, 50.0, 41.0, 47.0, 34.0, 24.0, 29.0, 34.0, 23.0, 29.0, 21.0, 18.0, 20.0, 15.0, 12.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.2265625, -7.003662109375, -6.78076171875, -6.557861328125, -6.3349609375, -6.112060546875, -5.88916015625, -5.666259765625, -5.443359375, -5.220458984375, -4.99755859375, -4.774658203125, -4.5517578125, -4.328857421875, -4.10595703125, -3.883056640625, -3.66015625, -3.437255859375, -3.21435546875, -2.991455078125, -2.7685546875, -2.545654296875, -2.32275390625, -2.099853515625, -1.876953125, -1.654052734375, -1.43115234375, -1.208251953125, -0.9853515625, -0.762451171875, -0.53955078125, -0.316650390625, -0.09375, 0.129150390625, 0.35205078125, 0.574951171875, 0.7978515625, 1.020751953125, 1.24365234375, 1.466552734375, 1.689453125, 1.912353515625, 2.13525390625, 2.358154296875, 2.5810546875, 2.803955078125, 3.02685546875, 3.249755859375, 3.47265625, 3.695556640625, 3.91845703125, 4.141357421875, 4.3642578125, 4.587158203125, 4.81005859375, 5.032958984375, 5.255859375, 5.478759765625, 5.70166015625, 5.924560546875, 6.1474609375, 6.370361328125, 6.59326171875, 6.816162109375, 7.0390625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 7.0, 6.0, 13.0, 19.0, 15.0, 14.0, 23.0, 23.0, 27.0, 34.0, 58.0, 114.0, 255.0, 717.0, 2924.0, 16068.0, 110185.0, 723948.0, 2252247.0, 917843.0, 143255.0, 21225.0, 3666.0, 850.0, 285.0, 137.0, 78.0, 37.0, 37.0, 27.0, 19.0, 17.0, 14.0, 16.0, 12.0, 12.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0, -11.5799560546875, -11.159912109375, -10.7398681640625, -10.31982421875, -9.8997802734375, -9.479736328125, -9.0596923828125, -8.6396484375, -8.2196044921875, -7.799560546875, -7.3795166015625, -6.95947265625, -6.5394287109375, -6.119384765625, -5.6993408203125, -5.279296875, -4.8592529296875, -4.439208984375, -4.0191650390625, -3.59912109375, -3.1790771484375, -2.759033203125, -2.3389892578125, -1.9189453125, -1.4989013671875, -1.078857421875, -0.6588134765625, -0.23876953125, 0.1812744140625, 0.601318359375, 1.0213623046875, 1.44140625, 1.8614501953125, 2.281494140625, 2.7015380859375, 3.12158203125, 3.5416259765625, 3.961669921875, 4.3817138671875, 4.8017578125, 5.2218017578125, 5.641845703125, 6.0618896484375, 6.48193359375, 6.9019775390625, 7.322021484375, 7.7420654296875, 8.162109375, 8.5821533203125, 9.002197265625, 9.4222412109375, 9.84228515625, 10.2623291015625, 10.682373046875, 11.1024169921875, 11.5224609375, 11.9425048828125, 12.362548828125, 12.7825927734375, 13.20263671875, 13.6226806640625, 14.042724609375, 14.4627685546875, 14.8828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 6.0, 9.0, 5.0, 8.0, 11.0, 7.0, 15.0, 28.0, 35.0, 28.0, 54.0, 60.0, 75.0, 99.0, 143.0, 186.0, 249.0, 278.0, 379.0, 408.0, 412.0, 338.0, 292.0, 225.0, 157.0, 141.0, 103.0, 80.0, 68.0, 40.0, 36.0, 35.0, 19.0, 15.0, 7.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.485107421875, -8.15771484375, -7.830322265625, -7.5029296875, -7.175537109375, -6.84814453125, -6.520751953125, -6.193359375, -5.865966796875, -5.53857421875, -5.211181640625, -4.8837890625, -4.556396484375, -4.22900390625, -3.901611328125, -3.57421875, -3.246826171875, -2.91943359375, -2.592041015625, -2.2646484375, -1.937255859375, -1.60986328125, -1.282470703125, -0.955078125, -0.627685546875, -0.30029296875, 0.027099609375, 0.3544921875, 0.681884765625, 1.00927734375, 1.336669921875, 1.6640625, 1.991455078125, 2.31884765625, 2.646240234375, 2.9736328125, 3.301025390625, 3.62841796875, 3.955810546875, 4.283203125, 4.610595703125, 4.93798828125, 5.265380859375, 5.5927734375, 5.920166015625, 6.24755859375, 6.574951171875, 6.90234375, 7.229736328125, 7.55712890625, 7.884521484375, 8.2119140625, 8.539306640625, 8.86669921875, 9.194091796875, 9.521484375, 9.848876953125, 10.17626953125, 10.503662109375, 10.8310546875, 11.158447265625, 11.48583984375, 11.813232421875, 12.140625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 6.0, 6.0, 5.0, 6.0, 9.0, 12.0, 19.0, 34.0, 40.0, 43.0, 69.0, 66.0, 122.0, 137.0, 197.0, 301.0, 509.0, 5470.0, 1852854.0, 2325622.0, 7125.0, 529.0, 322.0, 195.0, 143.0, 114.0, 66.0, 66.0, 51.0, 29.0, 34.0, 21.0, 14.0, 10.0, 12.0, 3.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-64.9375, -63.18359375, -61.4296875, -59.67578125, -57.921875, -56.16796875, -54.4140625, -52.66015625, -50.90625, -49.15234375, -47.3984375, -45.64453125, -43.890625, -42.13671875, -40.3828125, -38.62890625, -36.875, -35.12109375, -33.3671875, -31.61328125, -29.859375, -28.10546875, -26.3515625, -24.59765625, -22.84375, -21.08984375, -19.3359375, -17.58203125, -15.828125, -14.07421875, -12.3203125, -10.56640625, -8.8125, -7.05859375, -5.3046875, -3.55078125, -1.796875, -0.04296875, 1.7109375, 3.46484375, 5.21875, 6.97265625, 8.7265625, 10.48046875, 12.234375, 13.98828125, 15.7421875, 17.49609375, 19.25, 21.00390625, 22.7578125, 24.51171875, 26.265625, 28.01953125, 29.7734375, 31.52734375, 33.28125, 35.03515625, 36.7890625, 38.54296875, 40.296875, 42.05078125, 43.8046875, 45.55859375, 47.3125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 18.0, 25.0, 20.0, 28.0, 49.0, 60.0, 61.0, 76.0, 62.0, 83.0, 79.0, 77.0, 78.0, 65.0, 50.0, 46.0, 36.0, 25.0, 17.0, 11.0, 6.0, 5.0, 6.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.190227508544922, -30.027223587036133, -28.864221572875977, -27.701217651367188, -26.53821563720703, -25.375211715698242, -24.212207794189453, -23.049205780029297, -21.88620376586914, -20.72319984436035, -19.560197830200195, -18.397193908691406, -17.23419189453125, -16.07118797302246, -14.908185005187988, -13.745182037353516, -12.582178115844727, -11.419175148010254, -10.256172180175781, -9.093168258666992, -7.930165767669678, -6.767162799835205, -5.604159355163574, -4.441156387329102, -3.278153419494629, -2.1151504516601562, -0.9521472454071045, 0.21085596084594727, 1.37385892868042, 2.5368618965148926, 3.6998653411865234, 4.862868309020996, 6.025871276855469, 7.188874244689941, 8.351877212524414, 9.514881134033203, 10.67788314819336, 11.840887069702148, 13.003890037536621, 14.166893005371094, 15.329895973205566, 16.49289894104004, 17.655902862548828, 18.818904876708984, 19.981908798217773, 21.14491081237793, 22.30791473388672, 23.470916748046875, 24.633920669555664, 25.796924591064453, 26.95992660522461, 28.1229305267334, 29.285932540893555, 30.448936462402344, 31.6119384765625, 32.774940490722656, 33.93794631958008, 35.100948333740234, 36.263954162597656, 37.42695617675781, 38.58995819091797, 39.752960205078125, 40.91596603393555, 42.0789680480957, 43.24197006225586]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 0.0, 7.0, 5.0, 7.0, 7.0, 6.0, 13.0, 7.0, 14.0, 13.0, 25.0, 21.0, 28.0, 25.0, 21.0, 31.0, 28.0, 29.0, 32.0, 39.0, 28.0, 43.0, 33.0, 39.0, 40.0, 42.0, 44.0, 28.0, 47.0, 36.0, 33.0, 26.0, 31.0, 27.0, 17.0, 19.0, 13.0, 24.0, 9.0, 9.0, 17.0, 5.0, 5.0, 6.0, 7.0, 1.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-34.472469329833984, -33.409088134765625, -32.34571075439453, -31.282329559326172, -30.218950271606445, -29.15557098388672, -28.09218978881836, -27.028810501098633, -25.965431213378906, -24.90205192565918, -23.838672637939453, -22.775291442871094, -21.711912155151367, -20.64853286743164, -19.58515167236328, -18.521772384643555, -17.458393096923828, -16.3950138092041, -15.331633567810059, -14.268253326416016, -13.204874038696289, -12.141494750976562, -11.07811450958252, -10.014734268188477, -8.95135498046875, -7.887975215911865, -6.8245954513549805, -5.761215686798096, -4.697835922241211, -3.634456157684326, -2.5710763931274414, -1.5076966285705566, -0.44431304931640625, 0.6190667152404785, 1.6824464797973633, 2.745826244354248, 3.809206008911133, 4.872585773468018, 5.935965538024902, 6.999345302581787, 8.062725067138672, 9.126104354858398, 10.189484596252441, 11.252864837646484, 12.316244125366211, 13.379623413085938, 14.44300365447998, 15.506383895874023, 16.56976318359375, 17.633142471313477, 18.696521759033203, 19.759902954101562, 20.82328224182129, 21.886661529541016, 22.950042724609375, 24.0134220123291, 25.076801300048828, 26.140180587768555, 27.20355987548828, 28.26694107055664, 29.330320358276367, 30.393699645996094, 31.457080841064453, 32.52045822143555, 33.583839416503906]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 5.0, 6.0, 6.0, 5.0, 7.0, 17.0, 17.0, 30.0, 14.0, 25.0, 20.0, 27.0, 25.0, 31.0, 42.0, 30.0, 35.0, 37.0, 41.0, 32.0, 45.0, 37.0, 40.0, 36.0, 34.0, 30.0, 34.0, 40.0, 35.0, 30.0, 28.0, 17.0, 19.0, 24.0, 16.0, 16.0, 11.0, 7.0, 9.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.91015625, -5.71990966796875, -5.5296630859375, -5.33941650390625, -5.149169921875, -4.95892333984375, -4.7686767578125, -4.57843017578125, -4.38818359375, -4.19793701171875, -4.0076904296875, -3.81744384765625, -3.627197265625, -3.43695068359375, -3.2467041015625, -3.05645751953125, -2.8662109375, -2.67596435546875, -2.4857177734375, -2.29547119140625, -2.105224609375, -1.91497802734375, -1.7247314453125, -1.53448486328125, -1.34423828125, -1.15399169921875, -0.9637451171875, -0.77349853515625, -0.583251953125, -0.39300537109375, -0.2027587890625, -0.01251220703125, 0.177734375, 0.36798095703125, 0.5582275390625, 0.74847412109375, 0.938720703125, 1.12896728515625, 1.3192138671875, 1.50946044921875, 1.69970703125, 1.88995361328125, 2.0802001953125, 2.27044677734375, 2.460693359375, 2.65093994140625, 2.8411865234375, 3.03143310546875, 3.2216796875, 3.41192626953125, 3.6021728515625, 3.79241943359375, 3.982666015625, 4.17291259765625, 4.3631591796875, 4.55340576171875, 4.74365234375, 4.93389892578125, 5.1241455078125, 5.31439208984375, 5.504638671875, 5.69488525390625, 5.8851318359375, 6.07537841796875, 6.265625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 16.0, 18.0, 35.0, 37.0, 66.0, 82.0, 85.0, 183.0, 276.0, 413.0, 650.0, 985.0, 1634.0, 2576.0, 4105.0, 6693.0, 10216.0, 15881.0, 24348.0, 36467.0, 53528.0, 73889.0, 96891.0, 118212.0, 129933.0, 120858.0, 101428.0, 78808.0, 57158.0, 39176.0, 26420.0, 17107.0, 11100.0, 6975.0, 4466.0, 2815.0, 1817.0, 1144.0, 705.0, 470.0, 305.0, 186.0, 127.0, 85.0, 62.0, 41.0, 31.0, 22.0, 6.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.84375, -0.8178634643554688, -0.7919769287109375, -0.7660903930664062, -0.740203857421875, -0.7143173217773438, -0.6884307861328125, -0.6625442504882812, -0.63665771484375, -0.6107711791992188, -0.5848846435546875, -0.5589981079101562, -0.533111572265625, -0.5072250366210938, -0.4813385009765625, -0.45545196533203125, -0.4295654296875, -0.40367889404296875, -0.3777923583984375, -0.35190582275390625, -0.326019287109375, -0.30013275146484375, -0.2742462158203125, -0.24835968017578125, -0.22247314453125, -0.19658660888671875, -0.1707000732421875, -0.14481353759765625, -0.118927001953125, -0.09304046630859375, -0.0671539306640625, -0.04126739501953125, -0.015380859375, 0.01050567626953125, 0.0363922119140625, 0.06227874755859375, 0.088165283203125, 0.11405181884765625, 0.1399383544921875, 0.16582489013671875, 0.19171142578125, 0.21759796142578125, 0.2434844970703125, 0.26937103271484375, 0.295257568359375, 0.32114410400390625, 0.3470306396484375, 0.37291717529296875, 0.3988037109375, 0.42469024658203125, 0.4505767822265625, 0.47646331787109375, 0.502349853515625, 0.5282363891601562, 0.5541229248046875, 0.5800094604492188, 0.60589599609375, 0.6317825317382812, 0.6576690673828125, 0.6835556030273438, 0.709442138671875, 0.7353286743164062, 0.7612152099609375, 0.7871017456054688, 0.81298828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 5.0, 6.0, 10.0, 15.0, 15.0, 13.0, 13.0, 26.0, 28.0, 30.0, 26.0, 41.0, 34.0, 41.0, 49.0, 51.0, 46.0, 1067.0, 41.0, 57.0, 34.0, 41.0, 27.0, 39.0, 34.0, 24.0, 31.0, 22.0, 38.0, 22.0, 20.0, 13.0, 9.0, 7.0, 4.0, 12.0, 5.0, 2.0, 7.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3046875, -5.1473388671875, -4.989990234375, -4.8326416015625, -4.67529296875, -4.5179443359375, -4.360595703125, -4.2032470703125, -4.0458984375, -3.8885498046875, -3.731201171875, -3.5738525390625, -3.41650390625, -3.2591552734375, -3.101806640625, -2.9444580078125, -2.787109375, -2.6297607421875, -2.472412109375, -2.3150634765625, -2.15771484375, -2.0003662109375, -1.843017578125, -1.6856689453125, -1.5283203125, -1.3709716796875, -1.213623046875, -1.0562744140625, -0.89892578125, -0.7415771484375, -0.584228515625, -0.4268798828125, -0.26953125, -0.1121826171875, 0.045166015625, 0.2025146484375, 0.35986328125, 0.5172119140625, 0.674560546875, 0.8319091796875, 0.9892578125, 1.1466064453125, 1.303955078125, 1.4613037109375, 1.61865234375, 1.7760009765625, 1.933349609375, 2.0906982421875, 2.248046875, 2.4053955078125, 2.562744140625, 2.7200927734375, 2.87744140625, 3.0347900390625, 3.192138671875, 3.3494873046875, 3.5068359375, 3.6641845703125, 3.821533203125, 3.9788818359375, 4.13623046875, 4.2935791015625, 4.450927734375, 4.6082763671875, 4.765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 7.0, 7.0, 9.0, 17.0, 41.0, 55.0, 68.0, 79.0, 146.0, 239.0, 336.0, 550.0, 798.0, 1317.0, 2172.0, 3417.0, 5384.0, 9021.0, 14976.0, 24502.0, 42541.0, 1874815.0, 47922.0, 26656.0, 16490.0, 9906.0, 5994.0, 3739.0, 2109.0, 1381.0, 847.0, 552.0, 359.0, 243.0, 141.0, 98.0, 62.0, 42.0, 33.0, 26.0, 17.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.68359375, -1.626678466796875, -1.56976318359375, -1.512847900390625, -1.4559326171875, -1.399017333984375, -1.34210205078125, -1.285186767578125, -1.228271484375, -1.171356201171875, -1.11444091796875, -1.057525634765625, -1.0006103515625, -0.943695068359375, -0.88677978515625, -0.829864501953125, -0.77294921875, -0.716033935546875, -0.65911865234375, -0.602203369140625, -0.5452880859375, -0.488372802734375, -0.43145751953125, -0.374542236328125, -0.317626953125, -0.260711669921875, -0.20379638671875, -0.146881103515625, -0.0899658203125, -0.033050537109375, 0.02386474609375, 0.080780029296875, 0.1376953125, 0.194610595703125, 0.25152587890625, 0.308441162109375, 0.3653564453125, 0.422271728515625, 0.47918701171875, 0.536102294921875, 0.593017578125, 0.649932861328125, 0.70684814453125, 0.763763427734375, 0.8206787109375, 0.877593994140625, 0.93450927734375, 0.991424560546875, 1.04833984375, 1.105255126953125, 1.16217041015625, 1.219085693359375, 1.2760009765625, 1.332916259765625, 1.38983154296875, 1.446746826171875, 1.503662109375, 1.560577392578125, 1.61749267578125, 1.674407958984375, 1.7313232421875, 1.788238525390625, 1.84515380859375, 1.902069091796875, 1.958984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 5.0, 8.0, 13.0, 16.0, 21.0, 20.0, 22.0, 37.0, 44.0, 32.0, 41.0, 46.0, 49.0, 49.0, 68.0, 61.0, 63.0, 56.0, 51.0, 54.0, 47.0, 27.0, 25.0, 14.0, 23.0, 26.0, 12.0, 12.0, 7.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.054931640625, -0.05336570739746094, -0.051799774169921875, -0.05023384094238281, -0.04866790771484375, -0.04710197448730469, -0.045536041259765625, -0.04397010803222656, -0.0424041748046875, -0.04083824157714844, -0.039272308349609375, -0.03770637512207031, -0.03614044189453125, -0.03457450866699219, -0.033008575439453125, -0.03144264221191406, -0.029876708984375, -0.028310775756835938, -0.026744842529296875, -0.025178909301757812, -0.02361297607421875, -0.022047042846679688, -0.020481109619140625, -0.018915176391601562, -0.0173492431640625, -0.015783309936523438, -0.014217376708984375, -0.012651443481445312, -0.01108551025390625, -0.009519577026367188, -0.007953643798828125, -0.0063877105712890625, -0.00482177734375, -0.0032558441162109375, -0.001689910888671875, -0.0001239776611328125, 0.00144195556640625, 0.0030078887939453125, 0.004573822021484375, 0.0061397552490234375, 0.0077056884765625, 0.009271621704101562, 0.010837554931640625, 0.012403488159179688, 0.01396942138671875, 0.015535354614257812, 0.017101287841796875, 0.018667221069335938, 0.020233154296875, 0.021799087524414062, 0.023365020751953125, 0.024930953979492188, 0.02649688720703125, 0.028062820434570312, 0.029628753662109375, 0.031194686889648438, 0.0327606201171875, 0.03432655334472656, 0.035892486572265625, 0.03745841979980469, 0.03902435302734375, 0.04059028625488281, 0.042156219482421875, 0.04372215270996094, 0.0452880859375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 8.0, 4.0, 12.0, 16.0, 27.0, 36.0, 45.0, 50.0, 90.0, 191.0, 473.0, 966.0, 2609.0, 8799.0, 995225.0, 32969.0, 4237.0, 1490.0, 579.0, 266.0, 134.0, 105.0, 60.0, 38.0, 27.0, 21.0, 13.0, 8.0, 4.0, 12.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.0154266357421875, -0.980072021484375, -0.9447174072265625, -0.90936279296875, -0.8740081787109375, -0.838653564453125, -0.8032989501953125, -0.7679443359375, -0.7325897216796875, -0.697235107421875, -0.6618804931640625, -0.62652587890625, -0.5911712646484375, -0.555816650390625, -0.5204620361328125, -0.485107421875, -0.4497528076171875, -0.414398193359375, -0.3790435791015625, -0.34368896484375, -0.3083343505859375, -0.272979736328125, -0.2376251220703125, -0.2022705078125, -0.1669158935546875, -0.131561279296875, -0.0962066650390625, -0.06085205078125, -0.0254974365234375, 0.009857177734375, 0.0452117919921875, 0.08056640625, 0.1159210205078125, 0.151275634765625, 0.1866302490234375, 0.22198486328125, 0.2573394775390625, 0.292694091796875, 0.3280487060546875, 0.3634033203125, 0.3987579345703125, 0.434112548828125, 0.4694671630859375, 0.50482177734375, 0.5401763916015625, 0.575531005859375, 0.6108856201171875, 0.646240234375, 0.6815948486328125, 0.716949462890625, 0.7523040771484375, 0.78765869140625, 0.8230133056640625, 0.858367919921875, 0.8937225341796875, 0.9290771484375, 0.9644317626953125, 0.999786376953125, 1.0351409912109375, 1.07049560546875, 1.1058502197265625, 1.141204833984375, 1.1765594482421875, 1.2119140625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 11.0, 25.0, 85.0, 443.0, 361.0, 70.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41213223338127136, -0.3904305100440979, -0.36872875690460205, -0.3470270335674286, -0.3253253102302551, -0.3036235570907593, -0.2819218337535858, -0.26022011041641235, -0.2385183721780777, -0.21681663393974304, -0.19511491060256958, -0.17341317236423492, -0.15171143412590027, -0.1300097107887268, -0.10830797255039215, -0.08660624921321869, -0.06490451097488403, -0.043202780187129974, -0.021501045674085617, 0.00020068883895874023, 0.0219024196267128, 0.04360415041446686, 0.06530588865280151, 0.08700761198997498, 0.10870935022830963, 0.1304110884666443, 0.15211281180381775, 0.1738145500421524, 0.19551628828048706, 0.21721801161766052, 0.23891974985599518, 0.26062148809432983, 0.2823231816291809, 0.30402490496635437, 0.3257266581058502, 0.3474283814430237, 0.36913010478019714, 0.3908318281173706, 0.41253358125686646, 0.4342353045940399, 0.4559370279312134, 0.47763875126838684, 0.4993405044078827, 0.5210422277450562, 0.542743980884552, 0.5644456744194031, 0.5861474275588989, 0.60784912109375, 0.6295509338378906, 0.6512526869773865, 0.6729543805122375, 0.6946561336517334, 0.7163578867912292, 0.7380595803260803, 0.7597613334655762, 0.7814630270004272, 0.8031647801399231, 0.824866533279419, 0.84656822681427, 0.8682699799537659, 0.8899717330932617, 0.9116734266281128, 0.9333751797676086, 0.9550769329071045, 0.9767786264419556]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 8.0, 5.0, 10.0, 2.0, 10.0, 16.0, 17.0, 14.0, 20.0, 20.0, 16.0, 23.0, 24.0, 32.0, 39.0, 38.0, 41.0, 40.0, 27.0, 32.0, 31.0, 37.0, 33.0, 30.0, 44.0, 44.0, 40.0, 28.0, 37.0, 36.0, 21.0, 26.0, 25.0, 25.0, 14.0, 18.0, 15.0, 16.0, 8.0, 7.0, 7.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10407847166061401, -0.10091446340084076, -0.0977504551410675, -0.09458643943071365, -0.0914224311709404, -0.08825842291116714, -0.0850944072008133, -0.08193039894104004, -0.07876639068126678, -0.07560238242149353, -0.07243837416172028, -0.06927435845136642, -0.06611035019159317, -0.06294634193181992, -0.05978232994675636, -0.05661831796169281, -0.053454309701919556, -0.0502903014421463, -0.04712628945708275, -0.043962277472019196, -0.04079826921224594, -0.03763426095247269, -0.034470248967409134, -0.03130623698234558, -0.028142228722572327, -0.024978218600153923, -0.02181420847773552, -0.018650198355317116, -0.015486188232898712, -0.012322178110480309, -0.009158167988061905, -0.005994157865643501, -0.0028301477432250977, 0.00033386237919330597, 0.0034978725016117096, 0.006661882624030113, 0.009825892746448517, 0.01298990286886692, 0.016153912991285324, 0.019317923113703728, 0.02248193323612213, 0.025645943358540535, 0.02880995348095894, 0.03197396546602249, 0.035137973725795746, 0.038301981985569, 0.04146599397063255, 0.044630005955696106, 0.04779401421546936, 0.050958022475242615, 0.05412203446030617, 0.05728604644536972, 0.060450054705142975, 0.06361406296491623, 0.06677807867527008, 0.06994208693504333, 0.07310609519481659, 0.07627010345458984, 0.0794341117143631, 0.08259812742471695, 0.0857621356844902, 0.08892614394426346, 0.09209015965461731, 0.09525416791439056, 0.09841817617416382]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 14.0, 5.0, 8.0, 14.0, 13.0, 13.0, 25.0, 30.0, 35.0, 31.0, 38.0, 28.0, 49.0, 33.0, 37.0, 38.0, 37.0, 55.0, 54.0, 49.0, 45.0, 51.0, 53.0, 30.0, 30.0, 33.0, 30.0, 15.0, 24.0, 14.0, 15.0, 11.0, 8.0, 7.0, 3.0, 8.0, 3.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.8416748046875, -5.620849609375, -5.4000244140625, -5.17919921875, -4.9583740234375, -4.737548828125, -4.5167236328125, -4.2958984375, -4.0750732421875, -3.854248046875, -3.6334228515625, -3.41259765625, -3.1917724609375, -2.970947265625, -2.7501220703125, -2.529296875, -2.3084716796875, -2.087646484375, -1.8668212890625, -1.64599609375, -1.4251708984375, -1.204345703125, -0.9835205078125, -0.7626953125, -0.5418701171875, -0.321044921875, -0.1002197265625, 0.12060546875, 0.3414306640625, 0.562255859375, 0.7830810546875, 1.00390625, 1.2247314453125, 1.445556640625, 1.6663818359375, 1.88720703125, 2.1080322265625, 2.328857421875, 2.5496826171875, 2.7705078125, 2.9913330078125, 3.212158203125, 3.4329833984375, 3.65380859375, 3.8746337890625, 4.095458984375, 4.3162841796875, 4.537109375, 4.7579345703125, 4.978759765625, 5.1995849609375, 5.42041015625, 5.6412353515625, 5.862060546875, 6.0828857421875, 6.3037109375, 6.5245361328125, 6.745361328125, 6.9661865234375, 7.18701171875, 7.4078369140625, 7.628662109375, 7.8494873046875, 8.0703125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 7.0, 3.0, 7.0, 10.0, 16.0, 15.0, 31.0, 38.0, 35.0, 66.0, 93.0, 163.0, 344.0, 870.0, 2288.0, 6783.0, 19968.0, 57185.0, 191820.0, 496820.0, 185686.0, 56076.0, 19410.0, 6792.0, 2432.0, 809.0, 336.0, 169.0, 73.0, 58.0, 31.0, 35.0, 21.0, 21.0, 16.0, 6.0, 10.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.2716064453125, -7.933837890625, -7.5960693359375, -7.25830078125, -6.9205322265625, -6.582763671875, -6.2449951171875, -5.9072265625, -5.5694580078125, -5.231689453125, -4.8939208984375, -4.55615234375, -4.2183837890625, -3.880615234375, -3.5428466796875, -3.205078125, -2.8673095703125, -2.529541015625, -2.1917724609375, -1.85400390625, -1.5162353515625, -1.178466796875, -0.8406982421875, -0.5029296875, -0.1651611328125, 0.172607421875, 0.5103759765625, 0.84814453125, 1.1859130859375, 1.523681640625, 1.8614501953125, 2.19921875, 2.5369873046875, 2.874755859375, 3.2125244140625, 3.55029296875, 3.8880615234375, 4.225830078125, 4.5635986328125, 4.9013671875, 5.2391357421875, 5.576904296875, 5.9146728515625, 6.25244140625, 6.5902099609375, 6.927978515625, 7.2657470703125, 7.603515625, 7.9412841796875, 8.279052734375, 8.6168212890625, 8.95458984375, 9.2923583984375, 9.630126953125, 9.9678955078125, 10.3056640625, 10.6434326171875, 10.981201171875, 11.3189697265625, 11.65673828125, 11.9945068359375, 12.332275390625, 12.6700439453125, 13.0078125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 1.0, 9.0, 15.0, 8.0, 12.0, 12.0, 22.0, 19.0, 16.0, 37.0, 25.0, 32.0, 36.0, 28.0, 43.0, 50.0, 64.0, 87.0, 166.0, 304.0, 1332.0, 167.0, 97.0, 59.0, 46.0, 46.0, 38.0, 23.0, 30.0, 24.0, 29.0, 25.0, 20.0, 17.0, 12.0, 18.0, 14.0, 11.0, 7.0, 9.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.75, -18.147216796875, -17.54443359375, -16.941650390625, -16.3388671875, -15.736083984375, -15.13330078125, -14.530517578125, -13.927734375, -13.324951171875, -12.72216796875, -12.119384765625, -11.5166015625, -10.913818359375, -10.31103515625, -9.708251953125, -9.10546875, -8.502685546875, -7.89990234375, -7.297119140625, -6.6943359375, -6.091552734375, -5.48876953125, -4.885986328125, -4.283203125, -3.680419921875, -3.07763671875, -2.474853515625, -1.8720703125, -1.269287109375, -0.66650390625, -0.063720703125, 0.5390625, 1.141845703125, 1.74462890625, 2.347412109375, 2.9501953125, 3.552978515625, 4.15576171875, 4.758544921875, 5.361328125, 5.964111328125, 6.56689453125, 7.169677734375, 7.7724609375, 8.375244140625, 8.97802734375, 9.580810546875, 10.18359375, 10.786376953125, 11.38916015625, 11.991943359375, 12.5947265625, 13.197509765625, 13.80029296875, 14.403076171875, 15.005859375, 15.608642578125, 16.21142578125, 16.814208984375, 17.4169921875, 18.019775390625, 18.62255859375, 19.225341796875, 19.828125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 11.0, 10.0, 8.0, 15.0, 16.0, 15.0, 29.0, 24.0, 34.0, 35.0, 59.0, 38.0, 76.0, 70.0, 122.0, 198.0, 357.0, 724.0, 2356.0, 42591.0, 2922776.0, 169838.0, 4050.0, 980.0, 408.0, 220.0, 136.0, 115.0, 83.0, 58.0, 37.0, 41.0, 31.0, 35.0, 18.0, 24.0, 15.0, 6.0, 10.0, 12.0, 3.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-49.90625, -48.4228515625, -46.939453125, -45.4560546875, -43.97265625, -42.4892578125, -41.005859375, -39.5224609375, -38.0390625, -36.5556640625, -35.072265625, -33.5888671875, -32.10546875, -30.6220703125, -29.138671875, -27.6552734375, -26.171875, -24.6884765625, -23.205078125, -21.7216796875, -20.23828125, -18.7548828125, -17.271484375, -15.7880859375, -14.3046875, -12.8212890625, -11.337890625, -9.8544921875, -8.37109375, -6.8876953125, -5.404296875, -3.9208984375, -2.4375, -0.9541015625, 0.529296875, 2.0126953125, 3.49609375, 4.9794921875, 6.462890625, 7.9462890625, 9.4296875, 10.9130859375, 12.396484375, 13.8798828125, 15.36328125, 16.8466796875, 18.330078125, 19.8134765625, 21.296875, 22.7802734375, 24.263671875, 25.7470703125, 27.23046875, 28.7138671875, 30.197265625, 31.6806640625, 33.1640625, 34.6474609375, 36.130859375, 37.6142578125, 39.09765625, 40.5810546875, 42.064453125, 43.5478515625, 45.03125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 10.0, 14.0, 17.0, 49.0, 77.0, 111.0, 135.0, 143.0, 126.0, 102.0, 76.0, 51.0, 48.0, 19.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.80305099487305, -43.72513198852539, -42.647212982177734, -41.569297790527344, -40.49137878417969, -39.41345977783203, -38.335540771484375, -37.25762176513672, -36.17970657348633, -35.10178756713867, -34.023868560791016, -32.945953369140625, -31.86803436279297, -30.790115356445312, -29.712196350097656, -28.634279251098633, -27.556360244750977, -26.47844123840332, -25.400524139404297, -24.32260513305664, -23.244688034057617, -22.16676902770996, -21.088851928710938, -20.01093292236328, -18.933013916015625, -17.85509490966797, -16.777177810668945, -15.699258804321289, -14.621341705322266, -13.54342269897461, -12.46550464630127, -11.38758659362793, -10.309667587280273, -9.231749534606934, -8.153831481933594, -7.075912952423096, -5.997994899749756, -4.920076847076416, -3.842158317565918, -2.764240264892578, -1.6863222122192383, -0.6084040403366089, 0.4695141315460205, 1.5474324226379395, 2.6253504753112793, 3.703268527984619, 4.781187057495117, 5.859105110168457, 6.937023162841797, 8.014941215515137, 9.092859268188477, 10.170778274536133, 11.248695373535156, 12.326614379882812, 13.404532432556152, 14.482450485229492, 15.560368537902832, 16.638286590576172, 17.716205596923828, 18.79412269592285, 19.872041702270508, 20.94995880126953, 22.027877807617188, 23.105796813964844, 24.183713912963867]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 13.0, 7.0, 11.0, 14.0, 12.0, 17.0, 23.0, 21.0, 22.0, 27.0, 29.0, 43.0, 38.0, 37.0, 37.0, 28.0, 39.0, 37.0, 49.0, 39.0, 43.0, 28.0, 32.0, 42.0, 41.0, 35.0, 29.0, 19.0, 21.0, 31.0, 16.0, 13.0, 13.0, 12.0, 9.0, 12.0, 9.0, 7.0, 7.0, 1.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.77058410644531, -49.14675521850586, -47.52293014526367, -45.89910125732422, -44.27527618408203, -42.65144729614258, -41.027618408203125, -39.40379333496094, -37.77996826171875, -36.1561393737793, -34.53231430053711, -32.908485412597656, -31.28466033935547, -29.660831451416016, -28.037004470825195, -26.413177490234375, -24.789348602294922, -23.1655216217041, -21.54169464111328, -19.917865753173828, -18.29404067993164, -16.670211791992188, -15.046384811401367, -13.422557830810547, -11.798730850219727, -10.174903869628906, -8.551076889038086, -6.927248954772949, -5.303421974182129, -3.6795949935913086, -2.055767059326172, -0.43194007873535156, 1.1918907165527344, 2.815717935562134, 4.439545154571533, 6.063372611999512, 7.687199592590332, 9.311026573181152, 10.934854507446289, 12.55868148803711, 14.18250846862793, 15.80633544921875, 17.43016242980957, 19.05398941040039, 20.677818298339844, 22.30164337158203, 23.925472259521484, 25.549299240112305, 27.173126220703125, 28.796953201293945, 30.420780181884766, 32.04460906982422, 33.668434143066406, 35.29226303100586, 36.91609191894531, 38.5399169921875, 40.16374206542969, 41.78757095336914, 43.41139602661133, 45.03522491455078, 46.65904998779297, 48.28287887573242, 49.906707763671875, 51.53053283691406, 53.154361724853516]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 6.0, 8.0, 13.0, 13.0, 13.0, 8.0, 18.0, 19.0, 23.0, 29.0, 27.0, 29.0, 27.0, 27.0, 41.0, 33.0, 45.0, 33.0, 46.0, 48.0, 48.0, 38.0, 44.0, 44.0, 44.0, 37.0, 28.0, 34.0, 29.0, 27.0, 25.0, 23.0, 12.0, 17.0, 9.0, 5.0, 8.0, 5.0, 5.0, 5.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.43450927734375, -6.2010498046875, -5.96759033203125, -5.734130859375, -5.50067138671875, -5.2672119140625, -5.03375244140625, -4.80029296875, -4.56683349609375, -4.3333740234375, -4.09991455078125, -3.866455078125, -3.63299560546875, -3.3995361328125, -3.16607666015625, -2.9326171875, -2.69915771484375, -2.4656982421875, -2.23223876953125, -1.998779296875, -1.76531982421875, -1.5318603515625, -1.29840087890625, -1.06494140625, -0.83148193359375, -0.5980224609375, -0.36456298828125, -0.131103515625, 0.10235595703125, 0.3358154296875, 0.56927490234375, 0.802734375, 1.03619384765625, 1.2696533203125, 1.50311279296875, 1.736572265625, 1.97003173828125, 2.2034912109375, 2.43695068359375, 2.67041015625, 2.90386962890625, 3.1373291015625, 3.37078857421875, 3.604248046875, 3.83770751953125, 4.0711669921875, 4.30462646484375, 4.5380859375, 4.77154541015625, 5.0050048828125, 5.23846435546875, 5.471923828125, 5.70538330078125, 5.9388427734375, 6.17230224609375, 6.40576171875, 6.63922119140625, 6.8726806640625, 7.10614013671875, 7.339599609375, 7.57305908203125, 7.8065185546875, 8.03997802734375, 8.2734375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 9.0, 13.0, 20.0, 20.0, 41.0, 61.0, 82.0, 138.0, 225.0, 469.0, 930.0, 1956.0, 4518.0, 11372.0, 28918.0, 74219.0, 187644.0, 443282.0, 873879.0, 1127437.0, 787208.0, 387503.0, 161173.0, 62795.0, 23852.0, 9455.0, 3791.0, 1614.0, 705.0, 385.0, 190.0, 125.0, 85.0, 43.0, 32.0, 16.0, 19.0, 15.0, 10.0, 3.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.421875, -6.210693359375, -5.99951171875, -5.788330078125, -5.5771484375, -5.365966796875, -5.15478515625, -4.943603515625, -4.732421875, -4.521240234375, -4.31005859375, -4.098876953125, -3.8876953125, -3.676513671875, -3.46533203125, -3.254150390625, -3.04296875, -2.831787109375, -2.62060546875, -2.409423828125, -2.1982421875, -1.987060546875, -1.77587890625, -1.564697265625, -1.353515625, -1.142333984375, -0.93115234375, -0.719970703125, -0.5087890625, -0.297607421875, -0.08642578125, 0.124755859375, 0.3359375, 0.547119140625, 0.75830078125, 0.969482421875, 1.1806640625, 1.391845703125, 1.60302734375, 1.814208984375, 2.025390625, 2.236572265625, 2.44775390625, 2.658935546875, 2.8701171875, 3.081298828125, 3.29248046875, 3.503662109375, 3.71484375, 3.926025390625, 4.13720703125, 4.348388671875, 4.5595703125, 4.770751953125, 4.98193359375, 5.193115234375, 5.404296875, 5.615478515625, 5.82666015625, 6.037841796875, 6.2490234375, 6.460205078125, 6.67138671875, 6.882568359375, 7.09375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 24.0, 13.0, 28.0, 18.0, 44.0, 41.0, 51.0, 68.0, 85.0, 127.0, 151.0, 178.0, 221.0, 262.0, 318.0, 372.0, 361.0, 306.0, 250.0, 242.0, 198.0, 141.0, 107.0, 102.0, 77.0, 62.0, 48.0, 38.0, 27.0, 24.0, 18.0, 10.0, 11.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.5546875, -10.236572265625, -9.91845703125, -9.600341796875, -9.2822265625, -8.964111328125, -8.64599609375, -8.327880859375, -8.009765625, -7.691650390625, -7.37353515625, -7.055419921875, -6.7373046875, -6.419189453125, -6.10107421875, -5.782958984375, -5.46484375, -5.146728515625, -4.82861328125, -4.510498046875, -4.1923828125, -3.874267578125, -3.55615234375, -3.238037109375, -2.919921875, -2.601806640625, -2.28369140625, -1.965576171875, -1.6474609375, -1.329345703125, -1.01123046875, -0.693115234375, -0.375, -0.056884765625, 0.26123046875, 0.579345703125, 0.8974609375, 1.215576171875, 1.53369140625, 1.851806640625, 2.169921875, 2.488037109375, 2.80615234375, 3.124267578125, 3.4423828125, 3.760498046875, 4.07861328125, 4.396728515625, 4.71484375, 5.032958984375, 5.35107421875, 5.669189453125, 5.9873046875, 6.305419921875, 6.62353515625, 6.941650390625, 7.259765625, 7.577880859375, 7.89599609375, 8.214111328125, 8.5322265625, 8.850341796875, 9.16845703125, 9.486572265625, 9.8046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 7.0, 11.0, 11.0, 12.0, 20.0, 16.0, 36.0, 36.0, 50.0, 81.0, 92.0, 115.0, 195.0, 258.0, 455.0, 732.0, 1927.0, 21253.0, 1109762.0, 2973181.0, 79998.0, 3440.0, 920.0, 555.0, 337.0, 201.0, 154.0, 97.0, 76.0, 50.0, 43.0, 37.0, 24.0, 27.0, 21.0, 16.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-35.40625, -34.2705078125, -33.134765625, -31.9990234375, -30.86328125, -29.7275390625, -28.591796875, -27.4560546875, -26.3203125, -25.1845703125, -24.048828125, -22.9130859375, -21.77734375, -20.6416015625, -19.505859375, -18.3701171875, -17.234375, -16.0986328125, -14.962890625, -13.8271484375, -12.69140625, -11.5556640625, -10.419921875, -9.2841796875, -8.1484375, -7.0126953125, -5.876953125, -4.7412109375, -3.60546875, -2.4697265625, -1.333984375, -0.1982421875, 0.9375, 2.0732421875, 3.208984375, 4.3447265625, 5.48046875, 6.6162109375, 7.751953125, 8.8876953125, 10.0234375, 11.1591796875, 12.294921875, 13.4306640625, 14.56640625, 15.7021484375, 16.837890625, 17.9736328125, 19.109375, 20.2451171875, 21.380859375, 22.5166015625, 23.65234375, 24.7880859375, 25.923828125, 27.0595703125, 28.1953125, 29.3310546875, 30.466796875, 31.6025390625, 32.73828125, 33.8740234375, 35.009765625, 36.1455078125, 37.28125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 15.0, 48.0, 134.0, 192.0, 232.0, 214.0, 116.0, 42.0, 18.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.10963439941406, -172.3258514404297, -168.5420684814453, -164.75830078125, -160.97451782226562, -157.19073486328125, -153.40695190429688, -149.6231689453125, -145.83938598632812, -142.05560302734375, -138.27182006835938, -134.48805236816406, -130.7042694091797, -126.92048645019531, -123.13670349121094, -119.35292053222656, -115.56915283203125, -111.78536987304688, -108.00159454345703, -104.21781158447266, -100.43403625488281, -96.65025329589844, -92.86647033691406, -89.08268737792969, -85.29891204833984, -81.51512908935547, -77.73135375976562, -73.94757080078125, -70.16378784179688, -66.38001251220703, -62.596229553222656, -58.81245040893555, -55.02867889404297, -51.24489974975586, -47.46112060546875, -43.677337646484375, -39.893558502197266, -36.109779357910156, -32.32599639892578, -28.542217254638672, -24.758438110351562, -20.974658966064453, -17.19087791442871, -13.407097816467285, -9.62331771850586, -5.83953857421875, -2.055757522583008, 1.7280235290527344, 5.511802673339844, 9.29558277130127, 13.079362869262695, 16.863143920898438, 20.646923065185547, 24.430702209472656, 28.2144832611084, 31.99826431274414, 35.78204345703125, 39.56582260131836, 43.34960174560547, 47.133384704589844, 50.91716384887695, 54.70094299316406, 58.48472595214844, 62.26850509643555, 66.05228424072266]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 8.0, 3.0, 7.0, 15.0, 15.0, 16.0, 22.0, 20.0, 21.0, 22.0, 26.0, 26.0, 36.0, 33.0, 37.0, 30.0, 33.0, 37.0, 31.0, 54.0, 36.0, 48.0, 34.0, 25.0, 35.0, 35.0, 31.0, 37.0, 38.0, 20.0, 21.0, 15.0, 16.0, 18.0, 24.0, 12.0, 20.0, 8.0, 5.0, 8.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-45.07491683959961, -43.844627380371094, -42.61433410644531, -41.3840446472168, -40.15375518798828, -38.923465728759766, -37.69317626953125, -36.46288299560547, -35.23259353637695, -34.00230407714844, -32.772010803222656, -31.54172134399414, -30.311431884765625, -29.08114242553711, -27.85085105895996, -26.620559692382812, -25.390270233154297, -24.15998077392578, -22.929689407348633, -21.699398040771484, -20.46910858154297, -19.238819122314453, -18.008527755737305, -16.778236389160156, -15.54794692993164, -14.317656517028809, -13.087366104125977, -11.857075691223145, -10.626785278320312, -9.39649486541748, -8.166204452514648, -6.935914039611816, -5.70562744140625, -4.475337028503418, -3.245046615600586, -2.014756202697754, -0.7844657897949219, 0.44582462310791016, 1.6761150360107422, 2.906405448913574, 4.136695861816406, 5.366986274719238, 6.59727668762207, 7.827567100524902, 9.057857513427734, 10.288147926330566, 11.518438339233398, 12.74872875213623, 13.979019165039062, 15.209309577941895, 16.439599990844727, 17.669891357421875, 18.90018081665039, 20.130470275878906, 21.360761642456055, 22.591053009033203, 23.82134246826172, 25.051631927490234, 26.281923294067383, 27.51221466064453, 28.742504119873047, 29.972793579101562, 31.20308494567871, 32.43337631225586, 33.663665771484375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 6.0, 8.0, 9.0, 14.0, 12.0, 12.0, 10.0, 18.0, 15.0, 20.0, 16.0, 24.0, 29.0, 35.0, 27.0, 31.0, 41.0, 33.0, 36.0, 36.0, 42.0, 38.0, 35.0, 42.0, 44.0, 35.0, 28.0, 32.0, 23.0, 30.0, 35.0, 30.0, 23.0, 14.0, 19.0, 17.0, 11.0, 10.0, 14.0, 5.0, 4.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.96875, -5.78204345703125, -5.5953369140625, -5.40863037109375, -5.221923828125, -5.03521728515625, -4.8485107421875, -4.66180419921875, -4.47509765625, -4.28839111328125, -4.1016845703125, -3.91497802734375, -3.728271484375, -3.54156494140625, -3.3548583984375, -3.16815185546875, -2.9814453125, -2.79473876953125, -2.6080322265625, -2.42132568359375, -2.234619140625, -2.04791259765625, -1.8612060546875, -1.67449951171875, -1.48779296875, -1.30108642578125, -1.1143798828125, -0.92767333984375, -0.740966796875, -0.55426025390625, -0.3675537109375, -0.18084716796875, 0.005859375, 0.19256591796875, 0.3792724609375, 0.56597900390625, 0.752685546875, 0.93939208984375, 1.1260986328125, 1.31280517578125, 1.49951171875, 1.68621826171875, 1.8729248046875, 2.05963134765625, 2.246337890625, 2.43304443359375, 2.6197509765625, 2.80645751953125, 2.9931640625, 3.17987060546875, 3.3665771484375, 3.55328369140625, 3.739990234375, 3.92669677734375, 4.1134033203125, 4.30010986328125, 4.48681640625, 4.67352294921875, 4.8602294921875, 5.04693603515625, 5.233642578125, 5.42034912109375, 5.6070556640625, 5.79376220703125, 5.98046875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 7.0, 6.0, 7.0, 9.0, 17.0, 25.0, 43.0, 49.0, 81.0, 139.0, 199.0, 327.0, 429.0, 702.0, 1037.0, 1543.0, 2293.0, 3278.0, 4759.0, 7085.0, 10024.0, 14251.0, 20059.0, 27908.0, 38170.0, 50813.0, 65254.0, 80550.0, 94792.0, 103766.0, 103678.0, 93507.0, 79820.0, 64258.0, 49801.0, 37530.0, 27524.0, 19600.0, 13919.0, 9766.0, 6929.0, 4728.0, 3244.0, 2140.0, 1513.0, 975.0, 681.0, 462.0, 311.0, 202.0, 128.0, 93.0, 44.0, 43.0, 23.0, 10.0, 10.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.673828125, -0.652069091796875, -0.63031005859375, -0.608551025390625, -0.5867919921875, -0.565032958984375, -0.54327392578125, -0.521514892578125, -0.499755859375, -0.477996826171875, -0.45623779296875, -0.434478759765625, -0.4127197265625, -0.390960693359375, -0.36920166015625, -0.347442626953125, -0.32568359375, -0.303924560546875, -0.28216552734375, -0.260406494140625, -0.2386474609375, -0.216888427734375, -0.19512939453125, -0.173370361328125, -0.151611328125, -0.129852294921875, -0.10809326171875, -0.086334228515625, -0.0645751953125, -0.042816162109375, -0.02105712890625, 0.000701904296875, 0.0224609375, 0.044219970703125, 0.06597900390625, 0.087738037109375, 0.1094970703125, 0.131256103515625, 0.15301513671875, 0.174774169921875, 0.196533203125, 0.218292236328125, 0.24005126953125, 0.261810302734375, 0.2835693359375, 0.305328369140625, 0.32708740234375, 0.348846435546875, 0.37060546875, 0.392364501953125, 0.41412353515625, 0.435882568359375, 0.4576416015625, 0.479400634765625, 0.50115966796875, 0.522918701171875, 0.544677734375, 0.566436767578125, 0.58819580078125, 0.609954833984375, 0.6317138671875, 0.653472900390625, 0.67523193359375, 0.696990966796875, 0.71875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 3.0, 7.0, 6.0, 7.0, 10.0, 10.0, 13.0, 20.0, 19.0, 28.0, 20.0, 36.0, 31.0, 33.0, 37.0, 37.0, 37.0, 47.0, 44.0, 51.0, 1065.0, 50.0, 42.0, 44.0, 36.0, 33.0, 26.0, 27.0, 24.0, 28.0, 28.0, 22.0, 18.0, 14.0, 12.0, 11.0, 10.0, 6.0, 4.0, 4.0, 5.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.33203125, -5.1656494140625, -4.999267578125, -4.8328857421875, -4.66650390625, -4.5001220703125, -4.333740234375, -4.1673583984375, -4.0009765625, -3.8345947265625, -3.668212890625, -3.5018310546875, -3.33544921875, -3.1690673828125, -3.002685546875, -2.8363037109375, -2.669921875, -2.5035400390625, -2.337158203125, -2.1707763671875, -2.00439453125, -1.8380126953125, -1.671630859375, -1.5052490234375, -1.3388671875, -1.1724853515625, -1.006103515625, -0.8397216796875, -0.67333984375, -0.5069580078125, -0.340576171875, -0.1741943359375, -0.0078125, 0.1585693359375, 0.324951171875, 0.4913330078125, 0.65771484375, 0.8240966796875, 0.990478515625, 1.1568603515625, 1.3232421875, 1.4896240234375, 1.656005859375, 1.8223876953125, 1.98876953125, 2.1551513671875, 2.321533203125, 2.4879150390625, 2.654296875, 2.8206787109375, 2.987060546875, 3.1534423828125, 3.31982421875, 3.4862060546875, 3.652587890625, 3.8189697265625, 3.9853515625, 4.1517333984375, 4.318115234375, 4.4844970703125, 4.65087890625, 4.8172607421875, 4.983642578125, 5.1500244140625, 5.31640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 7.0, 10.0, 13.0, 18.0, 12.0, 30.0, 30.0, 58.0, 72.0, 112.0, 191.0, 271.0, 399.0, 673.0, 1050.0, 1612.0, 2516.0, 3853.0, 6310.0, 10391.0, 17010.0, 27371.0, 51541.0, 1871253.0, 39826.0, 23696.0, 14641.0, 8920.0, 5597.0, 3445.0, 2128.0, 1417.0, 925.0, 579.0, 373.0, 240.0, 161.0, 133.0, 89.0, 42.0, 43.0, 28.0, 14.0, 7.0, 12.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.900390625, -1.841644287109375, -1.78289794921875, -1.724151611328125, -1.6654052734375, -1.606658935546875, -1.54791259765625, -1.489166259765625, -1.430419921875, -1.371673583984375, -1.31292724609375, -1.254180908203125, -1.1954345703125, -1.136688232421875, -1.07794189453125, -1.019195556640625, -0.96044921875, -0.901702880859375, -0.84295654296875, -0.784210205078125, -0.7254638671875, -0.666717529296875, -0.60797119140625, -0.549224853515625, -0.490478515625, -0.431732177734375, -0.37298583984375, -0.314239501953125, -0.2554931640625, -0.196746826171875, -0.13800048828125, -0.079254150390625, -0.0205078125, 0.038238525390625, 0.09698486328125, 0.155731201171875, 0.2144775390625, 0.273223876953125, 0.33197021484375, 0.390716552734375, 0.449462890625, 0.508209228515625, 0.56695556640625, 0.625701904296875, 0.6844482421875, 0.743194580078125, 0.80194091796875, 0.860687255859375, 0.91943359375, 0.978179931640625, 1.03692626953125, 1.095672607421875, 1.1544189453125, 1.213165283203125, 1.27191162109375, 1.330657958984375, 1.389404296875, 1.448150634765625, 1.50689697265625, 1.565643310546875, 1.6243896484375, 1.683135986328125, 1.74188232421875, 1.800628662109375, 1.859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 15.0, 24.0, 23.0, 43.0, 52.0, 74.0, 87.0, 122.0, 93.0, 106.0, 98.0, 95.0, 46.0, 35.0, 23.0, 20.0, 4.0, 10.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11114501953125, -0.10782527923583984, -0.10450553894042969, -0.10118579864501953, -0.09786605834960938, -0.09454631805419922, -0.09122657775878906, -0.0879068374633789, -0.08458709716796875, -0.0812673568725586, -0.07794761657714844, -0.07462787628173828, -0.07130813598632812, -0.06798839569091797, -0.06466865539550781, -0.061348915100097656, -0.0580291748046875, -0.054709434509277344, -0.05138969421386719, -0.04806995391845703, -0.044750213623046875, -0.04143047332763672, -0.03811073303222656, -0.034790992736816406, -0.03147125244140625, -0.028151512145996094, -0.024831771850585938, -0.02151203155517578, -0.018192291259765625, -0.014872550964355469, -0.011552810668945312, -0.008233070373535156, -0.004913330078125, -0.0015935897827148438, 0.0017261505126953125, 0.005045890808105469, 0.008365631103515625, 0.011685371398925781, 0.015005111694335938, 0.018324851989746094, 0.02164459228515625, 0.024964332580566406, 0.028284072875976562, 0.03160381317138672, 0.034923553466796875, 0.03824329376220703, 0.04156303405761719, 0.044882774353027344, 0.0482025146484375, 0.051522254943847656, 0.05484199523925781, 0.05816173553466797, 0.061481475830078125, 0.06480121612548828, 0.06812095642089844, 0.0714406967163086, 0.07476043701171875, 0.0780801773071289, 0.08139991760253906, 0.08471965789794922, 0.08803939819335938, 0.09135913848876953, 0.09467887878417969, 0.09799861907958984, 0.101318359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 8.0, 9.0, 27.0, 43.0, 74.0, 138.0, 332.0, 2415.0, 1041632.0, 3202.0, 319.0, 139.0, 72.0, 50.0, 26.0, 21.0, 13.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.416229248046875, -2.33441162109375, -2.252593994140625, -2.1707763671875, -2.088958740234375, -2.00714111328125, -1.925323486328125, -1.843505859375, -1.761688232421875, -1.67987060546875, -1.598052978515625, -1.5162353515625, -1.434417724609375, -1.35260009765625, -1.270782470703125, -1.18896484375, -1.107147216796875, -1.02532958984375, -0.943511962890625, -0.8616943359375, -0.779876708984375, -0.69805908203125, -0.616241455078125, -0.534423828125, -0.452606201171875, -0.37078857421875, -0.288970947265625, -0.2071533203125, -0.125335693359375, -0.04351806640625, 0.038299560546875, 0.1201171875, 0.201934814453125, 0.28375244140625, 0.365570068359375, 0.4473876953125, 0.529205322265625, 0.61102294921875, 0.692840576171875, 0.774658203125, 0.856475830078125, 0.93829345703125, 1.020111083984375, 1.1019287109375, 1.183746337890625, 1.26556396484375, 1.347381591796875, 1.42919921875, 1.511016845703125, 1.59283447265625, 1.674652099609375, 1.7564697265625, 1.838287353515625, 1.92010498046875, 2.001922607421875, 2.083740234375, 2.165557861328125, 2.24737548828125, 2.329193115234375, 2.4110107421875, 2.492828369140625, 2.57464599609375, 2.656463623046875, 2.73828125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 49.0, 427.0, 487.0, 36.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37764009833335876, -0.3631519675254822, -0.348663866519928, -0.3341757357120514, -0.3196876049041748, -0.3051994740962982, -0.29071134328842163, -0.27622324228286743, -0.26173511147499084, -0.24724698066711426, -0.23275886476039886, -0.21827074885368347, -0.20378261804580688, -0.1892944872379303, -0.1748063713312149, -0.1603182554244995, -0.14583012461662292, -0.13134199380874634, -0.11685387790203094, -0.10236575454473495, -0.08787763118743896, -0.07338950783014297, -0.058901384472846985, -0.044413261115550995, -0.029925137758255005, -0.015437014400959015, -0.0009488910436630249, 0.013539232313632965, 0.028027355670928955, 0.042515479028224945, 0.057003602385520935, 0.07149172574281693, 0.0859798789024353, 0.10046800225973129, 0.11495612561702728, 0.12944424152374268, 0.14393237233161926, 0.15842050313949585, 0.17290861904621124, 0.18739673495292664, 0.20188486576080322, 0.2163729965686798, 0.2308611124753952, 0.2453492283821106, 0.2598373591899872, 0.27432548999786377, 0.28881359100341797, 0.30330172181129456, 0.31778985261917114, 0.33227798342704773, 0.3467661142349243, 0.3612542152404785, 0.3757423460483551, 0.3902304768562317, 0.4047185778617859, 0.4192067086696625, 0.43369483947753906, 0.44818297028541565, 0.46267110109329224, 0.47715920209884644, 0.491647332906723, 0.5061354637145996, 0.5206235647201538, 0.5351117253303528, 0.549599826335907]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 1.0, 9.0, 13.0, 9.0, 12.0, 19.0, 10.0, 15.0, 19.0, 23.0, 32.0, 32.0, 32.0, 24.0, 34.0, 35.0, 45.0, 42.0, 39.0, 49.0, 33.0, 47.0, 38.0, 39.0, 33.0, 30.0, 27.0, 24.0, 26.0, 21.0, 33.0, 24.0, 13.0, 23.0, 12.0, 8.0, 14.0, 6.0, 6.0, 9.0, 7.0, 4.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.053669512271881104, -0.05201977491378784, -0.05037003383040428, -0.04872029274702072, -0.04707055538892746, -0.0454208180308342, -0.04377107694745064, -0.04212133586406708, -0.040471598505973816, -0.038821861147880554, -0.037172120064496994, -0.035522378981113434, -0.03387264162302017, -0.03222290426492691, -0.03057316318154335, -0.02892342396080494, -0.02727368474006653, -0.025623945519328117, -0.023974206298589706, -0.022324467077851295, -0.020674727857112885, -0.019024988636374474, -0.017375249415636063, -0.01572551019489765, -0.01407577097415924, -0.01242603175342083, -0.010776292532682419, -0.009126553311944008, -0.007476814091205597, -0.005827074870467186, -0.004177335649728775, -0.002527596428990364, -0.0008778572082519531, 0.0007718820124864578, 0.0024216212332248688, 0.00407136045396328, 0.005721099674701691, 0.007370838895440102, 0.009020578116178513, 0.010670317336916924, 0.012320056557655334, 0.013969795778393745, 0.015619534999132156, 0.017269274219870567, 0.01891901344060898, 0.02056875266134739, 0.0222184918820858, 0.02386823110282421, 0.025517970323562622, 0.027167709544301033, 0.028817448765039444, 0.030467187985777855, 0.032116927206516266, 0.03376666456460953, 0.03541640564799309, 0.03706614673137665, 0.03871588408946991, 0.04036562144756317, 0.04201536253094673, 0.04366510361433029, 0.04531484097242355, 0.046964578330516815, 0.048614319413900375, 0.050264060497283936, 0.0519137978553772]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 10.0, 11.0, 10.0, 13.0, 16.0, 18.0, 26.0, 18.0, 26.0, 24.0, 38.0, 25.0, 40.0, 33.0, 29.0, 39.0, 47.0, 29.0, 43.0, 47.0, 44.0, 38.0, 45.0, 38.0, 25.0, 40.0, 27.0, 22.0, 33.0, 25.0, 22.0, 26.0, 16.0, 9.0, 7.0, 9.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.75, -6.54010009765625, -6.3302001953125, -6.12030029296875, -5.910400390625, -5.70050048828125, -5.4906005859375, -5.28070068359375, -5.07080078125, -4.86090087890625, -4.6510009765625, -4.44110107421875, -4.231201171875, -4.02130126953125, -3.8114013671875, -3.60150146484375, -3.3916015625, -3.18170166015625, -2.9718017578125, -2.76190185546875, -2.552001953125, -2.34210205078125, -2.1322021484375, -1.92230224609375, -1.71240234375, -1.50250244140625, -1.2926025390625, -1.08270263671875, -0.872802734375, -0.66290283203125, -0.4530029296875, -0.24310302734375, -0.033203125, 0.17669677734375, 0.3865966796875, 0.59649658203125, 0.806396484375, 1.01629638671875, 1.2261962890625, 1.43609619140625, 1.64599609375, 1.85589599609375, 2.0657958984375, 2.27569580078125, 2.485595703125, 2.69549560546875, 2.9053955078125, 3.11529541015625, 3.3251953125, 3.53509521484375, 3.7449951171875, 3.95489501953125, 4.164794921875, 4.37469482421875, 4.5845947265625, 4.79449462890625, 5.00439453125, 5.21429443359375, 5.4241943359375, 5.63409423828125, 5.843994140625, 6.05389404296875, 6.2637939453125, 6.47369384765625, 6.68359375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 12.0, 18.0, 12.0, 24.0, 34.0, 56.0, 101.0, 119.0, 228.0, 376.0, 585.0, 940.0, 1501.0, 2483.0, 4194.0, 6688.0, 10956.0, 18086.0, 30087.0, 50680.0, 89281.0, 162733.0, 244117.0, 183456.0, 100656.0, 55993.0, 33156.0, 20241.0, 12301.0, 7477.0, 4652.0, 2894.0, 1660.0, 1105.0, 629.0, 377.0, 225.0, 171.0, 105.0, 51.0, 24.0, 16.0, 16.0, 8.0, 10.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.734375, -5.563720703125, -5.39306640625, -5.222412109375, -5.0517578125, -4.881103515625, -4.71044921875, -4.539794921875, -4.369140625, -4.198486328125, -4.02783203125, -3.857177734375, -3.6865234375, -3.515869140625, -3.34521484375, -3.174560546875, -3.00390625, -2.833251953125, -2.66259765625, -2.491943359375, -2.3212890625, -2.150634765625, -1.97998046875, -1.809326171875, -1.638671875, -1.468017578125, -1.29736328125, -1.126708984375, -0.9560546875, -0.785400390625, -0.61474609375, -0.444091796875, -0.2734375, -0.102783203125, 0.06787109375, 0.238525390625, 0.4091796875, 0.579833984375, 0.75048828125, 0.921142578125, 1.091796875, 1.262451171875, 1.43310546875, 1.603759765625, 1.7744140625, 1.945068359375, 2.11572265625, 2.286376953125, 2.45703125, 2.627685546875, 2.79833984375, 2.968994140625, 3.1396484375, 3.310302734375, 3.48095703125, 3.651611328125, 3.822265625, 3.992919921875, 4.16357421875, 4.334228515625, 4.5048828125, 4.675537109375, 4.84619140625, 5.016845703125, 5.1875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 12.0, 11.0, 18.0, 27.0, 21.0, 30.0, 13.0, 34.0, 32.0, 37.0, 40.0, 49.0, 54.0, 74.0, 140.0, 301.0, 1441.0, 199.0, 82.0, 48.0, 49.0, 40.0, 46.0, 27.0, 24.0, 32.0, 19.0, 10.0, 12.0, 14.0, 18.0, 17.0, 11.0, 13.0, 5.0, 3.0, 4.0, 1.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.03125, -20.335693359375, -19.64013671875, -18.944580078125, -18.2490234375, -17.553466796875, -16.85791015625, -16.162353515625, -15.466796875, -14.771240234375, -14.07568359375, -13.380126953125, -12.6845703125, -11.989013671875, -11.29345703125, -10.597900390625, -9.90234375, -9.206787109375, -8.51123046875, -7.815673828125, -7.1201171875, -6.424560546875, -5.72900390625, -5.033447265625, -4.337890625, -3.642333984375, -2.94677734375, -2.251220703125, -1.5556640625, -0.860107421875, -0.16455078125, 0.531005859375, 1.2265625, 1.922119140625, 2.61767578125, 3.313232421875, 4.0087890625, 4.704345703125, 5.39990234375, 6.095458984375, 6.791015625, 7.486572265625, 8.18212890625, 8.877685546875, 9.5732421875, 10.268798828125, 10.96435546875, 11.659912109375, 12.35546875, 13.051025390625, 13.74658203125, 14.442138671875, 15.1376953125, 15.833251953125, 16.52880859375, 17.224365234375, 17.919921875, 18.615478515625, 19.31103515625, 20.006591796875, 20.7021484375, 21.397705078125, 22.09326171875, 22.788818359375, 23.484375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 8.0, 6.0, 7.0, 10.0, 17.0, 11.0, 26.0, 19.0, 26.0, 38.0, 45.0, 65.0, 98.0, 117.0, 192.0, 276.0, 574.0, 1775.0, 28535.0, 2034227.0, 1058641.0, 18045.0, 1496.0, 478.0, 312.0, 168.0, 133.0, 84.0, 60.0, 40.0, 38.0, 40.0, 22.0, 17.0, 20.0, 11.0, 5.0, 8.0, 3.0, 4.0, 2.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.40625, -32.25146484375, -31.0966796875, -29.94189453125, -28.787109375, -27.63232421875, -26.4775390625, -25.32275390625, -24.16796875, -23.01318359375, -21.8583984375, -20.70361328125, -19.548828125, -18.39404296875, -17.2392578125, -16.08447265625, -14.9296875, -13.77490234375, -12.6201171875, -11.46533203125, -10.310546875, -9.15576171875, -8.0009765625, -6.84619140625, -5.69140625, -4.53662109375, -3.3818359375, -2.22705078125, -1.072265625, 0.08251953125, 1.2373046875, 2.39208984375, 3.546875, 4.70166015625, 5.8564453125, 7.01123046875, 8.166015625, 9.32080078125, 10.4755859375, 11.63037109375, 12.78515625, 13.93994140625, 15.0947265625, 16.24951171875, 17.404296875, 18.55908203125, 19.7138671875, 20.86865234375, 22.0234375, 23.17822265625, 24.3330078125, 25.48779296875, 26.642578125, 27.79736328125, 28.9521484375, 30.10693359375, 31.26171875, 32.41650390625, 33.5712890625, 34.72607421875, 35.880859375, 37.03564453125, 38.1904296875, 39.34521484375, 40.5]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 19.0, 493.0, 482.0, 26.0], "bins": [-475.9611511230469, -468.2827453613281, -460.6043395996094, -452.9259338378906, -445.2475280761719, -437.5691223144531, -429.8907165527344, -422.2123107910156, -414.5339050292969, -406.8554992675781, -399.1770935058594, -391.4986877441406, -383.8202819824219, -376.1418762207031, -368.4634704589844, -360.7850646972656, -353.10662841796875, -345.42822265625, -337.74981689453125, -330.0714111328125, -322.39300537109375, -314.714599609375, -307.03619384765625, -299.3577880859375, -291.67938232421875, -284.0009765625, -276.32257080078125, -268.6441650390625, -260.96575927734375, -253.287353515625, -245.60894775390625, -237.9305419921875, -230.25213623046875, -222.57373046875, -214.89532470703125, -207.2169189453125, -199.53851318359375, -191.860107421875, -184.18170166015625, -176.5032958984375, -168.8248748779297, -161.14646911621094, -153.4680633544922, -145.78965759277344, -138.1112518310547, -130.43284606933594, -122.75443267822266, -115.0760269165039, -107.39762115478516, -99.7192153930664, -92.04080963134766, -84.36239624023438, -76.68399047851562, -69.00558471679688, -61.327178955078125, -53.648773193359375, -45.970367431640625, -38.291961669921875, -30.613554000854492, -22.93514633178711, -15.25674057006836, -7.578334808349609, 0.10007476806640625, 7.778480529785156, 15.456884384155273]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 8.0, 5.0, 16.0, 8.0, 6.0, 12.0, 18.0, 18.0, 29.0, 21.0, 27.0, 30.0, 34.0, 33.0, 48.0, 42.0, 51.0, 41.0, 40.0, 47.0, 51.0, 41.0, 23.0, 46.0, 44.0, 37.0, 28.0, 22.0, 28.0, 24.0, 31.0, 17.0, 12.0, 11.0, 10.0, 10.0, 10.0, 6.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.573909759521484, -49.738372802734375, -47.902835845947266, -46.067298889160156, -44.23176193237305, -42.39622497558594, -40.56068801879883, -38.72515106201172, -36.88961410522461, -35.0540771484375, -33.21854019165039, -31.38300323486328, -29.547466278076172, -27.711929321289062, -25.876392364501953, -24.040855407714844, -22.205318450927734, -20.369781494140625, -18.534244537353516, -16.698707580566406, -14.863170623779297, -13.027633666992188, -11.192096710205078, -9.356559753417969, -7.521022796630859, -5.68548583984375, -3.8499488830566406, -2.0144119262695312, -0.17887496948242188, 1.6566619873046875, 3.492198944091797, 5.327735900878906, 7.16326904296875, 8.99880599975586, 10.834342956542969, 12.669879913330078, 14.505416870117188, 16.340953826904297, 18.176490783691406, 20.012027740478516, 21.847564697265625, 23.683101654052734, 25.518638610839844, 27.354175567626953, 29.189712524414062, 31.025249481201172, 32.86078643798828, 34.69632339477539, 36.5318603515625, 38.36739730834961, 40.20293426513672, 42.03847122192383, 43.87400817871094, 45.70954513549805, 47.545082092285156, 49.380619049072266, 51.216156005859375, 53.051692962646484, 54.887229919433594, 56.7227668762207, 58.55830383300781, 60.39384078979492, 62.22937774658203, 64.06491088867188, 65.90045166015625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 11.0, 11.0, 18.0, 14.0, 19.0, 18.0, 23.0, 29.0, 25.0, 30.0, 26.0, 41.0, 31.0, 48.0, 38.0, 49.0, 47.0, 38.0, 31.0, 41.0, 48.0, 35.0, 38.0, 37.0, 31.0, 26.0, 21.0, 30.0, 24.0, 19.0, 16.0, 12.0, 11.0, 12.0, 6.0, 2.0, 4.0, 8.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.17578125, -6.95867919921875, -6.7415771484375, -6.52447509765625, -6.307373046875, -6.09027099609375, -5.8731689453125, -5.65606689453125, -5.43896484375, -5.22186279296875, -5.0047607421875, -4.78765869140625, -4.570556640625, -4.35345458984375, -4.1363525390625, -3.91925048828125, -3.7021484375, -3.48504638671875, -3.2679443359375, -3.05084228515625, -2.833740234375, -2.61663818359375, -2.3995361328125, -2.18243408203125, -1.96533203125, -1.74822998046875, -1.5311279296875, -1.31402587890625, -1.096923828125, -0.87982177734375, -0.6627197265625, -0.44561767578125, -0.228515625, -0.01141357421875, 0.2056884765625, 0.42279052734375, 0.639892578125, 0.85699462890625, 1.0740966796875, 1.29119873046875, 1.50830078125, 1.72540283203125, 1.9425048828125, 2.15960693359375, 2.376708984375, 2.59381103515625, 2.8109130859375, 3.02801513671875, 3.2451171875, 3.46221923828125, 3.6793212890625, 3.89642333984375, 4.113525390625, 4.33062744140625, 4.5477294921875, 4.76483154296875, 4.98193359375, 5.19903564453125, 5.4161376953125, 5.63323974609375, 5.850341796875, 6.06744384765625, 6.2845458984375, 6.50164794921875, 6.71875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 6.0, 7.0, 5.0, 11.0, 12.0, 10.0, 13.0, 13.0, 15.0, 13.0, 24.0, 33.0, 35.0, 51.0, 75.0, 184.0, 585.0, 2738.0, 15294.0, 92763.0, 560002.0, 2112007.0, 1161752.0, 207599.0, 33551.0, 5761.0, 1068.0, 278.0, 95.0, 52.0, 50.0, 24.0, 30.0, 30.0, 16.0, 18.0, 8.0, 6.0, 8.0, 4.0, 4.0, 10.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -11.979736328125, -11.57666015625, -11.173583984375, -10.7705078125, -10.367431640625, -9.96435546875, -9.561279296875, -9.158203125, -8.755126953125, -8.35205078125, -7.948974609375, -7.5458984375, -7.142822265625, -6.73974609375, -6.336669921875, -5.93359375, -5.530517578125, -5.12744140625, -4.724365234375, -4.3212890625, -3.918212890625, -3.51513671875, -3.112060546875, -2.708984375, -2.305908203125, -1.90283203125, -1.499755859375, -1.0966796875, -0.693603515625, -0.29052734375, 0.112548828125, 0.515625, 0.918701171875, 1.32177734375, 1.724853515625, 2.1279296875, 2.531005859375, 2.93408203125, 3.337158203125, 3.740234375, 4.143310546875, 4.54638671875, 4.949462890625, 5.3525390625, 5.755615234375, 6.15869140625, 6.561767578125, 6.96484375, 7.367919921875, 7.77099609375, 8.174072265625, 8.5771484375, 8.980224609375, 9.38330078125, 9.786376953125, 10.189453125, 10.592529296875, 10.99560546875, 11.398681640625, 11.8017578125, 12.204833984375, 12.60791015625, 13.010986328125, 13.4140625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 9.0, 9.0, 3.0, 9.0, 11.0, 17.0, 22.0, 28.0, 30.0, 48.0, 65.0, 80.0, 109.0, 134.0, 153.0, 212.0, 298.0, 364.0, 412.0, 408.0, 353.0, 304.0, 237.0, 184.0, 142.0, 116.0, 72.0, 61.0, 32.0, 31.0, 34.0, 29.0, 10.0, 12.0, 17.0, 4.0, 6.0, 2.0, 1.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.349609375, -10.02734375, -9.705078125, -9.3828125, -9.060546875, -8.73828125, -8.416015625, -8.09375, -7.771484375, -7.44921875, -7.126953125, -6.8046875, -6.482421875, -6.16015625, -5.837890625, -5.515625, -5.193359375, -4.87109375, -4.548828125, -4.2265625, -3.904296875, -3.58203125, -3.259765625, -2.9375, -2.615234375, -2.29296875, -1.970703125, -1.6484375, -1.326171875, -1.00390625, -0.681640625, -0.359375, -0.037109375, 0.28515625, 0.607421875, 0.9296875, 1.251953125, 1.57421875, 1.896484375, 2.21875, 2.541015625, 2.86328125, 3.185546875, 3.5078125, 3.830078125, 4.15234375, 4.474609375, 4.796875, 5.119140625, 5.44140625, 5.763671875, 6.0859375, 6.408203125, 6.73046875, 7.052734375, 7.375, 7.697265625, 8.01953125, 8.341796875, 8.6640625, 8.986328125, 9.30859375, 9.630859375, 9.953125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 3.0, 7.0, 9.0, 11.0, 26.0, 20.0, 30.0, 39.0, 38.0, 63.0, 101.0, 149.0, 233.0, 358.0, 736.0, 2840.0, 66154.0, 2627611.0, 1460033.0, 32288.0, 1867.0, 586.0, 333.0, 210.0, 143.0, 111.0, 79.0, 49.0, 33.0, 33.0, 20.0, 19.0, 12.0, 7.0, 5.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0625, -32.92333984375, -31.7841796875, -30.64501953125, -29.505859375, -28.36669921875, -27.2275390625, -26.08837890625, -24.94921875, -23.81005859375, -22.6708984375, -21.53173828125, -20.392578125, -19.25341796875, -18.1142578125, -16.97509765625, -15.8359375, -14.69677734375, -13.5576171875, -12.41845703125, -11.279296875, -10.14013671875, -9.0009765625, -7.86181640625, -6.72265625, -5.58349609375, -4.4443359375, -3.30517578125, -2.166015625, -1.02685546875, 0.1123046875, 1.25146484375, 2.390625, 3.52978515625, 4.6689453125, 5.80810546875, 6.947265625, 8.08642578125, 9.2255859375, 10.36474609375, 11.50390625, 12.64306640625, 13.7822265625, 14.92138671875, 16.060546875, 17.19970703125, 18.3388671875, 19.47802734375, 20.6171875, 21.75634765625, 22.8955078125, 24.03466796875, 25.173828125, 26.31298828125, 27.4521484375, 28.59130859375, 29.73046875, 30.86962890625, 32.0087890625, 33.14794921875, 34.287109375, 35.42626953125, 36.5654296875, 37.70458984375, 38.84375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [4.0, 7.0, 36.0, 129.0, 244.0, 301.0, 183.0, 83.0, 28.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.56815528869629, -17.559894561767578, -13.551631927490234, -9.543370246887207, -5.53510856628418, -1.526845932006836, 2.481414794921875, 6.489675521850586, 10.49793815612793, 14.506199836730957, 18.514461517333984, 22.522724151611328, 26.53098487854004, 30.539247512817383, 34.547508239746094, 38.55577087402344, 42.56403350830078, 46.572296142578125, 50.58055877685547, 54.58881759643555, 58.59708023071289, 62.605342864990234, 66.61360168457031, 70.62186431884766, 74.630126953125, 78.63838958740234, 82.64665222167969, 86.65491485595703, 90.66317749023438, 94.67143249511719, 98.67969512939453, 102.68795776367188, 106.69621276855469, 110.70447540283203, 114.71273803710938, 118.72100067138672, 122.72926330566406, 126.73751831054688, 130.74578857421875, 134.75404357910156, 138.76229858398438, 142.7705535888672, 146.77882385253906, 150.78707885742188, 154.79534912109375, 158.80360412597656, 162.81187438964844, 166.82012939453125, 170.82839965820312, 174.83665466308594, 178.8449249267578, 182.85317993164062, 186.8614501953125, 190.8697052001953, 194.8779754638672, 198.88623046875, 202.89450073242188, 206.9027557373047, 210.91102600097656, 214.91928100585938, 218.92755126953125, 222.93580627441406, 226.94407653808594, 230.95233154296875, 234.96058654785156]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 4.0, 8.0, 3.0, 10.0, 6.0, 11.0, 9.0, 12.0, 14.0, 17.0, 10.0, 18.0, 33.0, 18.0, 29.0, 38.0, 31.0, 29.0, 31.0, 39.0, 34.0, 43.0, 45.0, 35.0, 35.0, 48.0, 43.0, 34.0, 38.0, 27.0, 23.0, 23.0, 35.0, 33.0, 23.0, 23.0, 18.0, 10.0, 13.0, 11.0, 4.0, 8.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.207984924316406, -32.057682037353516, -30.907379150390625, -29.757076263427734, -28.606773376464844, -27.456470489501953, -26.306169509887695, -25.155866622924805, -24.005563735961914, -22.855260848999023, -21.704957962036133, -20.554655075073242, -19.404354095458984, -18.254051208496094, -17.103748321533203, -15.953445434570312, -14.803142547607422, -13.652839660644531, -12.50253677368164, -11.352234840393066, -10.201931953430176, -9.051629066467285, -7.901326656341553, -6.75102424621582, -5.60072135925293, -4.450418472290039, -3.3001160621643066, -2.149813413619995, -0.9995107650756836, 0.15079212188720703, 1.3010945320129395, 2.451396942138672, 3.6016998291015625, 4.752002716064453, 5.9023051261901855, 7.052607536315918, 8.202910423278809, 9.3532133102417, 10.503515243530273, 11.653818130493164, 12.804121017456055, 13.954423904418945, 15.104726791381836, 16.255029678344727, 17.405330657958984, 18.555633544921875, 19.705936431884766, 20.856239318847656, 22.006542205810547, 23.156845092773438, 24.307147979736328, 25.45745086669922, 26.60775375366211, 27.758056640625, 28.908357620239258, 30.05866050720215, 31.20896339416504, 32.3592643737793, 33.50956726074219, 34.65987014770508, 35.81017303466797, 36.96047592163086, 38.11077880859375, 39.26108169555664, 40.41138458251953]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 7.0, 5.0, 7.0, 7.0, 10.0, 13.0, 14.0, 17.0, 15.0, 20.0, 37.0, 34.0, 30.0, 35.0, 33.0, 34.0, 54.0, 53.0, 49.0, 54.0, 39.0, 42.0, 44.0, 44.0, 36.0, 27.0, 38.0, 27.0, 22.0, 25.0, 26.0, 34.0, 11.0, 12.0, 14.0, 11.0, 10.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69140625, -6.45904541015625, -6.2266845703125, -5.99432373046875, -5.761962890625, -5.52960205078125, -5.2972412109375, -5.06488037109375, -4.83251953125, -4.60015869140625, -4.3677978515625, -4.13543701171875, -3.903076171875, -3.67071533203125, -3.4383544921875, -3.20599365234375, -2.9736328125, -2.74127197265625, -2.5089111328125, -2.27655029296875, -2.044189453125, -1.81182861328125, -1.5794677734375, -1.34710693359375, -1.11474609375, -0.88238525390625, -0.6500244140625, -0.41766357421875, -0.185302734375, 0.04705810546875, 0.2794189453125, 0.51177978515625, 0.744140625, 0.97650146484375, 1.2088623046875, 1.44122314453125, 1.673583984375, 1.90594482421875, 2.1383056640625, 2.37066650390625, 2.60302734375, 2.83538818359375, 3.0677490234375, 3.30010986328125, 3.532470703125, 3.76483154296875, 3.9971923828125, 4.22955322265625, 4.4619140625, 4.69427490234375, 4.9266357421875, 5.15899658203125, 5.391357421875, 5.62371826171875, 5.8560791015625, 6.08843994140625, 6.32080078125, 6.55316162109375, 6.7855224609375, 7.01788330078125, 7.250244140625, 7.48260498046875, 7.7149658203125, 7.94732666015625, 8.1796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 12.0, 21.0, 29.0, 51.0, 55.0, 112.0, 164.0, 298.0, 434.0, 790.0, 1338.0, 2071.0, 3442.0, 5386.0, 8926.0, 14080.0, 22202.0, 33797.0, 49999.0, 70913.0, 94456.0, 116309.0, 130085.0, 125994.0, 106652.0, 82773.0, 60796.0, 41654.0, 27943.0, 17995.0, 11551.0, 7048.0, 4271.0, 2735.0, 1628.0, 946.0, 609.0, 361.0, 222.0, 162.0, 86.0, 74.0, 38.0, 14.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8583984375, -0.8321990966796875, -0.805999755859375, -0.7798004150390625, -0.75360107421875, -0.7274017333984375, -0.701202392578125, -0.6750030517578125, -0.6488037109375, -0.6226043701171875, -0.596405029296875, -0.5702056884765625, -0.54400634765625, -0.5178070068359375, -0.491607666015625, -0.4654083251953125, -0.439208984375, -0.4130096435546875, -0.386810302734375, -0.3606109619140625, -0.33441162109375, -0.3082122802734375, -0.282012939453125, -0.2558135986328125, -0.2296142578125, -0.2034149169921875, -0.177215576171875, -0.1510162353515625, -0.12481689453125, -0.0986175537109375, -0.072418212890625, -0.0462188720703125, -0.02001953125, 0.0061798095703125, 0.032379150390625, 0.0585784912109375, 0.08477783203125, 0.1109771728515625, 0.137176513671875, 0.1633758544921875, 0.1895751953125, 0.2157745361328125, 0.241973876953125, 0.2681732177734375, 0.29437255859375, 0.3205718994140625, 0.346771240234375, 0.3729705810546875, 0.399169921875, 0.4253692626953125, 0.451568603515625, 0.4777679443359375, 0.50396728515625, 0.5301666259765625, 0.556365966796875, 0.5825653076171875, 0.6087646484375, 0.6349639892578125, 0.661163330078125, 0.6873626708984375, 0.71356201171875, 0.7397613525390625, 0.765960693359375, 0.7921600341796875, 0.818359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 15.0, 8.0, 7.0, 22.0, 7.0, 12.0, 14.0, 12.0, 25.0, 25.0, 30.0, 25.0, 25.0, 43.0, 29.0, 36.0, 41.0, 35.0, 48.0, 1072.0, 35.0, 33.0, 42.0, 39.0, 34.0, 36.0, 29.0, 33.0, 30.0, 27.0, 31.0, 15.0, 17.0, 18.0, 11.0, 11.0, 16.0, 7.0, 6.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.2435302734375, -5.076904296875, -4.9102783203125, -4.74365234375, -4.5770263671875, -4.410400390625, -4.2437744140625, -4.0771484375, -3.9105224609375, -3.743896484375, -3.5772705078125, -3.41064453125, -3.2440185546875, -3.077392578125, -2.9107666015625, -2.744140625, -2.5775146484375, -2.410888671875, -2.2442626953125, -2.07763671875, -1.9110107421875, -1.744384765625, -1.5777587890625, -1.4111328125, -1.2445068359375, -1.077880859375, -0.9112548828125, -0.74462890625, -0.5780029296875, -0.411376953125, -0.2447509765625, -0.078125, 0.0885009765625, 0.255126953125, 0.4217529296875, 0.58837890625, 0.7550048828125, 0.921630859375, 1.0882568359375, 1.2548828125, 1.4215087890625, 1.588134765625, 1.7547607421875, 1.92138671875, 2.0880126953125, 2.254638671875, 2.4212646484375, 2.587890625, 2.7545166015625, 2.921142578125, 3.0877685546875, 3.25439453125, 3.4210205078125, 3.587646484375, 3.7542724609375, 3.9208984375, 4.0875244140625, 4.254150390625, 4.4207763671875, 4.58740234375, 4.7540283203125, 4.920654296875, 5.0872802734375, 5.25390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 7.0, 13.0, 12.0, 17.0, 31.0, 47.0, 58.0, 114.0, 165.0, 210.0, 347.0, 551.0, 822.0, 1267.0, 2100.0, 3421.0, 5585.0, 9349.0, 15985.0, 26335.0, 45956.0, 1880758.0, 42037.0, 24300.0, 14849.0, 8889.0, 5310.0, 3210.0, 1956.0, 1233.0, 795.0, 499.0, 310.0, 206.0, 129.0, 94.0, 55.0, 33.0, 21.0, 15.0, 13.0, 8.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.927734375, -1.8643798828125, -1.801025390625, -1.7376708984375, -1.67431640625, -1.6109619140625, -1.547607421875, -1.4842529296875, -1.4208984375, -1.3575439453125, -1.294189453125, -1.2308349609375, -1.16748046875, -1.1041259765625, -1.040771484375, -0.9774169921875, -0.9140625, -0.8507080078125, -0.787353515625, -0.7239990234375, -0.66064453125, -0.5972900390625, -0.533935546875, -0.4705810546875, -0.4072265625, -0.3438720703125, -0.280517578125, -0.2171630859375, -0.15380859375, -0.0904541015625, -0.027099609375, 0.0362548828125, 0.099609375, 0.1629638671875, 0.226318359375, 0.2896728515625, 0.35302734375, 0.4163818359375, 0.479736328125, 0.5430908203125, 0.6064453125, 0.6697998046875, 0.733154296875, 0.7965087890625, 0.85986328125, 0.9232177734375, 0.986572265625, 1.0499267578125, 1.11328125, 1.1766357421875, 1.239990234375, 1.3033447265625, 1.36669921875, 1.4300537109375, 1.493408203125, 1.5567626953125, 1.6201171875, 1.6834716796875, 1.746826171875, 1.8101806640625, 1.87353515625, 1.9368896484375, 2.000244140625, 2.0635986328125, 2.126953125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 4.0, 4.0, 8.0, 8.0, 17.0, 14.0, 20.0, 20.0, 20.0, 21.0, 32.0, 34.0, 38.0, 48.0, 50.0, 64.0, 61.0, 49.0, 58.0, 47.0, 47.0, 61.0, 42.0, 48.0, 22.0, 28.0, 17.0, 25.0, 11.0, 15.0, 14.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04083251953125, -0.03957986831665039, -0.03832721710205078, -0.03707456588745117, -0.03582191467285156, -0.03456926345825195, -0.033316612243652344, -0.032063961029052734, -0.030811309814453125, -0.029558658599853516, -0.028306007385253906, -0.027053356170654297, -0.025800704956054688, -0.024548053741455078, -0.02329540252685547, -0.02204275131225586, -0.02079010009765625, -0.01953744888305664, -0.01828479766845703, -0.017032146453857422, -0.015779495239257812, -0.014526844024658203, -0.013274192810058594, -0.012021541595458984, -0.010768890380859375, -0.009516239166259766, -0.008263587951660156, -0.007010936737060547, -0.0057582855224609375, -0.004505634307861328, -0.0032529830932617188, -0.0020003318786621094, -0.0007476806640625, 0.0005049705505371094, 0.0017576217651367188, 0.003010272979736328, 0.0042629241943359375, 0.005515575408935547, 0.006768226623535156, 0.008020877838134766, 0.009273529052734375, 0.010526180267333984, 0.011778831481933594, 0.013031482696533203, 0.014284133911132812, 0.015536785125732422, 0.01678943634033203, 0.01804208755493164, 0.01929473876953125, 0.02054738998413086, 0.02180004119873047, 0.023052692413330078, 0.024305343627929688, 0.025557994842529297, 0.026810646057128906, 0.028063297271728516, 0.029315948486328125, 0.030568599700927734, 0.031821250915527344, 0.03307390213012695, 0.03432655334472656, 0.03557920455932617, 0.03683185577392578, 0.03808450698852539, 0.039337158203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 3.0, 4.0, 8.0, 13.0, 14.0, 15.0, 17.0, 32.0, 26.0, 48.0, 51.0, 93.0, 110.0, 191.0, 288.0, 649.0, 5263.0, 1036229.0, 3916.0, 620.0, 296.0, 181.0, 99.0, 92.0, 60.0, 38.0, 35.0, 32.0, 13.0, 28.0, 19.0, 15.0, 10.0, 4.0, 5.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8310546875, -0.8046493530273438, -0.7782440185546875, -0.7518386840820312, -0.725433349609375, -0.6990280151367188, -0.6726226806640625, -0.6462173461914062, -0.61981201171875, -0.5934066772460938, -0.5670013427734375, -0.5405960083007812, -0.514190673828125, -0.48778533935546875, -0.4613800048828125, -0.43497467041015625, -0.4085693359375, -0.38216400146484375, -0.3557586669921875, -0.32935333251953125, -0.302947998046875, -0.27654266357421875, -0.2501373291015625, -0.22373199462890625, -0.19732666015625, -0.17092132568359375, -0.1445159912109375, -0.11811065673828125, -0.091705322265625, -0.06529998779296875, -0.0388946533203125, -0.01248931884765625, 0.013916015625, 0.04032135009765625, 0.0667266845703125, 0.09313201904296875, 0.119537353515625, 0.14594268798828125, 0.1723480224609375, 0.19875335693359375, 0.22515869140625, 0.25156402587890625, 0.2779693603515625, 0.30437469482421875, 0.330780029296875, 0.35718536376953125, 0.3835906982421875, 0.40999603271484375, 0.4364013671875, 0.46280670166015625, 0.4892120361328125, 0.5156173706054688, 0.542022705078125, 0.5684280395507812, 0.5948333740234375, 0.6212387084960938, 0.64764404296875, 0.6740493774414062, 0.7004547119140625, 0.7268600463867188, 0.753265380859375, 0.7796707153320312, 0.8060760498046875, 0.8324813842773438, 0.85888671875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 16.0, 963.0, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7048772573471069, -0.677444338798523, -0.650011420249939, -0.622578501701355, -0.5951456427574158, -0.5677127242088318, -0.5402798056602478, -0.5128468871116638, -0.4854139983654022, -0.45798107981681824, -0.43054819107055664, -0.40311527252197266, -0.37568235397338867, -0.3482494652271271, -0.3208165466785431, -0.2933836579322815, -0.2659507393836975, -0.23851783573627472, -0.21108493208885193, -0.18365201354026794, -0.15621910989284515, -0.12878620624542236, -0.10135328769683838, -0.07392038404941559, -0.0464874804019928, -0.01905457302927971, 0.00837833434343338, 0.03581124544143677, 0.06324414908885956, 0.09067705273628235, 0.11810997128486633, 0.14554287493228912, 0.17297577857971191, 0.2004086822271347, 0.2278415858745575, 0.2552745044231415, 0.2827073931694031, 0.31014031171798706, 0.33757323026657104, 0.36500614881515503, 0.3924390375614166, 0.4198719561100006, 0.4473048448562622, 0.4747377634048462, 0.5021706819534302, 0.5296036005020142, 0.5570365190505981, 0.5844693779945374, 0.6119022965431213, 0.6393352150917053, 0.6667681336402893, 0.6942009925842285, 0.7216339111328125, 0.7490668296813965, 0.7764997482299805, 0.8039326667785645, 0.8313655853271484, 0.8587985038757324, 0.8862314224243164, 0.9136643409729004, 0.9410971999168396, 0.9685301184654236, 0.9959630370140076, 1.0233958959579468, 1.0508288145065308]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 6.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 5.0, 15.0, 13.0, 10.0, 15.0, 22.0, 24.0, 15.0, 27.0, 27.0, 28.0, 48.0, 29.0, 27.0, 34.0, 27.0, 35.0, 33.0, 30.0, 29.0, 31.0, 33.0, 28.0, 30.0, 37.0, 36.0, 30.0, 29.0, 17.0, 29.0, 18.0, 17.0, 18.0, 17.0, 19.0, 16.0, 9.0, 10.0, 7.0, 8.0, 10.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06905996799468994, -0.06679924577474594, -0.06453851610422134, -0.062277793884277344, -0.060017067939043045, -0.057756341993808746, -0.055495619773864746, -0.05323489382863045, -0.05097416788339615, -0.04871344193816185, -0.04645271599292755, -0.04419199377298355, -0.04193126782774925, -0.039670541882514954, -0.03740981966257095, -0.035149093717336655, -0.032888367772102356, -0.030627641826868057, -0.028366917744278908, -0.02610619366168976, -0.02384546771645546, -0.02158474177122116, -0.01932401768863201, -0.017063293606042862, -0.014802567660808563, -0.01254184264689684, -0.010281117632985115, -0.008020392619073391, -0.005759667605161667, -0.0034989425912499428, -0.0012382175773382187, 0.0010225065052509308, 0.0032832324504852295, 0.005543957464396954, 0.007804682478308678, 0.010065407492220402, 0.012326132506132126, 0.01458685752004385, 0.016847582533955574, 0.019108306616544724, 0.021369032561779022, 0.02362975850701332, 0.02589048258960247, 0.02815120667219162, 0.03041193261742592, 0.03267265856266022, 0.03493338078260422, 0.037194106727838516, 0.039454832673072815, 0.041715558618307114, 0.04397628456354141, 0.04623700678348541, 0.04849773272871971, 0.05075845867395401, 0.05301918089389801, 0.05527990683913231, 0.05754063278436661, 0.059801358729600906, 0.062062084674835205, 0.0643228068947792, 0.0665835291147232, 0.0688442587852478, 0.0711049810051918, 0.0733657032251358, 0.0756264328956604]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 12.0, 16.0, 11.0, 20.0, 18.0, 28.0, 20.0, 32.0, 40.0, 33.0, 41.0, 38.0, 43.0, 47.0, 38.0, 47.0, 47.0, 38.0, 30.0, 41.0, 33.0, 36.0, 39.0, 38.0, 23.0, 27.0, 20.0, 18.0, 17.0, 18.0, 10.0, 15.0, 13.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.08203125, -5.86163330078125, -5.6412353515625, -5.42083740234375, -5.200439453125, -4.98004150390625, -4.7596435546875, -4.53924560546875, -4.31884765625, -4.09844970703125, -3.8780517578125, -3.65765380859375, -3.437255859375, -3.21685791015625, -2.9964599609375, -2.77606201171875, -2.5556640625, -2.33526611328125, -2.1148681640625, -1.89447021484375, -1.674072265625, -1.45367431640625, -1.2332763671875, -1.01287841796875, -0.79248046875, -0.57208251953125, -0.3516845703125, -0.13128662109375, 0.089111328125, 0.30950927734375, 0.5299072265625, 0.75030517578125, 0.970703125, 1.19110107421875, 1.4114990234375, 1.63189697265625, 1.852294921875, 2.07269287109375, 2.2930908203125, 2.51348876953125, 2.73388671875, 2.95428466796875, 3.1746826171875, 3.39508056640625, 3.615478515625, 3.83587646484375, 4.0562744140625, 4.27667236328125, 4.4970703125, 4.71746826171875, 4.9378662109375, 5.15826416015625, 5.378662109375, 5.59906005859375, 5.8194580078125, 6.03985595703125, 6.26025390625, 6.48065185546875, 6.7010498046875, 6.92144775390625, 7.141845703125, 7.36224365234375, 7.5826416015625, 7.80303955078125, 8.0234375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 6.0, 10.0, 14.0, 14.0, 19.0, 20.0, 30.0, 25.0, 42.0, 58.0, 71.0, 136.0, 247.0, 523.0, 948.0, 2137.0, 4613.0, 9881.0, 21931.0, 56306.0, 186726.0, 444615.0, 213273.0, 62684.0, 23781.0, 10735.0, 5026.0, 2328.0, 1113.0, 483.0, 240.0, 131.0, 79.0, 65.0, 51.0, 46.0, 34.0, 34.0, 18.0, 11.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.953125, -8.650146484375, -8.34716796875, -8.044189453125, -7.7412109375, -7.438232421875, -7.13525390625, -6.832275390625, -6.529296875, -6.226318359375, -5.92333984375, -5.620361328125, -5.3173828125, -5.014404296875, -4.71142578125, -4.408447265625, -4.10546875, -3.802490234375, -3.49951171875, -3.196533203125, -2.8935546875, -2.590576171875, -2.28759765625, -1.984619140625, -1.681640625, -1.378662109375, -1.07568359375, -0.772705078125, -0.4697265625, -0.166748046875, 0.13623046875, 0.439208984375, 0.7421875, 1.045166015625, 1.34814453125, 1.651123046875, 1.9541015625, 2.257080078125, 2.56005859375, 2.863037109375, 3.166015625, 3.468994140625, 3.77197265625, 4.074951171875, 4.3779296875, 4.680908203125, 4.98388671875, 5.286865234375, 5.58984375, 5.892822265625, 6.19580078125, 6.498779296875, 6.8017578125, 7.104736328125, 7.40771484375, 7.710693359375, 8.013671875, 8.316650390625, 8.61962890625, 8.922607421875, 9.2255859375, 9.528564453125, 9.83154296875, 10.134521484375, 10.4375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 0.0, 4.0, 6.0, 7.0, 11.0, 4.0, 13.0, 13.0, 17.0, 12.0, 22.0, 25.0, 15.0, 30.0, 37.0, 39.0, 49.0, 54.0, 56.0, 110.0, 184.0, 1429.0, 321.0, 147.0, 68.0, 49.0, 42.0, 38.0, 35.0, 30.0, 35.0, 31.0, 24.0, 20.0, 20.0, 14.0, 5.0, 9.0, 8.0, 1.0, 6.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.890625, -24.17529296875, -23.4599609375, -22.74462890625, -22.029296875, -21.31396484375, -20.5986328125, -19.88330078125, -19.16796875, -18.45263671875, -17.7373046875, -17.02197265625, -16.306640625, -15.59130859375, -14.8759765625, -14.16064453125, -13.4453125, -12.72998046875, -12.0146484375, -11.29931640625, -10.583984375, -9.86865234375, -9.1533203125, -8.43798828125, -7.72265625, -7.00732421875, -6.2919921875, -5.57666015625, -4.861328125, -4.14599609375, -3.4306640625, -2.71533203125, -2.0, -1.28466796875, -0.5693359375, 0.14599609375, 0.861328125, 1.57666015625, 2.2919921875, 3.00732421875, 3.72265625, 4.43798828125, 5.1533203125, 5.86865234375, 6.583984375, 7.29931640625, 8.0146484375, 8.72998046875, 9.4453125, 10.16064453125, 10.8759765625, 11.59130859375, 12.306640625, 13.02197265625, 13.7373046875, 14.45263671875, 15.16796875, 15.88330078125, 16.5986328125, 17.31396484375, 18.029296875, 18.74462890625, 19.4599609375, 20.17529296875, 20.890625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 7.0, 7.0, 8.0, 8.0, 19.0, 13.0, 24.0, 24.0, 38.0, 55.0, 62.0, 84.0, 114.0, 166.0, 284.0, 600.0, 2628.0, 36884.0, 2853157.0, 242103.0, 7228.0, 986.0, 401.0, 240.0, 146.0, 85.0, 79.0, 62.0, 34.0, 27.0, 27.0, 17.0, 22.0, 9.0, 13.0, 13.0, 6.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.84375, -40.56494140625, -39.2861328125, -38.00732421875, -36.728515625, -35.44970703125, -34.1708984375, -32.89208984375, -31.61328125, -30.33447265625, -29.0556640625, -27.77685546875, -26.498046875, -25.21923828125, -23.9404296875, -22.66162109375, -21.3828125, -20.10400390625, -18.8251953125, -17.54638671875, -16.267578125, -14.98876953125, -13.7099609375, -12.43115234375, -11.15234375, -9.87353515625, -8.5947265625, -7.31591796875, -6.037109375, -4.75830078125, -3.4794921875, -2.20068359375, -0.921875, 0.35693359375, 1.6357421875, 2.91455078125, 4.193359375, 5.47216796875, 6.7509765625, 8.02978515625, 9.30859375, 10.58740234375, 11.8662109375, 13.14501953125, 14.423828125, 15.70263671875, 16.9814453125, 18.26025390625, 19.5390625, 20.81787109375, 22.0966796875, 23.37548828125, 24.654296875, 25.93310546875, 27.2119140625, 28.49072265625, 29.76953125, 31.04833984375, 32.3271484375, 33.60595703125, 34.884765625, 36.16357421875, 37.4423828125, 38.72119140625, 40.0]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 42.0, 420.0, 468.0, 81.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.24395751953125, -270.9400634765625, -265.6361389160156, -260.3322448730469, -255.0283203125, -249.72442626953125, -244.42051696777344, -239.11660766601562, -233.8126983642578, -228.5087890625, -223.2048797607422, -217.90097045898438, -212.59707641601562, -207.2931671142578, -201.9892578125, -196.6853485107422, -191.38143920898438, -186.07752990722656, -180.77362060546875, -175.46971130371094, -170.16580200195312, -164.86190795898438, -159.55799865722656, -154.25408935546875, -148.95018005371094, -143.64627075195312, -138.3423614501953, -133.0384521484375, -127.73455047607422, -122.4306411743164, -117.12673950195312, -111.82283020019531, -106.51892852783203, -101.21501922607422, -95.91111755371094, -90.60720825195312, -85.30329895019531, -79.9993896484375, -74.69548034667969, -69.3915786743164, -64.0876693725586, -58.78376007080078, -53.479854583740234, -48.17594909667969, -42.872039794921875, -37.56813049316406, -32.264225006103516, -26.96031951904297, -21.656410217285156, -16.352502822875977, -11.048595428466797, -5.744688034057617, -0.4407806396484375, 4.863126754760742, 10.167034149169922, 15.470939636230469, 20.77484893798828, 26.07875633239746, 31.38266372680664, 36.68656921386719, 41.990478515625, 47.29438781738281, 52.59829330444336, 57.902198791503906, 63.20610809326172]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 12.0, 6.0, 9.0, 8.0, 9.0, 11.0, 20.0, 16.0, 14.0, 14.0, 27.0, 26.0, 23.0, 31.0, 29.0, 39.0, 31.0, 39.0, 46.0, 34.0, 49.0, 40.0, 33.0, 38.0, 46.0, 35.0, 34.0, 32.0, 37.0, 36.0, 24.0, 22.0, 18.0, 19.0, 18.0, 13.0, 11.0, 8.0, 12.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-55.91427230834961, -54.134429931640625, -52.35458755493164, -50.574745178222656, -48.794898986816406, -47.01506042480469, -45.23521423339844, -43.45537185668945, -41.67552947998047, -39.895687103271484, -38.1158447265625, -36.336002349853516, -34.55615997314453, -32.77631378173828, -30.996471405029297, -29.216629028320312, -27.436786651611328, -25.656944274902344, -23.87710189819336, -22.097257614135742, -20.317415237426758, -18.537572860717773, -16.757728576660156, -14.977886199951172, -13.198043823242188, -11.418201446533203, -9.638358116149902, -7.85851526260376, -6.078672409057617, -4.298830032348633, -2.518986701965332, -0.7391433715820312, 1.0406951904296875, 2.82053804397583, 4.600380897521973, 6.380223751068115, 8.160066604614258, 9.939908981323242, 11.719752311706543, 13.499595642089844, 15.279438018798828, 17.059280395507812, 18.839122772216797, 20.618967056274414, 22.3988094329834, 24.178651809692383, 25.95849609375, 27.738338470458984, 29.51818084716797, 31.298023223876953, 33.07786560058594, 34.85770797729492, 36.637550354003906, 38.417396545410156, 40.19723892211914, 41.977081298828125, 43.75692367553711, 45.536766052246094, 47.31660842895508, 49.09645080566406, 50.87629699707031, 52.65613555908203, 54.43598175048828, 56.215824127197266, 57.99566650390625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 6.0, 2.0, 11.0, 15.0, 11.0, 19.0, 22.0, 22.0, 23.0, 21.0, 34.0, 32.0, 31.0, 42.0, 47.0, 37.0, 37.0, 40.0, 55.0, 45.0, 38.0, 45.0, 26.0, 41.0, 36.0, 27.0, 24.0, 37.0, 26.0, 19.0, 20.0, 24.0, 21.0, 10.0, 9.0, 16.0, 5.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.25, -7.01507568359375, -6.7801513671875, -6.54522705078125, -6.310302734375, -6.07537841796875, -5.8404541015625, -5.60552978515625, -5.37060546875, -5.13568115234375, -4.9007568359375, -4.66583251953125, -4.430908203125, -4.19598388671875, -3.9610595703125, -3.72613525390625, -3.4912109375, -3.25628662109375, -3.0213623046875, -2.78643798828125, -2.551513671875, -2.31658935546875, -2.0816650390625, -1.84674072265625, -1.61181640625, -1.37689208984375, -1.1419677734375, -0.90704345703125, -0.672119140625, -0.43719482421875, -0.2022705078125, 0.03265380859375, 0.267578125, 0.50250244140625, 0.7374267578125, 0.97235107421875, 1.207275390625, 1.44219970703125, 1.6771240234375, 1.91204833984375, 2.14697265625, 2.38189697265625, 2.6168212890625, 2.85174560546875, 3.086669921875, 3.32159423828125, 3.5565185546875, 3.79144287109375, 4.0263671875, 4.26129150390625, 4.4962158203125, 4.73114013671875, 4.966064453125, 5.20098876953125, 5.4359130859375, 5.67083740234375, 5.90576171875, 6.14068603515625, 6.3756103515625, 6.61053466796875, 6.845458984375, 7.08038330078125, 7.3153076171875, 7.55023193359375, 7.78515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 6.0, 5.0, 6.0, 15.0, 14.0, 18.0, 32.0, 42.0, 58.0, 88.0, 125.0, 320.0, 822.0, 2513.0, 8425.0, 31746.0, 127487.0, 513874.0, 1533999.0, 1397562.0, 433895.0, 106880.0, 25875.0, 6945.0, 2133.0, 708.0, 281.0, 122.0, 80.0, 46.0, 30.0, 30.0, 27.0, 16.0, 13.0, 7.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.1448974609375, -8.828857421875, -8.5128173828125, -8.19677734375, -7.8807373046875, -7.564697265625, -7.2486572265625, -6.9326171875, -6.6165771484375, -6.300537109375, -5.9844970703125, -5.66845703125, -5.3524169921875, -5.036376953125, -4.7203369140625, -4.404296875, -4.0882568359375, -3.772216796875, -3.4561767578125, -3.14013671875, -2.8240966796875, -2.508056640625, -2.1920166015625, -1.8759765625, -1.5599365234375, -1.243896484375, -0.9278564453125, -0.61181640625, -0.2957763671875, 0.020263671875, 0.3363037109375, 0.65234375, 0.9683837890625, 1.284423828125, 1.6004638671875, 1.91650390625, 2.2325439453125, 2.548583984375, 2.8646240234375, 3.1806640625, 3.4967041015625, 3.812744140625, 4.1287841796875, 4.44482421875, 4.7608642578125, 5.076904296875, 5.3929443359375, 5.708984375, 6.0250244140625, 6.341064453125, 6.6571044921875, 6.97314453125, 7.2891845703125, 7.605224609375, 7.9212646484375, 8.2373046875, 8.5533447265625, 8.869384765625, 9.1854248046875, 9.50146484375, 9.8175048828125, 10.133544921875, 10.4495849609375, 10.765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 6.0, 9.0, 10.0, 14.0, 26.0, 15.0, 31.0, 46.0, 63.0, 68.0, 96.0, 140.0, 166.0, 248.0, 284.0, 346.0, 347.0, 385.0, 370.0, 306.0, 231.0, 199.0, 170.0, 111.0, 77.0, 65.0, 57.0, 39.0, 27.0, 25.0, 20.0, 11.0, 10.0, 9.0, 14.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.4251708984375, -8.115966796875, -7.8067626953125, -7.49755859375, -7.1883544921875, -6.879150390625, -6.5699462890625, -6.2607421875, -5.9515380859375, -5.642333984375, -5.3331298828125, -5.02392578125, -4.7147216796875, -4.405517578125, -4.0963134765625, -3.787109375, -3.4779052734375, -3.168701171875, -2.8594970703125, -2.55029296875, -2.2410888671875, -1.931884765625, -1.6226806640625, -1.3134765625, -1.0042724609375, -0.695068359375, -0.3858642578125, -0.07666015625, 0.2325439453125, 0.541748046875, 0.8509521484375, 1.16015625, 1.4693603515625, 1.778564453125, 2.0877685546875, 2.39697265625, 2.7061767578125, 3.015380859375, 3.3245849609375, 3.6337890625, 3.9429931640625, 4.252197265625, 4.5614013671875, 4.87060546875, 5.1798095703125, 5.489013671875, 5.7982177734375, 6.107421875, 6.4166259765625, 6.725830078125, 7.0350341796875, 7.34423828125, 7.6534423828125, 7.962646484375, 8.2718505859375, 8.5810546875, 8.8902587890625, 9.199462890625, 9.5086669921875, 9.81787109375, 10.1270751953125, 10.436279296875, 10.7454833984375, 11.0546875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 8.0, 6.0, 11.0, 15.0, 17.0, 17.0, 25.0, 39.0, 39.0, 73.0, 104.0, 138.0, 185.0, 306.0, 487.0, 994.0, 3222.0, 23026.0, 295005.0, 2875319.0, 923669.0, 61733.0, 6673.0, 1460.0, 582.0, 346.0, 236.0, 145.0, 129.0, 76.0, 45.0, 38.0, 24.0, 21.0, 11.0, 14.0, 14.0, 8.0, 9.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-26.765625, -25.994384765625, -25.22314453125, -24.451904296875, -23.6806640625, -22.909423828125, -22.13818359375, -21.366943359375, -20.595703125, -19.824462890625, -19.05322265625, -18.281982421875, -17.5107421875, -16.739501953125, -15.96826171875, -15.197021484375, -14.42578125, -13.654541015625, -12.88330078125, -12.112060546875, -11.3408203125, -10.569580078125, -9.79833984375, -9.027099609375, -8.255859375, -7.484619140625, -6.71337890625, -5.942138671875, -5.1708984375, -4.399658203125, -3.62841796875, -2.857177734375, -2.0859375, -1.314697265625, -0.54345703125, 0.227783203125, 0.9990234375, 1.770263671875, 2.54150390625, 3.312744140625, 4.083984375, 4.855224609375, 5.62646484375, 6.397705078125, 7.1689453125, 7.940185546875, 8.71142578125, 9.482666015625, 10.25390625, 11.025146484375, 11.79638671875, 12.567626953125, 13.3388671875, 14.110107421875, 14.88134765625, 15.652587890625, 16.423828125, 17.195068359375, 17.96630859375, 18.737548828125, 19.5087890625, 20.280029296875, 21.05126953125, 21.822509765625, 22.59375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 18.0, 22.0, 72.0, 132.0, 197.0, 213.0, 158.0, 98.0, 60.0, 27.0, 9.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-124.78626251220703, -121.91448974609375, -119.04270935058594, -116.17093658447266, -113.29916381835938, -110.4273910522461, -107.55561828613281, -104.683837890625, -101.81206512451172, -98.94029235839844, -96.06851196289062, -93.19673919677734, -90.32496643066406, -87.45319366455078, -84.5814208984375, -81.70964050292969, -78.8378677368164, -75.96609497070312, -73.09431457519531, -70.22254180908203, -67.35076904296875, -64.47899627685547, -61.60721969604492, -58.735443115234375, -55.863670349121094, -52.99189758300781, -50.120121002197266, -47.24834442138672, -44.37657165527344, -41.504798889160156, -38.63302230834961, -35.76124572753906, -32.88947677612305, -30.017702102661133, -27.14592742919922, -24.274152755737305, -21.40237808227539, -18.530603408813477, -15.658828735351562, -12.787054061889648, -9.915279388427734, -7.04350471496582, -4.171730041503906, -1.2999553680419922, 1.5718193054199219, 4.443593978881836, 7.31536865234375, 10.187143325805664, 13.058917999267578, 15.930692672729492, 18.802467346191406, 21.67424201965332, 24.546016693115234, 27.41779136657715, 30.289566040039062, 33.161338806152344, 36.03311538696289, 38.90489196777344, 41.77666473388672, 44.6484375, 47.52021408081055, 50.391990661621094, 53.263763427734375, 56.135536193847656, 59.0073127746582]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 10.0, 8.0, 3.0, 3.0, 7.0, 15.0, 26.0, 27.0, 25.0, 22.0, 25.0, 33.0, 38.0, 25.0, 52.0, 47.0, 38.0, 39.0, 50.0, 59.0, 44.0, 50.0, 56.0, 44.0, 36.0, 26.0, 30.0, 31.0, 24.0, 29.0, 20.0, 9.0, 16.0, 14.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.99076461791992, -42.73167419433594, -41.47258758544922, -40.213497161865234, -38.95440673828125, -37.69532012939453, -36.43622970581055, -35.17713928222656, -33.918052673339844, -32.65896224975586, -31.399873733520508, -30.140785217285156, -28.881694793701172, -27.62260627746582, -26.36351776123047, -25.104427337646484, -23.8453369140625, -22.58624839782715, -21.327157974243164, -20.068069458007812, -18.808979034423828, -17.549890518188477, -16.290802001953125, -15.031712532043457, -13.772623062133789, -12.513533592224121, -11.254444122314453, -9.995355606079102, -8.736266136169434, -7.477176666259766, -6.218087673187256, -4.958998680114746, -3.6999130249023438, -2.440823793411255, -1.181734561920166, 0.07735466957092285, 1.3364439010620117, 2.5955333709716797, 3.8546223640441895, 5.113711357116699, 6.372800827026367, 7.631890296936035, 8.890979766845703, 10.150068283081055, 11.409157752990723, 12.66824722290039, 13.927335739135742, 15.18642520904541, 16.445514678955078, 17.70460319519043, 18.963693618774414, 20.222782135009766, 21.48187255859375, 22.7409610748291, 24.000049591064453, 25.259140014648438, 26.51822853088379, 27.77731704711914, 29.036407470703125, 30.295495986938477, 31.554584503173828, 32.81367492675781, 34.0727653503418, 35.331851959228516, 36.5909423828125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 16.0, 11.0, 11.0, 20.0, 26.0, 16.0, 31.0, 28.0, 35.0, 30.0, 36.0, 39.0, 37.0, 40.0, 50.0, 49.0, 48.0, 41.0, 36.0, 42.0, 38.0, 43.0, 35.0, 28.0, 25.0, 32.0, 28.0, 18.0, 13.0, 16.0, 10.0, 13.0, 5.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.24609375, -7.00836181640625, -6.7706298828125, -6.53289794921875, -6.295166015625, -6.05743408203125, -5.8197021484375, -5.58197021484375, -5.34423828125, -5.10650634765625, -4.8687744140625, -4.63104248046875, -4.393310546875, -4.15557861328125, -3.9178466796875, -3.68011474609375, -3.4423828125, -3.20465087890625, -2.9669189453125, -2.72918701171875, -2.491455078125, -2.25372314453125, -2.0159912109375, -1.77825927734375, -1.54052734375, -1.30279541015625, -1.0650634765625, -0.82733154296875, -0.589599609375, -0.35186767578125, -0.1141357421875, 0.12359619140625, 0.361328125, 0.59906005859375, 0.8367919921875, 1.07452392578125, 1.312255859375, 1.54998779296875, 1.7877197265625, 2.02545166015625, 2.26318359375, 2.50091552734375, 2.7386474609375, 2.97637939453125, 3.214111328125, 3.45184326171875, 3.6895751953125, 3.92730712890625, 4.1650390625, 4.40277099609375, 4.6405029296875, 4.87823486328125, 5.115966796875, 5.35369873046875, 5.5914306640625, 5.82916259765625, 6.06689453125, 6.30462646484375, 6.5423583984375, 6.78009033203125, 7.017822265625, 7.25555419921875, 7.4932861328125, 7.73101806640625, 7.96875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 18.0, 26.0, 51.0, 61.0, 77.0, 133.0, 162.0, 292.0, 432.0, 675.0, 1079.0, 1678.0, 2787.0, 4268.0, 6807.0, 10402.0, 15904.0, 24112.0, 35439.0, 50828.0, 70242.0, 92264.0, 111932.0, 124689.0, 120385.0, 102947.0, 81255.0, 60416.0, 43188.0, 29845.0, 19797.0, 13074.0, 8317.0, 5433.0, 3439.0, 2185.0, 1445.0, 842.0, 540.0, 351.0, 250.0, 166.0, 108.0, 75.0, 43.0, 26.0, 27.0, 14.0, 9.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.76953125, -0.7445144653320312, -0.7194976806640625, -0.6944808959960938, -0.669464111328125, -0.6444473266601562, -0.6194305419921875, -0.5944137573242188, -0.56939697265625, -0.5443801879882812, -0.5193634033203125, -0.49434661865234375, -0.469329833984375, -0.44431304931640625, -0.4192962646484375, -0.39427947998046875, -0.3692626953125, -0.34424591064453125, -0.3192291259765625, -0.29421234130859375, -0.269195556640625, -0.24417877197265625, -0.2191619873046875, -0.19414520263671875, -0.16912841796875, -0.14411163330078125, -0.1190948486328125, -0.09407806396484375, -0.069061279296875, -0.04404449462890625, -0.0190277099609375, 0.00598907470703125, 0.031005859375, 0.05602264404296875, 0.0810394287109375, 0.10605621337890625, 0.131072998046875, 0.15608978271484375, 0.1811065673828125, 0.20612335205078125, 0.23114013671875, 0.25615692138671875, 0.2811737060546875, 0.30619049072265625, 0.331207275390625, 0.35622406005859375, 0.3812408447265625, 0.40625762939453125, 0.4312744140625, 0.45629119873046875, 0.4813079833984375, 0.5063247680664062, 0.531341552734375, 0.5563583374023438, 0.5813751220703125, 0.6063919067382812, 0.63140869140625, 0.6564254760742188, 0.6814422607421875, 0.7064590454101562, 0.731475830078125, 0.7564926147460938, 0.7815093994140625, 0.8065261840820312, 0.83154296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 1.0, 3.0, 13.0, 11.0, 15.0, 10.0, 17.0, 14.0, 22.0, 21.0, 21.0, 32.0, 35.0, 36.0, 29.0, 31.0, 38.0, 33.0, 29.0, 37.0, 1066.0, 30.0, 47.0, 43.0, 39.0, 39.0, 42.0, 28.0, 28.0, 25.0, 21.0, 21.0, 17.0, 21.0, 13.0, 8.0, 14.0, 12.0, 9.0, 7.0, 9.0, 5.0, 6.0, 9.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.84375, -5.67388916015625, -5.5040283203125, -5.33416748046875, -5.164306640625, -4.99444580078125, -4.8245849609375, -4.65472412109375, -4.48486328125, -4.31500244140625, -4.1451416015625, -3.97528076171875, -3.805419921875, -3.63555908203125, -3.4656982421875, -3.29583740234375, -3.1259765625, -2.95611572265625, -2.7862548828125, -2.61639404296875, -2.446533203125, -2.27667236328125, -2.1068115234375, -1.93695068359375, -1.76708984375, -1.59722900390625, -1.4273681640625, -1.25750732421875, -1.087646484375, -0.91778564453125, -0.7479248046875, -0.57806396484375, -0.408203125, -0.23834228515625, -0.0684814453125, 0.10137939453125, 0.271240234375, 0.44110107421875, 0.6109619140625, 0.78082275390625, 0.95068359375, 1.12054443359375, 1.2904052734375, 1.46026611328125, 1.630126953125, 1.79998779296875, 1.9698486328125, 2.13970947265625, 2.3095703125, 2.47943115234375, 2.6492919921875, 2.81915283203125, 2.989013671875, 3.15887451171875, 3.3287353515625, 3.49859619140625, 3.66845703125, 3.83831787109375, 4.0081787109375, 4.17803955078125, 4.347900390625, 4.51776123046875, 4.6876220703125, 4.85748291015625, 5.02734375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 7.0, 14.0, 19.0, 21.0, 45.0, 70.0, 98.0, 162.0, 229.0, 353.0, 557.0, 849.0, 1472.0, 2427.0, 4098.0, 7160.0, 12247.0, 21966.0, 38085.0, 1871887.0, 64558.0, 29790.0, 17039.0, 9883.0, 5722.0, 3263.0, 1958.0, 1158.0, 731.0, 444.0, 321.0, 172.0, 113.0, 63.0, 38.0, 36.0, 24.0, 19.0, 8.0, 3.0, 1.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9228515625, -1.8536529541015625, -1.784454345703125, -1.7152557373046875, -1.64605712890625, -1.5768585205078125, -1.507659912109375, -1.4384613037109375, -1.3692626953125, -1.3000640869140625, -1.230865478515625, -1.1616668701171875, -1.09246826171875, -1.0232696533203125, -0.954071044921875, -0.8848724365234375, -0.815673828125, -0.7464752197265625, -0.677276611328125, -0.6080780029296875, -0.53887939453125, -0.4696807861328125, -0.400482177734375, -0.3312835693359375, -0.2620849609375, -0.1928863525390625, -0.123687744140625, -0.0544891357421875, 0.01470947265625, 0.0839080810546875, 0.153106689453125, 0.2223052978515625, 0.29150390625, 0.3607025146484375, 0.429901123046875, 0.4990997314453125, 0.56829833984375, 0.6374969482421875, 0.706695556640625, 0.7758941650390625, 0.8450927734375, 0.9142913818359375, 0.983489990234375, 1.0526885986328125, 1.12188720703125, 1.1910858154296875, 1.260284423828125, 1.3294830322265625, 1.398681640625, 1.4678802490234375, 1.537078857421875, 1.6062774658203125, 1.67547607421875, 1.7446746826171875, 1.813873291015625, 1.8830718994140625, 1.9522705078125, 2.0214691162109375, 2.090667724609375, 2.1598663330078125, 2.22906494140625, 2.2982635498046875, 2.367462158203125, 2.4366607666015625, 2.505859375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 5.0, 7.0, 10.0, 7.0, 11.0, 24.0, 20.0, 23.0, 24.0, 31.0, 31.0, 30.0, 42.0, 40.0, 47.0, 49.0, 45.0, 38.0, 45.0, 36.0, 52.0, 43.0, 37.0, 40.0, 35.0, 36.0, 27.0, 24.0, 21.0, 23.0, 21.0, 15.0, 11.0, 6.0, 9.0, 5.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036895751953125, -0.03567218780517578, -0.03444862365722656, -0.033225059509277344, -0.032001495361328125, -0.030777931213378906, -0.029554367065429688, -0.02833080291748047, -0.02710723876953125, -0.02588367462158203, -0.024660110473632812, -0.023436546325683594, -0.022212982177734375, -0.020989418029785156, -0.019765853881835938, -0.01854228973388672, -0.0173187255859375, -0.01609516143798828, -0.014871597290039062, -0.013648033142089844, -0.012424468994140625, -0.011200904846191406, -0.009977340698242188, -0.008753776550292969, -0.00753021240234375, -0.006306648254394531, -0.0050830841064453125, -0.0038595199584960938, -0.002635955810546875, -0.0014123916625976562, -0.0001888275146484375, 0.0010347366333007812, 0.00225830078125, 0.0034818649291992188, 0.0047054290771484375, 0.005928993225097656, 0.007152557373046875, 0.008376121520996094, 0.009599685668945312, 0.010823249816894531, 0.01204681396484375, 0.013270378112792969, 0.014493942260742188, 0.015717506408691406, 0.016941070556640625, 0.018164634704589844, 0.019388198852539062, 0.02061176300048828, 0.0218353271484375, 0.02305889129638672, 0.024282455444335938, 0.025506019592285156, 0.026729583740234375, 0.027953147888183594, 0.029176712036132812, 0.03040027618408203, 0.03162384033203125, 0.03284740447998047, 0.03407096862792969, 0.035294532775878906, 0.036518096923828125, 0.037741661071777344, 0.03896522521972656, 0.04018878936767578, 0.041412353515625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 5.0, 11.0, 7.0, 16.0, 17.0, 25.0, 28.0, 28.0, 38.0, 52.0, 70.0, 96.0, 116.0, 195.0, 344.0, 804.0, 10652.0, 1032741.0, 1776.0, 579.0, 290.0, 168.0, 100.0, 89.0, 51.0, 39.0, 40.0, 33.0, 33.0, 32.0, 14.0, 8.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 9.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9453125, -0.917755126953125, -0.89019775390625, -0.862640380859375, -0.8350830078125, -0.807525634765625, -0.77996826171875, -0.752410888671875, -0.724853515625, -0.697296142578125, -0.66973876953125, -0.642181396484375, -0.6146240234375, -0.587066650390625, -0.55950927734375, -0.531951904296875, -0.50439453125, -0.476837158203125, -0.44927978515625, -0.421722412109375, -0.3941650390625, -0.366607666015625, -0.33905029296875, -0.311492919921875, -0.283935546875, -0.256378173828125, -0.22882080078125, -0.201263427734375, -0.1737060546875, -0.146148681640625, -0.11859130859375, -0.091033935546875, -0.0634765625, -0.035919189453125, -0.00836181640625, 0.019195556640625, 0.0467529296875, 0.074310302734375, 0.10186767578125, 0.129425048828125, 0.156982421875, 0.184539794921875, 0.21209716796875, 0.239654541015625, 0.2672119140625, 0.294769287109375, 0.32232666015625, 0.349884033203125, 0.37744140625, 0.404998779296875, 0.43255615234375, 0.460113525390625, 0.4876708984375, 0.515228271484375, 0.54278564453125, 0.570343017578125, 0.597900390625, 0.625457763671875, 0.65301513671875, 0.680572509765625, 0.7081298828125, 0.735687255859375, 0.76324462890625, 0.790802001953125, 0.818359375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 46.0, 883.0, 81.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6308881044387817, -0.6191442608833313, -0.6074004769325256, -0.5956566333770752, -0.5839128494262695, -0.5721690058708191, -0.5604252219200134, -0.548681378364563, -0.5369375944137573, -0.5251937508583069, -0.5134499669075012, -0.5017061233520508, -0.4899623394012451, -0.4782184958457947, -0.4664746820926666, -0.4547308683395386, -0.44298702478408813, -0.4312432110309601, -0.41949939727783203, -0.407755583524704, -0.3960117697715759, -0.3842679262161255, -0.37252411246299744, -0.3607802987098694, -0.34903648495674133, -0.3372926712036133, -0.32554885745048523, -0.3138050436973572, -0.30206120014190674, -0.2903173863887787, -0.27857357263565063, -0.2668297588825226, -0.25508591532707214, -0.2433421015739441, -0.23159828782081604, -0.2198544591665268, -0.20811064541339874, -0.1963668316602707, -0.18462300300598145, -0.1728791892528534, -0.16113537549972534, -0.1493915617465973, -0.13764774799346924, -0.12590391933918, -0.11416010558605194, -0.10241629183292389, -0.09067247062921524, -0.07892864942550659, -0.06718484312295914, -0.05544102564454079, -0.043697208166122437, -0.031953390687704086, -0.020209573209285736, -0.008465755730867386, 0.0032780617475509644, 0.015021882951259613, 0.026765696704387665, 0.038509514182806015, 0.050253331661224365, 0.061997149139642715, 0.07374096661806107, 0.08548478782176971, 0.09722860157489777, 0.10897242277860641, 0.12071623653173447]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 11.0, 11.0, 13.0, 13.0, 18.0, 10.0, 15.0, 19.0, 21.0, 31.0, 34.0, 27.0, 38.0, 41.0, 35.0, 44.0, 44.0, 47.0, 43.0, 48.0, 43.0, 38.0, 46.0, 41.0, 29.0, 25.0, 41.0, 34.0, 22.0, 17.0, 18.0, 18.0, 10.0, 16.0, 14.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.08119797706604004, -0.07895153760910034, -0.07670509070158005, -0.07445864379405975, -0.07221220433712006, -0.06996576488018036, -0.06771931797266006, -0.06547287106513977, -0.06322643160820007, -0.06097998842597008, -0.05873354524374008, -0.056487102061510086, -0.05424065887928009, -0.051994215697050095, -0.0497477725148201, -0.0475013293325901, -0.04525488615036011, -0.04300844296813011, -0.040761999785900116, -0.03851555660367012, -0.036269113421440125, -0.03402267023921013, -0.03177622705698013, -0.029529783874750137, -0.02728334069252014, -0.025036897510290146, -0.02279045432806015, -0.020544011145830154, -0.01829756796360016, -0.016051124781370163, -0.013804681599140167, -0.011558238416910172, -0.009311795234680176, -0.00706535205245018, -0.004818908870220184, -0.0025724656879901886, -0.00032602250576019287, 0.0019204206764698029, 0.004166863858699799, 0.006413307040929794, 0.00865975022315979, 0.010906193405389786, 0.013152636587619781, 0.015399079769849777, 0.017645522952079773, 0.01989196613430977, 0.022138409316539764, 0.02438485249876976, 0.026631295680999756, 0.02887773886322975, 0.031124182045459747, 0.03337062522768974, 0.03561706840991974, 0.037863511592149734, 0.04010995477437973, 0.042356397956609726, 0.04460284113883972, 0.04684928432106972, 0.04909572750329971, 0.05134217068552971, 0.053588613867759705, 0.0558350570499897, 0.058081500232219696, 0.06032794341444969, 0.06257438659667969]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 8.0, 2.0, 1.0, 7.0, 4.0, 3.0, 2.0, 5.0, 7.0, 12.0, 12.0, 11.0, 19.0, 22.0, 22.0, 20.0, 28.0, 28.0, 38.0, 40.0, 28.0, 49.0, 35.0, 36.0, 53.0, 35.0, 36.0, 44.0, 37.0, 36.0, 37.0, 25.0, 31.0, 27.0, 31.0, 36.0, 23.0, 22.0, 19.0, 14.0, 10.0, 18.0, 9.0, 7.0, 2.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-6.6796875, -6.4608154296875, -6.241943359375, -6.0230712890625, -5.80419921875, -5.5853271484375, -5.366455078125, -5.1475830078125, -4.9287109375, -4.7098388671875, -4.490966796875, -4.2720947265625, -4.05322265625, -3.8343505859375, -3.615478515625, -3.3966064453125, -3.177734375, -2.9588623046875, -2.739990234375, -2.5211181640625, -2.30224609375, -2.0833740234375, -1.864501953125, -1.6456298828125, -1.4267578125, -1.2078857421875, -0.989013671875, -0.7701416015625, -0.55126953125, -0.3323974609375, -0.113525390625, 0.1053466796875, 0.32421875, 0.5430908203125, 0.761962890625, 0.9808349609375, 1.19970703125, 1.4185791015625, 1.637451171875, 1.8563232421875, 2.0751953125, 2.2940673828125, 2.512939453125, 2.7318115234375, 2.95068359375, 3.1695556640625, 3.388427734375, 3.6072998046875, 3.826171875, 4.0450439453125, 4.263916015625, 4.4827880859375, 4.70166015625, 4.9205322265625, 5.139404296875, 5.3582763671875, 5.5771484375, 5.7960205078125, 6.014892578125, 6.2337646484375, 6.45263671875, 6.6715087890625, 6.890380859375, 7.1092529296875, 7.328125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 3.0, 6.0, 4.0, 10.0, 8.0, 13.0, 22.0, 18.0, 25.0, 38.0, 35.0, 51.0, 67.0, 107.0, 158.0, 272.0, 509.0, 1069.0, 2431.0, 5549.0, 12999.0, 32835.0, 103697.0, 540521.0, 256866.0, 55439.0, 20354.0, 8431.0, 3569.0, 1645.0, 757.0, 366.0, 213.0, 120.0, 85.0, 63.0, 43.0, 36.0, 30.0, 15.0, 23.0, 15.0, 11.0, 8.0, 4.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.4609375, -13.0369873046875, -12.613037109375, -12.1890869140625, -11.76513671875, -11.3411865234375, -10.917236328125, -10.4932861328125, -10.0693359375, -9.6453857421875, -9.221435546875, -8.7974853515625, -8.37353515625, -7.9495849609375, -7.525634765625, -7.1016845703125, -6.677734375, -6.2537841796875, -5.829833984375, -5.4058837890625, -4.98193359375, -4.5579833984375, -4.134033203125, -3.7100830078125, -3.2861328125, -2.8621826171875, -2.438232421875, -2.0142822265625, -1.59033203125, -1.1663818359375, -0.742431640625, -0.3184814453125, 0.10546875, 0.5294189453125, 0.953369140625, 1.3773193359375, 1.80126953125, 2.2252197265625, 2.649169921875, 3.0731201171875, 3.4970703125, 3.9210205078125, 4.344970703125, 4.7689208984375, 5.19287109375, 5.6168212890625, 6.040771484375, 6.4647216796875, 6.888671875, 7.3126220703125, 7.736572265625, 8.1605224609375, 8.58447265625, 9.0084228515625, 9.432373046875, 9.8563232421875, 10.2802734375, 10.7042236328125, 11.128173828125, 11.5521240234375, 11.97607421875, 12.4000244140625, 12.823974609375, 13.2479248046875, 13.671875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 4.0, 8.0, 8.0, 9.0, 11.0, 11.0, 16.0, 22.0, 25.0, 27.0, 26.0, 46.0, 29.0, 41.0, 39.0, 59.0, 75.0, 128.0, 338.0, 1491.0, 151.0, 91.0, 54.0, 46.0, 40.0, 37.0, 35.0, 34.0, 31.0, 31.0, 11.0, 9.0, 15.0, 13.0, 9.0, 0.0, 12.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.578125, -23.813232421875, -23.04833984375, -22.283447265625, -21.5185546875, -20.753662109375, -19.98876953125, -19.223876953125, -18.458984375, -17.694091796875, -16.92919921875, -16.164306640625, -15.3994140625, -14.634521484375, -13.86962890625, -13.104736328125, -12.33984375, -11.574951171875, -10.81005859375, -10.045166015625, -9.2802734375, -8.515380859375, -7.75048828125, -6.985595703125, -6.220703125, -5.455810546875, -4.69091796875, -3.926025390625, -3.1611328125, -2.396240234375, -1.63134765625, -0.866455078125, -0.1015625, 0.663330078125, 1.42822265625, 2.193115234375, 2.9580078125, 3.722900390625, 4.48779296875, 5.252685546875, 6.017578125, 6.782470703125, 7.54736328125, 8.312255859375, 9.0771484375, 9.842041015625, 10.60693359375, 11.371826171875, 12.13671875, 12.901611328125, 13.66650390625, 14.431396484375, 15.1962890625, 15.961181640625, 16.72607421875, 17.490966796875, 18.255859375, 19.020751953125, 19.78564453125, 20.550537109375, 21.3154296875, 22.080322265625, 22.84521484375, 23.610107421875, 24.375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 12.0, 13.0, 11.0, 12.0, 28.0, 20.0, 29.0, 30.0, 60.0, 76.0, 76.0, 158.0, 217.0, 412.0, 1002.0, 6227.0, 147501.0, 2941680.0, 43296.0, 3114.0, 731.0, 294.0, 177.0, 139.0, 96.0, 60.0, 66.0, 34.0, 24.0, 23.0, 20.0, 16.0, 13.0, 7.0, 3.0, 4.0, 9.0, 1.0, 0.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-51.71875, -50.212890625, -48.70703125, -47.201171875, -45.6953125, -44.189453125, -42.68359375, -41.177734375, -39.671875, -38.166015625, -36.66015625, -35.154296875, -33.6484375, -32.142578125, -30.63671875, -29.130859375, -27.625, -26.119140625, -24.61328125, -23.107421875, -21.6015625, -20.095703125, -18.58984375, -17.083984375, -15.578125, -14.072265625, -12.56640625, -11.060546875, -9.5546875, -8.048828125, -6.54296875, -5.037109375, -3.53125, -2.025390625, -0.51953125, 0.986328125, 2.4921875, 3.998046875, 5.50390625, 7.009765625, 8.515625, 10.021484375, 11.52734375, 13.033203125, 14.5390625, 16.044921875, 17.55078125, 19.056640625, 20.5625, 22.068359375, 23.57421875, 25.080078125, 26.5859375, 28.091796875, 29.59765625, 31.103515625, 32.609375, 34.115234375, 35.62109375, 37.126953125, 38.6328125, 40.138671875, 41.64453125, 43.150390625, 44.65625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 26.0, 338.0, 559.0, 90.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.39581298828125, -274.69708251953125, -268.9983215332031, -263.2995910644531, -257.600830078125, -251.90208435058594, -246.20333862304688, -240.50460815429688, -234.80584716796875, -229.1071014404297, -223.40835571289062, -217.70960998535156, -212.0108642578125, -206.31211853027344, -200.61337280273438, -194.91464233398438, -189.2158966064453, -183.51715087890625, -177.8184051513672, -172.11965942382812, -166.42091369628906, -160.72216796875, -155.0234375, -149.32467651367188, -143.62594604492188, -137.9272003173828, -132.22845458984375, -126.52970886230469, -120.83096313476562, -115.13221740722656, -109.43347930908203, -103.73473358154297, -98.03596496582031, -92.33721923828125, -86.63847351074219, -80.93972778320312, -75.24098205566406, -69.542236328125, -63.84349822998047, -58.144752502441406, -52.446006774902344, -46.74726104736328, -41.04851531982422, -35.34977340698242, -29.65102767944336, -23.952281951904297, -18.2535400390625, -12.554794311523438, -6.856048583984375, -1.157303810119629, 4.541440963745117, 10.240184783935547, 15.93893051147461, 21.637676239013672, 27.33641815185547, 33.03516387939453, 38.733909606933594, 44.432655334472656, 50.13140106201172, 55.830142974853516, 61.52888870239258, 67.22763061523438, 72.92637634277344, 78.6251220703125, 84.32386779785156]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 5.0, 9.0, 10.0, 12.0, 17.0, 21.0, 26.0, 21.0, 21.0, 26.0, 47.0, 34.0, 36.0, 50.0, 48.0, 58.0, 50.0, 40.0, 52.0, 39.0, 31.0, 43.0, 35.0, 50.0, 28.0, 32.0, 23.0, 33.0, 19.0, 13.0, 9.0, 15.0, 7.0, 6.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.03476333618164, -57.985748291015625, -55.936737060546875, -53.887725830078125, -51.83871078491211, -49.789695739746094, -47.740684509277344, -45.691673278808594, -43.64265823364258, -41.59364318847656, -39.54463195800781, -37.49562072753906, -35.44660568237305, -33.39759063720703, -31.34857940673828, -29.2995662689209, -27.250553131103516, -25.201539993286133, -23.15252685546875, -21.103513717651367, -19.054500579833984, -17.0054874420166, -14.956474304199219, -12.907461166381836, -10.858448028564453, -8.80943489074707, -6.7604217529296875, -4.711408615112305, -2.662395477294922, -0.6133823394775391, 1.4356307983398438, 3.4846439361572266, 5.533653259277344, 7.582666397094727, 9.63167953491211, 11.680692672729492, 13.729705810546875, 15.778718948364258, 17.82773208618164, 19.876745223999023, 21.925758361816406, 23.97477149963379, 26.023784637451172, 28.072797775268555, 30.121810913085938, 32.17082214355469, 34.2198371887207, 36.26885223388672, 38.31786346435547, 40.36687469482422, 42.415889739990234, 44.46490478515625, 46.513916015625, 48.56292724609375, 50.611942291259766, 52.66095733642578, 54.70996856689453, 56.75897979736328, 58.8079948425293, 60.85700988769531, 62.90602111816406, 64.95503234863281, 67.00404357910156, 69.05306243896484, 71.1020736694336]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 5.0, 4.0, 3.0, 8.0, 10.0, 13.0, 9.0, 15.0, 14.0, 17.0, 24.0, 27.0, 32.0, 27.0, 32.0, 33.0, 36.0, 39.0, 39.0, 53.0, 50.0, 42.0, 42.0, 34.0, 42.0, 37.0, 34.0, 41.0, 29.0, 22.0, 20.0, 32.0, 20.0, 19.0, 11.0, 25.0, 11.0, 10.0, 11.0, 2.0, 7.0, 4.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.828125, -6.58447265625, -6.3408203125, -6.09716796875, -5.853515625, -5.60986328125, -5.3662109375, -5.12255859375, -4.87890625, -4.63525390625, -4.3916015625, -4.14794921875, -3.904296875, -3.66064453125, -3.4169921875, -3.17333984375, -2.9296875, -2.68603515625, -2.4423828125, -2.19873046875, -1.955078125, -1.71142578125, -1.4677734375, -1.22412109375, -0.98046875, -0.73681640625, -0.4931640625, -0.24951171875, -0.005859375, 0.23779296875, 0.4814453125, 0.72509765625, 0.96875, 1.21240234375, 1.4560546875, 1.69970703125, 1.943359375, 2.18701171875, 2.4306640625, 2.67431640625, 2.91796875, 3.16162109375, 3.4052734375, 3.64892578125, 3.892578125, 4.13623046875, 4.3798828125, 4.62353515625, 4.8671875, 5.11083984375, 5.3544921875, 5.59814453125, 5.841796875, 6.08544921875, 6.3291015625, 6.57275390625, 6.81640625, 7.06005859375, 7.3037109375, 7.54736328125, 7.791015625, 8.03466796875, 8.2783203125, 8.52197265625, 8.765625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 10.0, 11.0, 25.0, 17.0, 18.0, 46.0, 44.0, 55.0, 84.0, 145.0, 242.0, 468.0, 1184.0, 2696.0, 7244.0, 20772.0, 61794.0, 188987.0, 552285.0, 1246266.0, 1259907.0, 562546.0, 193205.0, 62509.0, 21145.0, 7305.0, 2817.0, 1104.0, 562.0, 276.0, 164.0, 107.0, 53.0, 39.0, 29.0, 26.0, 25.0, 11.0, 7.0, 7.0, 9.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.0, -6.7501220703125, -6.500244140625, -6.2503662109375, -6.00048828125, -5.7506103515625, -5.500732421875, -5.2508544921875, -5.0009765625, -4.7510986328125, -4.501220703125, -4.2513427734375, -4.00146484375, -3.7515869140625, -3.501708984375, -3.2518310546875, -3.001953125, -2.7520751953125, -2.502197265625, -2.2523193359375, -2.00244140625, -1.7525634765625, -1.502685546875, -1.2528076171875, -1.0029296875, -0.7530517578125, -0.503173828125, -0.2532958984375, -0.00341796875, 0.2464599609375, 0.496337890625, 0.7462158203125, 0.99609375, 1.2459716796875, 1.495849609375, 1.7457275390625, 1.99560546875, 2.2454833984375, 2.495361328125, 2.7452392578125, 2.9951171875, 3.2449951171875, 3.494873046875, 3.7447509765625, 3.99462890625, 4.2445068359375, 4.494384765625, 4.7442626953125, 4.994140625, 5.2440185546875, 5.493896484375, 5.7437744140625, 5.99365234375, 6.2435302734375, 6.493408203125, 6.7432861328125, 6.9931640625, 7.2430419921875, 7.492919921875, 7.7427978515625, 7.99267578125, 8.2425537109375, 8.492431640625, 8.7423095703125, 8.9921875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 18.0, 26.0, 22.0, 41.0, 47.0, 61.0, 90.0, 144.0, 177.0, 233.0, 333.0, 406.0, 465.0, 470.0, 386.0, 314.0, 211.0, 166.0, 109.0, 77.0, 68.0, 50.0, 30.0, 22.0, 16.0, 19.0, 14.0, 9.0, 8.0, 4.0, 2.0, 4.0, 0.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.3984375, -12.0213623046875, -11.644287109375, -11.2672119140625, -10.89013671875, -10.5130615234375, -10.135986328125, -9.7589111328125, -9.3818359375, -9.0047607421875, -8.627685546875, -8.2506103515625, -7.87353515625, -7.4964599609375, -7.119384765625, -6.7423095703125, -6.365234375, -5.9881591796875, -5.611083984375, -5.2340087890625, -4.85693359375, -4.4798583984375, -4.102783203125, -3.7257080078125, -3.3486328125, -2.9715576171875, -2.594482421875, -2.2174072265625, -1.84033203125, -1.4632568359375, -1.086181640625, -0.7091064453125, -0.33203125, 0.0450439453125, 0.422119140625, 0.7991943359375, 1.17626953125, 1.5533447265625, 1.930419921875, 2.3074951171875, 2.6845703125, 3.0616455078125, 3.438720703125, 3.8157958984375, 4.19287109375, 4.5699462890625, 4.947021484375, 5.3240966796875, 5.701171875, 6.0782470703125, 6.455322265625, 6.8323974609375, 7.20947265625, 7.5865478515625, 7.963623046875, 8.3406982421875, 8.7177734375, 9.0948486328125, 9.471923828125, 9.8489990234375, 10.22607421875, 10.6031494140625, 10.980224609375, 11.3572998046875, 11.734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 16.0, 21.0, 31.0, 27.0, 66.0, 80.0, 142.0, 225.0, 437.0, 828.0, 2558.0, 23293.0, 752883.0, 3269718.0, 133901.0, 7135.0, 1436.0, 582.0, 340.0, 164.0, 112.0, 77.0, 55.0, 29.0, 28.0, 23.0, 10.0, 10.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.46875, -32.3984375, -31.328125, -30.2578125, -29.1875, -28.1171875, -27.046875, -25.9765625, -24.90625, -23.8359375, -22.765625, -21.6953125, -20.625, -19.5546875, -18.484375, -17.4140625, -16.34375, -15.2734375, -14.203125, -13.1328125, -12.0625, -10.9921875, -9.921875, -8.8515625, -7.78125, -6.7109375, -5.640625, -4.5703125, -3.5, -2.4296875, -1.359375, -0.2890625, 0.78125, 1.8515625, 2.921875, 3.9921875, 5.0625, 6.1328125, 7.203125, 8.2734375, 9.34375, 10.4140625, 11.484375, 12.5546875, 13.625, 14.6953125, 15.765625, 16.8359375, 17.90625, 18.9765625, 20.046875, 21.1171875, 22.1875, 23.2578125, 24.328125, 25.3984375, 26.46875, 27.5390625, 28.609375, 29.6796875, 30.75, 31.8203125, 32.890625, 33.9609375, 35.03125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 497.0, 468.0, 27.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-585.32373046875, -573.8355712890625, -562.3473510742188, -550.8591918945312, -539.3710327148438, -527.8828125, -516.3946533203125, -504.906494140625, -493.4183044433594, -481.93011474609375, -470.44195556640625, -458.9537658691406, -447.4656066894531, -435.9774169921875, -424.4892578125, -413.0010681152344, -401.51287841796875, -390.0246887207031, -378.5365295410156, -367.04833984375, -355.5601806640625, -344.0719909667969, -332.58380126953125, -321.09564208984375, -309.60748291015625, -298.1192932128906, -286.6311340332031, -275.1429443359375, -263.65478515625, -252.16659545898438, -240.6784210205078, -229.19024658203125, -217.70205688476562, -206.21388244628906, -194.7257080078125, -183.23751831054688, -171.7493438720703, -160.26116943359375, -148.7729949951172, -137.28482055664062, -125.79663848876953, -114.30846405029297, -102.82028198242188, -91.33210754394531, -79.84393310546875, -68.35575103759766, -56.867576599121094, -45.37939453125, -33.89122009277344, -22.40304183959961, -10.914865493774414, 0.5733108520507812, 12.06148910522461, 23.549667358398438, 35.037841796875, 46.526023864746094, 58.014198303222656, 69.50237274169922, 80.99055480957031, 92.47872924804688, 103.96690368652344, 115.45508575439453, 126.9432601928711, 138.4314422607422, 149.91961669921875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 4.0, 12.0, 7.0, 10.0, 12.0, 18.0, 20.0, 20.0, 33.0, 26.0, 25.0, 37.0, 30.0, 30.0, 47.0, 44.0, 41.0, 49.0, 41.0, 54.0, 38.0, 46.0, 40.0, 38.0, 44.0, 27.0, 26.0, 27.0, 27.0, 19.0, 16.0, 20.0, 12.0, 17.0, 4.0, 7.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.561790466308594, -43.118804931640625, -41.67581558227539, -40.23283004760742, -38.78984069824219, -37.34685516357422, -35.90386962890625, -34.460880279541016, -33.01789474487305, -31.574907302856445, -30.131919860839844, -28.688934326171875, -27.245946884155273, -25.802959442138672, -24.35997200012207, -22.91698455810547, -21.473997116088867, -20.031009674072266, -18.588022232055664, -17.145034790039062, -15.702049255371094, -14.259061813354492, -12.81607437133789, -11.373087882995605, -9.930100440979004, -8.487112998962402, -7.044126510620117, -5.601139068603516, -4.158152103424072, -2.715165138244629, -1.2721776962280273, 0.1708087921142578, 1.6137962341308594, 3.0567831993103027, 4.499770164489746, 5.942757606506348, 7.385744571685791, 8.828731536865234, 10.271718978881836, 11.714705467224121, 13.157692909240723, 14.600680351257324, 16.04366683959961, 17.48665428161621, 18.929641723632812, 20.37262725830078, 21.815616607666016, 23.258602142333984, 24.701589584350586, 26.144577026367188, 27.58756446838379, 29.03055191040039, 30.47353744506836, 31.91652488708496, 33.35951232910156, 34.80249786376953, 36.245487213134766, 37.688472747802734, 39.13146209716797, 40.57444763183594, 42.01743698120117, 43.46042251586914, 44.903411865234375, 46.346397399902344, 47.78938293457031]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 10.0, 8.0, 17.0, 12.0, 15.0, 24.0, 24.0, 38.0, 30.0, 39.0, 43.0, 40.0, 42.0, 45.0, 36.0, 44.0, 43.0, 54.0, 56.0, 38.0, 37.0, 33.0, 41.0, 42.0, 30.0, 24.0, 21.0, 13.0, 14.0, 17.0, 14.0, 9.0, 8.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.8861083984375, -7.631591796875, -7.3770751953125, -7.12255859375, -6.8680419921875, -6.613525390625, -6.3590087890625, -6.1044921875, -5.8499755859375, -5.595458984375, -5.3409423828125, -5.08642578125, -4.8319091796875, -4.577392578125, -4.3228759765625, -4.068359375, -3.8138427734375, -3.559326171875, -3.3048095703125, -3.05029296875, -2.7957763671875, -2.541259765625, -2.2867431640625, -2.0322265625, -1.7777099609375, -1.523193359375, -1.2686767578125, -1.01416015625, -0.7596435546875, -0.505126953125, -0.2506103515625, 0.00390625, 0.2584228515625, 0.512939453125, 0.7674560546875, 1.02197265625, 1.2764892578125, 1.531005859375, 1.7855224609375, 2.0400390625, 2.2945556640625, 2.549072265625, 2.8035888671875, 3.05810546875, 3.3126220703125, 3.567138671875, 3.8216552734375, 4.076171875, 4.3306884765625, 4.585205078125, 4.8397216796875, 5.09423828125, 5.3487548828125, 5.603271484375, 5.8577880859375, 6.1123046875, 6.3668212890625, 6.621337890625, 6.8758544921875, 7.13037109375, 7.3848876953125, 7.639404296875, 7.8939208984375, 8.1484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 15.0, 22.0, 40.0, 61.0, 73.0, 151.0, 210.0, 348.0, 615.0, 959.0, 1579.0, 2683.0, 4315.0, 7205.0, 11915.0, 19435.0, 31246.0, 49006.0, 73214.0, 101763.0, 130415.0, 145766.0, 136054.0, 108756.0, 78741.0, 53615.0, 34374.0, 21957.0, 13226.0, 8195.0, 4956.0, 3036.0, 1822.0, 1092.0, 664.0, 396.0, 220.0, 153.0, 95.0, 59.0, 46.0, 31.0, 6.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9045333862304688, -0.8749847412109375, -0.8454360961914062, -0.815887451171875, -0.7863388061523438, -0.7567901611328125, -0.7272415161132812, -0.69769287109375, -0.6681442260742188, -0.6385955810546875, -0.6090469360351562, -0.579498291015625, -0.5499496459960938, -0.5204010009765625, -0.49085235595703125, -0.4613037109375, -0.43175506591796875, -0.4022064208984375, -0.37265777587890625, -0.343109130859375, -0.31356048583984375, -0.2840118408203125, -0.25446319580078125, -0.22491455078125, -0.19536590576171875, -0.1658172607421875, -0.13626861572265625, -0.106719970703125, -0.07717132568359375, -0.0476226806640625, -0.01807403564453125, 0.011474609375, 0.04102325439453125, 0.0705718994140625, 0.10012054443359375, 0.129669189453125, 0.15921783447265625, 0.1887664794921875, 0.21831512451171875, 0.24786376953125, 0.27741241455078125, 0.3069610595703125, 0.33650970458984375, 0.366058349609375, 0.39560699462890625, 0.4251556396484375, 0.45470428466796875, 0.4842529296875, 0.5138015747070312, 0.5433502197265625, 0.5728988647460938, 0.602447509765625, 0.6319961547851562, 0.6615447998046875, 0.6910934448242188, 0.72064208984375, 0.7501907348632812, 0.7797393798828125, 0.8092880249023438, 0.838836669921875, 0.8683853149414062, 0.8979339599609375, 0.9274826049804688, 0.95703125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 9.0, 6.0, 6.0, 13.0, 14.0, 8.0, 15.0, 21.0, 20.0, 28.0, 28.0, 39.0, 41.0, 28.0, 37.0, 37.0, 36.0, 46.0, 45.0, 1079.0, 49.0, 39.0, 33.0, 39.0, 39.0, 33.0, 29.0, 23.0, 29.0, 20.0, 19.0, 23.0, 23.0, 15.0, 16.0, 12.0, 7.0, 3.0, 8.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.42364501953125, -5.2379150390625, -5.05218505859375, -4.866455078125, -4.68072509765625, -4.4949951171875, -4.30926513671875, -4.12353515625, -3.93780517578125, -3.7520751953125, -3.56634521484375, -3.380615234375, -3.19488525390625, -3.0091552734375, -2.82342529296875, -2.6376953125, -2.45196533203125, -2.2662353515625, -2.08050537109375, -1.894775390625, -1.70904541015625, -1.5233154296875, -1.33758544921875, -1.15185546875, -0.96612548828125, -0.7803955078125, -0.59466552734375, -0.408935546875, -0.22320556640625, -0.0374755859375, 0.14825439453125, 0.333984375, 0.51971435546875, 0.7054443359375, 0.89117431640625, 1.076904296875, 1.26263427734375, 1.4483642578125, 1.63409423828125, 1.81982421875, 2.00555419921875, 2.1912841796875, 2.37701416015625, 2.562744140625, 2.74847412109375, 2.9342041015625, 3.11993408203125, 3.3056640625, 3.49139404296875, 3.6771240234375, 3.86285400390625, 4.048583984375, 4.23431396484375, 4.4200439453125, 4.60577392578125, 4.79150390625, 4.97723388671875, 5.1629638671875, 5.34869384765625, 5.534423828125, 5.72015380859375, 5.9058837890625, 6.09161376953125, 6.27734375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 2.0, 10.0, 6.0, 13.0, 15.0, 21.0, 31.0, 41.0, 46.0, 78.0, 132.0, 186.0, 300.0, 451.0, 665.0, 1134.0, 1758.0, 2742.0, 4511.0, 7335.0, 12258.0, 20227.0, 33383.0, 1746373.0, 183727.0, 31841.0, 19390.0, 11778.0, 7037.0, 4250.0, 2670.0, 1687.0, 1029.0, 686.0, 449.0, 262.0, 170.0, 137.0, 86.0, 60.0, 39.0, 38.0, 20.0, 12.0, 8.0, 12.0, 8.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-2.03125, -1.967681884765625, -1.90411376953125, -1.840545654296875, -1.7769775390625, -1.713409423828125, -1.64984130859375, -1.586273193359375, -1.522705078125, -1.459136962890625, -1.39556884765625, -1.332000732421875, -1.2684326171875, -1.204864501953125, -1.14129638671875, -1.077728271484375, -1.01416015625, -0.950592041015625, -0.88702392578125, -0.823455810546875, -0.7598876953125, -0.696319580078125, -0.63275146484375, -0.569183349609375, -0.505615234375, -0.442047119140625, -0.37847900390625, -0.314910888671875, -0.2513427734375, -0.187774658203125, -0.12420654296875, -0.060638427734375, 0.0029296875, 0.066497802734375, 0.13006591796875, 0.193634033203125, 0.2572021484375, 0.320770263671875, 0.38433837890625, 0.447906494140625, 0.511474609375, 0.575042724609375, 0.63861083984375, 0.702178955078125, 0.7657470703125, 0.829315185546875, 0.89288330078125, 0.956451416015625, 1.02001953125, 1.083587646484375, 1.14715576171875, 1.210723876953125, 1.2742919921875, 1.337860107421875, 1.40142822265625, 1.464996337890625, 1.528564453125, 1.592132568359375, 1.65570068359375, 1.719268798828125, 1.7828369140625, 1.846405029296875, 1.90997314453125, 1.973541259765625, 2.037109375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 4.0, 13.0, 12.0, 11.0, 22.0, 23.0, 31.0, 22.0, 32.0, 42.0, 45.0, 34.0, 52.0, 57.0, 58.0, 70.0, 62.0, 52.0, 46.0, 42.0, 40.0, 38.0, 30.0, 21.0, 14.0, 23.0, 13.0, 11.0, 16.0, 6.0, 8.0, 6.0, 0.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299072265625, -0.028872013092041016, -0.02783679962158203, -0.026801586151123047, -0.025766372680664062, -0.024731159210205078, -0.023695945739746094, -0.02266073226928711, -0.021625518798828125, -0.02059030532836914, -0.019555091857910156, -0.018519878387451172, -0.017484664916992188, -0.016449451446533203, -0.015414237976074219, -0.014379024505615234, -0.01334381103515625, -0.012308597564697266, -0.011273384094238281, -0.010238170623779297, -0.009202957153320312, -0.008167743682861328, -0.007132530212402344, -0.006097316741943359, -0.005062103271484375, -0.004026889801025391, -0.0029916763305664062, -0.001956462860107422, -0.0009212493896484375, 0.00011396408081054688, 0.0011491775512695312, 0.0021843910217285156, 0.0032196044921875, 0.004254817962646484, 0.005290031433105469, 0.006325244903564453, 0.0073604583740234375, 0.008395671844482422, 0.009430885314941406, 0.01046609878540039, 0.011501312255859375, 0.01253652572631836, 0.013571739196777344, 0.014606952667236328, 0.015642166137695312, 0.016677379608154297, 0.01771259307861328, 0.018747806549072266, 0.01978302001953125, 0.020818233489990234, 0.02185344696044922, 0.022888660430908203, 0.023923873901367188, 0.024959087371826172, 0.025994300842285156, 0.02702951431274414, 0.028064727783203125, 0.02909994125366211, 0.030135154724121094, 0.031170368194580078, 0.03220558166503906, 0.03324079513549805, 0.03427600860595703, 0.035311222076416016, 0.036346435546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 5.0, 13.0, 26.0, 14.0, 17.0, 26.0, 34.0, 46.0, 55.0, 89.0, 104.0, 181.0, 269.0, 567.0, 2042.0, 1039162.0, 4290.0, 657.0, 297.0, 157.0, 126.0, 88.0, 54.0, 42.0, 38.0, 34.0, 20.0, 14.0, 14.0, 11.0, 11.0, 5.0, 7.0, 1.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.81689453125, -0.7939376831054688, -0.7709808349609375, -0.7480239868164062, -0.725067138671875, -0.7021102905273438, -0.6791534423828125, -0.6561965942382812, -0.63323974609375, -0.6102828979492188, -0.5873260498046875, -0.5643692016601562, -0.541412353515625, -0.5184555053710938, -0.4954986572265625, -0.47254180908203125, -0.4495849609375, -0.42662811279296875, -0.4036712646484375, -0.38071441650390625, -0.357757568359375, -0.33480072021484375, -0.3118438720703125, -0.28888702392578125, -0.26593017578125, -0.24297332763671875, -0.2200164794921875, -0.19705963134765625, -0.174102783203125, -0.15114593505859375, -0.1281890869140625, -0.10523223876953125, -0.082275390625, -0.05931854248046875, -0.0363616943359375, -0.01340484619140625, 0.009552001953125, 0.03250885009765625, 0.0554656982421875, 0.07842254638671875, 0.10137939453125, 0.12433624267578125, 0.1472930908203125, 0.17024993896484375, 0.193206787109375, 0.21616363525390625, 0.2391204833984375, 0.26207733154296875, 0.2850341796875, 0.30799102783203125, 0.3309478759765625, 0.35390472412109375, 0.376861572265625, 0.39981842041015625, 0.4227752685546875, 0.44573211669921875, 0.46868896484375, 0.49164581298828125, 0.5146026611328125, 0.5375595092773438, 0.560516357421875, 0.5834732055664062, 0.6064300537109375, 0.6293869018554688, 0.65234375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 18.0, 372.0, 616.0, 9.0], "bins": [-0.5646805763244629, -0.5555887222290039, -0.5464969277381897, -0.5374050736427307, -0.5283132195472717, -0.5192213654518127, -0.5101295709609985, -0.5010377168655396, -0.49194586277008057, -0.48285403847694397, -0.473762184381485, -0.4646703600883484, -0.4555785059928894, -0.4464866816997528, -0.4373948276042938, -0.4283030033111572, -0.41921117901802063, -0.41011935472488403, -0.40102750062942505, -0.39193567633628845, -0.38284382224082947, -0.37375199794769287, -0.3646601438522339, -0.3555683195590973, -0.3464764952659607, -0.3373846709728241, -0.3282928168773651, -0.3192009925842285, -0.31010913848876953, -0.30101731419563293, -0.29192546010017395, -0.28283363580703735, -0.27374178171157837, -0.2646499574184418, -0.2555581033229828, -0.246466264128685, -0.2373744249343872, -0.2282826006412506, -0.21919076144695282, -0.21009892225265503, -0.20100709795951843, -0.19191525876522064, -0.18282341957092285, -0.17373158037662506, -0.16463974118232727, -0.15554791688919067, -0.14645607769489288, -0.1373642385005951, -0.1282723844051361, -0.11918054521083832, -0.11008870601654053, -0.10099687427282333, -0.09190503507852554, -0.08281319588422775, -0.07372136414051056, -0.06462952494621277, -0.055537693202495575, -0.046445854008197784, -0.03735401853919029, -0.02826218120753765, -0.01917034387588501, -0.01007850468158722, -0.0009866692125797272, 0.008105166256427765, 0.017197005450725555]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 6.0, 5.0, 6.0, 10.0, 12.0, 14.0, 14.0, 7.0, 21.0, 18.0, 22.0, 32.0, 29.0, 32.0, 38.0, 37.0, 37.0, 38.0, 37.0, 39.0, 46.0, 31.0, 33.0, 31.0, 44.0, 40.0, 37.0, 35.0, 34.0, 28.0, 32.0, 23.0, 19.0, 17.0, 17.0, 12.0, 15.0, 10.0, 9.0, 8.0, 4.0, 2.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.05367851257324219, -0.0520218089222908, -0.050365108996629715, -0.04870840907096863, -0.04705170542001724, -0.04539500176906586, -0.04373830184340477, -0.04208160191774368, -0.0404248982667923, -0.03876819461584091, -0.037111494690179825, -0.03545479476451874, -0.03379809111356735, -0.03214138746261597, -0.03048468753695488, -0.028827985748648643, -0.027171283960342407, -0.02551458217203617, -0.023857880383729935, -0.0222011785954237, -0.020544476807117462, -0.018887775018811226, -0.01723107323050499, -0.015574371442198753, -0.013917669653892517, -0.01226096786558628, -0.010604266077280045, -0.008947564288973808, -0.007290862500667572, -0.005634160712361336, -0.0039774589240550995, -0.0023207571357488632, -0.000664055347442627, 0.0009926464408636093, 0.0026493482291698456, 0.004306050017476082, 0.005962751805782318, 0.007619453594088554, 0.00927615538239479, 0.010932857170701027, 0.012589558959007263, 0.0142462607473135, 0.015902962535619736, 0.017559664323925972, 0.019216366112232208, 0.020873067900538445, 0.02252976968884468, 0.024186471477150917, 0.025843173265457153, 0.02749987505376339, 0.029156576842069626, 0.030813278630375862, 0.0324699804186821, 0.034126684069633484, 0.03578338399529457, 0.03744008392095566, 0.03909678757190704, 0.04075349122285843, 0.042410191148519516, 0.0440668910741806, 0.04572359472513199, 0.047380298376083374, 0.04903699830174446, 0.05069369822740555, 0.052350401878356934]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 10.0, 9.0, 6.0, 5.0, 4.0, 9.0, 18.0, 19.0, 20.0, 19.0, 22.0, 32.0, 18.0, 31.0, 31.0, 45.0, 40.0, 48.0, 52.0, 42.0, 47.0, 46.0, 50.0, 42.0, 33.0, 41.0, 36.0, 42.0, 26.0, 27.0, 27.0, 20.0, 18.0, 15.0, 12.0, 7.0, 14.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4375, -7.189208984375, -6.94091796875, -6.692626953125, -6.4443359375, -6.196044921875, -5.94775390625, -5.699462890625, -5.451171875, -5.202880859375, -4.95458984375, -4.706298828125, -4.4580078125, -4.209716796875, -3.96142578125, -3.713134765625, -3.46484375, -3.216552734375, -2.96826171875, -2.719970703125, -2.4716796875, -2.223388671875, -1.97509765625, -1.726806640625, -1.478515625, -1.230224609375, -0.98193359375, -0.733642578125, -0.4853515625, -0.237060546875, 0.01123046875, 0.259521484375, 0.5078125, 0.756103515625, 1.00439453125, 1.252685546875, 1.5009765625, 1.749267578125, 1.99755859375, 2.245849609375, 2.494140625, 2.742431640625, 2.99072265625, 3.239013671875, 3.4873046875, 3.735595703125, 3.98388671875, 4.232177734375, 4.48046875, 4.728759765625, 4.97705078125, 5.225341796875, 5.4736328125, 5.721923828125, 5.97021484375, 6.218505859375, 6.466796875, 6.715087890625, 6.96337890625, 7.211669921875, 7.4599609375, 7.708251953125, 7.95654296875, 8.204833984375, 8.453125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 9.0, 6.0, 6.0, 17.0, 20.0, 32.0, 41.0, 71.0, 114.0, 149.0, 284.0, 446.0, 702.0, 1189.0, 2026.0, 3602.0, 6115.0, 10840.0, 18933.0, 32548.0, 57233.0, 104480.0, 214583.0, 275103.0, 145178.0, 75006.0, 42481.0, 24200.0, 13808.0, 8108.0, 4694.0, 2634.0, 1484.0, 913.0, 530.0, 335.0, 235.0, 171.0, 84.0, 56.0, 38.0, 26.0, 11.0, 3.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.88671875, -7.63421630859375, -7.3817138671875, -7.12921142578125, -6.876708984375, -6.62420654296875, -6.3717041015625, -6.11920166015625, -5.86669921875, -5.61419677734375, -5.3616943359375, -5.10919189453125, -4.856689453125, -4.60418701171875, -4.3516845703125, -4.09918212890625, -3.8466796875, -3.59417724609375, -3.3416748046875, -3.08917236328125, -2.836669921875, -2.58416748046875, -2.3316650390625, -2.07916259765625, -1.82666015625, -1.57415771484375, -1.3216552734375, -1.06915283203125, -0.816650390625, -0.56414794921875, -0.3116455078125, -0.05914306640625, 0.193359375, 0.44586181640625, 0.6983642578125, 0.95086669921875, 1.203369140625, 1.45587158203125, 1.7083740234375, 1.96087646484375, 2.21337890625, 2.46588134765625, 2.7183837890625, 2.97088623046875, 3.223388671875, 3.47589111328125, 3.7283935546875, 3.98089599609375, 4.2333984375, 4.48590087890625, 4.7384033203125, 4.99090576171875, 5.243408203125, 5.49591064453125, 5.7484130859375, 6.00091552734375, 6.25341796875, 6.50592041015625, 6.7584228515625, 7.01092529296875, 7.263427734375, 7.51593017578125, 7.7684326171875, 8.02093505859375, 8.2734375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 13.0, 15.0, 14.0, 21.0, 20.0, 22.0, 20.0, 33.0, 24.0, 38.0, 44.0, 37.0, 55.0, 70.0, 106.0, 151.0, 276.0, 1313.0, 180.0, 107.0, 78.0, 63.0, 41.0, 38.0, 25.0, 31.0, 26.0, 21.0, 17.0, 19.0, 16.0, 15.0, 14.0, 13.0, 6.0, 10.0, 7.0, 7.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-20.109375, -19.5009765625, -18.892578125, -18.2841796875, -17.67578125, -17.0673828125, -16.458984375, -15.8505859375, -15.2421875, -14.6337890625, -14.025390625, -13.4169921875, -12.80859375, -12.2001953125, -11.591796875, -10.9833984375, -10.375, -9.7666015625, -9.158203125, -8.5498046875, -7.94140625, -7.3330078125, -6.724609375, -6.1162109375, -5.5078125, -4.8994140625, -4.291015625, -3.6826171875, -3.07421875, -2.4658203125, -1.857421875, -1.2490234375, -0.640625, -0.0322265625, 0.576171875, 1.1845703125, 1.79296875, 2.4013671875, 3.009765625, 3.6181640625, 4.2265625, 4.8349609375, 5.443359375, 6.0517578125, 6.66015625, 7.2685546875, 7.876953125, 8.4853515625, 9.09375, 9.7021484375, 10.310546875, 10.9189453125, 11.52734375, 12.1357421875, 12.744140625, 13.3525390625, 13.9609375, 14.5693359375, 15.177734375, 15.7861328125, 16.39453125, 17.0029296875, 17.611328125, 18.2197265625, 18.828125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 10.0, 7.0, 19.0, 15.0, 30.0, 30.0, 80.0, 107.0, 178.0, 295.0, 581.0, 1792.0, 14470.0, 297331.0, 2726048.0, 95615.0, 6761.0, 1178.0, 471.0, 258.0, 140.0, 89.0, 55.0, 36.0, 20.0, 15.0, 17.0, 10.0, 10.0, 3.0, 6.0, 7.0, 6.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.9375, -37.7333984375, -36.529296875, -35.3251953125, -34.12109375, -32.9169921875, -31.712890625, -30.5087890625, -29.3046875, -28.1005859375, -26.896484375, -25.6923828125, -24.48828125, -23.2841796875, -22.080078125, -20.8759765625, -19.671875, -18.4677734375, -17.263671875, -16.0595703125, -14.85546875, -13.6513671875, -12.447265625, -11.2431640625, -10.0390625, -8.8349609375, -7.630859375, -6.4267578125, -5.22265625, -4.0185546875, -2.814453125, -1.6103515625, -0.40625, 0.7978515625, 2.001953125, 3.2060546875, 4.41015625, 5.6142578125, 6.818359375, 8.0224609375, 9.2265625, 10.4306640625, 11.634765625, 12.8388671875, 14.04296875, 15.2470703125, 16.451171875, 17.6552734375, 18.859375, 20.0634765625, 21.267578125, 22.4716796875, 23.67578125, 24.8798828125, 26.083984375, 27.2880859375, 28.4921875, 29.6962890625, 30.900390625, 32.1044921875, 33.30859375, 34.5126953125, 35.716796875, 36.9208984375, 38.125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 61.0, 466.0, 446.0, 42.0, 0.0, 0.0, 1.0], "bins": [-459.2400207519531, -451.45587158203125, -443.6717529296875, -435.8876037597656, -428.10345458984375, -420.3193359375, -412.5351867675781, -404.75103759765625, -396.9669189453125, -389.1827697753906, -381.3986511230469, -373.614501953125, -365.8303527832031, -358.0462341308594, -350.2620849609375, -342.4779357910156, -334.69378662109375, -326.9096374511719, -319.1255187988281, -311.34136962890625, -303.5572204589844, -295.7731018066406, -287.98895263671875, -280.2048034667969, -272.4206848144531, -264.63653564453125, -256.8524169921875, -249.06826782226562, -241.2841339111328, -233.5, -225.71585083007812, -217.9317169189453, -210.1475830078125, -202.3634490966797, -194.5792999267578, -186.795166015625, -179.0110321044922, -171.22689819335938, -163.4427490234375, -155.6586151123047, -147.87448120117188, -140.09034729003906, -132.3061981201172, -124.52206420898438, -116.73793029785156, -108.95378875732422, -101.16964721679688, -93.38551330566406, -85.60137176513672, -77.81723022460938, -70.03309631347656, -62.24895477294922, -54.46481704711914, -46.68067932128906, -38.89653778076172, -31.11240005493164, -23.328262329101562, -15.544123649597168, -7.759984970092773, 0.0241546630859375, 7.808292388916016, 15.592430114746094, 23.376571655273438, 31.160709381103516, 38.944847106933594]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 10.0, 7.0, 8.0, 12.0, 11.0, 14.0, 19.0, 16.0, 17.0, 16.0, 13.0, 20.0, 24.0, 31.0, 28.0, 27.0, 31.0, 35.0, 49.0, 40.0, 46.0, 34.0, 27.0, 44.0, 32.0, 44.0, 34.0, 35.0, 28.0, 34.0, 29.0, 24.0, 22.0, 23.0, 9.0, 16.0, 15.0, 12.0, 15.0, 8.0, 7.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-44.36927032470703, -42.93077850341797, -41.492286682128906, -40.053794860839844, -38.61530685424805, -37.176815032958984, -35.73832321166992, -34.29983139038086, -32.8613395690918, -31.422847747802734, -29.984357833862305, -28.545866012573242, -27.10737419128418, -25.66888427734375, -24.230392456054688, -22.791900634765625, -21.353410720825195, -19.914918899536133, -18.476428985595703, -17.03793716430664, -15.599445343017578, -14.160954475402832, -12.722463607788086, -11.283971786499023, -9.845480918884277, -8.406990051269531, -6.968498229980469, -5.530007362365723, -4.091516017913818, -2.653024673461914, -1.214533805847168, 0.22395801544189453, 1.6624488830566406, 3.100940227508545, 4.539431571960449, 5.977922439575195, 7.4164137840271, 8.854905128479004, 10.29339599609375, 11.731887817382812, 13.170378684997559, 14.608869552612305, 16.047361373901367, 17.485851287841797, 18.92434310913086, 20.362834930419922, 21.801326751708984, 23.239818572998047, 24.678308486938477, 26.11680030822754, 27.55529022216797, 28.99378204345703, 30.432273864746094, 31.870765686035156, 33.30925750732422, 34.74774932861328, 36.18623733520508, 37.62472915649414, 39.0632209777832, 40.501708984375, 41.94020080566406, 43.378692626953125, 44.81718444824219, 46.25567626953125, 47.69416809082031]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 18.0, 11.0, 19.0, 19.0, 20.0, 19.0, 26.0, 25.0, 31.0, 23.0, 35.0, 40.0, 39.0, 53.0, 37.0, 52.0, 43.0, 47.0, 41.0, 34.0, 52.0, 28.0, 20.0, 34.0, 25.0, 29.0, 24.0, 27.0, 20.0, 19.0, 13.0, 9.0, 5.0, 5.0, 10.0, 4.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7421875, -7.50048828125, -7.2587890625, -7.01708984375, -6.775390625, -6.53369140625, -6.2919921875, -6.05029296875, -5.80859375, -5.56689453125, -5.3251953125, -5.08349609375, -4.841796875, -4.60009765625, -4.3583984375, -4.11669921875, -3.875, -3.63330078125, -3.3916015625, -3.14990234375, -2.908203125, -2.66650390625, -2.4248046875, -2.18310546875, -1.94140625, -1.69970703125, -1.4580078125, -1.21630859375, -0.974609375, -0.73291015625, -0.4912109375, -0.24951171875, -0.0078125, 0.23388671875, 0.4755859375, 0.71728515625, 0.958984375, 1.20068359375, 1.4423828125, 1.68408203125, 1.92578125, 2.16748046875, 2.4091796875, 2.65087890625, 2.892578125, 3.13427734375, 3.3759765625, 3.61767578125, 3.859375, 4.10107421875, 4.3427734375, 4.58447265625, 4.826171875, 5.06787109375, 5.3095703125, 5.55126953125, 5.79296875, 6.03466796875, 6.2763671875, 6.51806640625, 6.759765625, 7.00146484375, 7.2431640625, 7.48486328125, 7.7265625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 9.0, 2.0, 10.0, 13.0, 17.0, 19.0, 27.0, 44.0, 67.0, 130.0, 204.0, 388.0, 878.0, 1716.0, 3867.0, 9439.0, 23817.0, 62645.0, 171072.0, 466198.0, 1095145.0, 1315898.0, 649551.0, 246672.0, 89836.0, 33451.0, 13267.0, 5303.0, 2283.0, 1096.0, 532.0, 271.0, 147.0, 79.0, 65.0, 37.0, 27.0, 22.0, 9.0, 5.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.9266357421875, -6.689208984375, -6.4517822265625, -6.21435546875, -5.9769287109375, -5.739501953125, -5.5020751953125, -5.2646484375, -5.0272216796875, -4.789794921875, -4.5523681640625, -4.31494140625, -4.0775146484375, -3.840087890625, -3.6026611328125, -3.365234375, -3.1278076171875, -2.890380859375, -2.6529541015625, -2.41552734375, -2.1781005859375, -1.940673828125, -1.7032470703125, -1.4658203125, -1.2283935546875, -0.990966796875, -0.7535400390625, -0.51611328125, -0.2786865234375, -0.041259765625, 0.1961669921875, 0.43359375, 0.6710205078125, 0.908447265625, 1.1458740234375, 1.38330078125, 1.6207275390625, 1.858154296875, 2.0955810546875, 2.3330078125, 2.5704345703125, 2.807861328125, 3.0452880859375, 3.28271484375, 3.5201416015625, 3.757568359375, 3.9949951171875, 4.232421875, 4.4698486328125, 4.707275390625, 4.9447021484375, 5.18212890625, 5.4195556640625, 5.656982421875, 5.8944091796875, 6.1318359375, 6.3692626953125, 6.606689453125, 6.8441162109375, 7.08154296875, 7.3189697265625, 7.556396484375, 7.7938232421875, 8.03125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 11.0, 19.0, 26.0, 32.0, 43.0, 63.0, 84.0, 103.0, 143.0, 238.0, 326.0, 347.0, 438.0, 439.0, 383.0, 323.0, 275.0, 186.0, 159.0, 110.0, 67.0, 56.0, 39.0, 34.0, 26.0, 16.0, 15.0, 5.0, 14.0, 9.0, 9.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0501708984375, -8.717529296875, -8.3848876953125, -8.05224609375, -7.7196044921875, -7.386962890625, -7.0543212890625, -6.7216796875, -6.3890380859375, -6.056396484375, -5.7237548828125, -5.39111328125, -5.0584716796875, -4.725830078125, -4.3931884765625, -4.060546875, -3.7279052734375, -3.395263671875, -3.0626220703125, -2.72998046875, -2.3973388671875, -2.064697265625, -1.7320556640625, -1.3994140625, -1.0667724609375, -0.734130859375, -0.4014892578125, -0.06884765625, 0.2637939453125, 0.596435546875, 0.9290771484375, 1.26171875, 1.5943603515625, 1.927001953125, 2.2596435546875, 2.59228515625, 2.9249267578125, 3.257568359375, 3.5902099609375, 3.9228515625, 4.2554931640625, 4.588134765625, 4.9207763671875, 5.25341796875, 5.5860595703125, 5.918701171875, 6.2513427734375, 6.583984375, 6.9166259765625, 7.249267578125, 7.5819091796875, 7.91455078125, 8.2471923828125, 8.579833984375, 8.9124755859375, 9.2451171875, 9.5777587890625, 9.910400390625, 10.2430419921875, 10.57568359375, 10.9083251953125, 11.240966796875, 11.5736083984375, 11.90625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 7.0, 17.0, 11.0, 19.0, 24.0, 33.0, 46.0, 52.0, 70.0, 117.0, 223.0, 340.0, 736.0, 1719.0, 4794.0, 16667.0, 71808.0, 380737.0, 2011165.0, 1397424.0, 241009.0, 48600.0, 12142.0, 3735.0, 1391.0, 584.0, 289.0, 176.0, 106.0, 76.0, 43.0, 30.0, 22.0, 20.0, 15.0, 9.0, 8.0, 2.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.9921875, -15.505615234375, -15.01904296875, -14.532470703125, -14.0458984375, -13.559326171875, -13.07275390625, -12.586181640625, -12.099609375, -11.613037109375, -11.12646484375, -10.639892578125, -10.1533203125, -9.666748046875, -9.18017578125, -8.693603515625, -8.20703125, -7.720458984375, -7.23388671875, -6.747314453125, -6.2607421875, -5.774169921875, -5.28759765625, -4.801025390625, -4.314453125, -3.827880859375, -3.34130859375, -2.854736328125, -2.3681640625, -1.881591796875, -1.39501953125, -0.908447265625, -0.421875, 0.064697265625, 0.55126953125, 1.037841796875, 1.5244140625, 2.010986328125, 2.49755859375, 2.984130859375, 3.470703125, 3.957275390625, 4.44384765625, 4.930419921875, 5.4169921875, 5.903564453125, 6.39013671875, 6.876708984375, 7.36328125, 7.849853515625, 8.33642578125, 8.822998046875, 9.3095703125, 9.796142578125, 10.28271484375, 10.769287109375, 11.255859375, 11.742431640625, 12.22900390625, 12.715576171875, 13.2021484375, 13.688720703125, 14.17529296875, 14.661865234375, 15.1484375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 449.0, 563.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-841.950927734375, -827.4345092773438, -812.9180908203125, -798.4016723632812, -783.88525390625, -769.3687744140625, -754.8524169921875, -740.3359375, -725.8195190429688, -711.3031005859375, -696.7866821289062, -682.270263671875, -667.7538452148438, -653.2374267578125, -638.720947265625, -624.2045288085938, -609.6881103515625, -595.1716918945312, -580.6552734375, -566.1388549804688, -551.6224365234375, -537.10595703125, -522.589599609375, -508.0731506347656, -493.5567626953125, -479.04034423828125, -464.52392578125, -450.00750732421875, -435.4910583496094, -420.9746398925781, -406.4582214355469, -391.9418029785156, -377.4253845214844, -362.9089660644531, -348.3925476074219, -333.8760986328125, -319.35968017578125, -304.84326171875, -290.32684326171875, -275.8104248046875, -261.29400634765625, -246.777587890625, -232.2611541748047, -217.74473571777344, -203.22830200195312, -188.71188354492188, -174.19546508789062, -159.67904663085938, -145.16259765625, -130.64617919921875, -116.12974548339844, -101.61332702636719, -87.0969009399414, -72.58047485351562, -58.064056396484375, -43.547630310058594, -29.031204223632812, -14.514780044555664, 0.001644134521484375, 14.51806640625, 29.03449249267578, 43.55091857910156, 58.06733703613281, 72.5837631225586, 87.10018920898438]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 5.0, 10.0, 17.0, 14.0, 17.0, 13.0, 21.0, 20.0, 17.0, 33.0, 44.0, 26.0, 37.0, 37.0, 40.0, 34.0, 45.0, 35.0, 40.0, 41.0, 50.0, 40.0, 39.0, 44.0, 29.0, 32.0, 30.0, 25.0, 19.0, 21.0, 26.0, 6.0, 17.0, 15.0, 7.0, 6.0, 8.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-40.08253479003906, -38.81862258911133, -37.554710388183594, -36.290794372558594, -35.02688217163086, -33.762969970703125, -32.49905776977539, -31.235145568847656, -29.97123146057129, -28.707319259643555, -27.443405151367188, -26.179492950439453, -24.91558074951172, -23.65166664123535, -22.387754440307617, -21.12384033203125, -19.859928131103516, -18.59601593017578, -17.332101821899414, -16.06818962097168, -14.804276466369629, -13.540363311767578, -12.276451110839844, -11.012537956237793, -9.748624801635742, -8.484711647033691, -7.220798969268799, -5.956886291503906, -4.6929731369018555, -3.4290599822998047, -2.165147304534912, -0.9012346267700195, 0.3626823425292969, 1.6265952587127686, 2.8905081748962402, 4.154420852661133, 5.418334007263184, 6.682247161865234, 7.946159839630127, 9.21007251739502, 10.47398567199707, 11.737898826599121, 13.001811981201172, 14.265724182128906, 15.529637336730957, 16.793550491333008, 18.057462692260742, 19.32137680053711, 20.585289001464844, 21.849201202392578, 23.113115310668945, 24.37702751159668, 25.640941619873047, 26.90485382080078, 28.168766021728516, 29.43267822265625, 30.696592330932617, 31.96050453186035, 33.22441864013672, 34.48833084106445, 35.75224304199219, 37.01615905761719, 38.28007125854492, 39.543983459472656, 40.80789566040039]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 2.0, 9.0, 11.0, 13.0, 14.0, 19.0, 17.0, 16.0, 31.0, 28.0, 40.0, 34.0, 25.0, 49.0, 39.0, 47.0, 57.0, 45.0, 34.0, 53.0, 46.0, 48.0, 45.0, 37.0, 31.0, 28.0, 22.0, 28.0, 17.0, 17.0, 18.0, 22.0, 9.0, 10.0, 10.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.421875, -8.147705078125, -7.87353515625, -7.599365234375, -7.3251953125, -7.051025390625, -6.77685546875, -6.502685546875, -6.228515625, -5.954345703125, -5.68017578125, -5.406005859375, -5.1318359375, -4.857666015625, -4.58349609375, -4.309326171875, -4.03515625, -3.760986328125, -3.48681640625, -3.212646484375, -2.9384765625, -2.664306640625, -2.39013671875, -2.115966796875, -1.841796875, -1.567626953125, -1.29345703125, -1.019287109375, -0.7451171875, -0.470947265625, -0.19677734375, 0.077392578125, 0.3515625, 0.625732421875, 0.89990234375, 1.174072265625, 1.4482421875, 1.722412109375, 1.99658203125, 2.270751953125, 2.544921875, 2.819091796875, 3.09326171875, 3.367431640625, 3.6416015625, 3.915771484375, 4.18994140625, 4.464111328125, 4.73828125, 5.012451171875, 5.28662109375, 5.560791015625, 5.8349609375, 6.109130859375, 6.38330078125, 6.657470703125, 6.931640625, 7.205810546875, 7.47998046875, 7.754150390625, 8.0283203125, 8.302490234375, 8.57666015625, 8.850830078125, 9.125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 9.0, 7.0, 21.0, 23.0, 40.0, 64.0, 90.0, 148.0, 229.0, 365.0, 614.0, 1013.0, 1784.0, 2963.0, 5014.0, 8492.0, 14344.0, 24034.0, 39001.0, 62561.0, 93118.0, 127289.0, 150030.0, 149248.0, 123957.0, 90364.0, 59928.0, 37522.0, 22999.0, 13354.0, 8020.0, 4787.0, 2763.0, 1753.0, 997.0, 585.0, 410.0, 215.0, 147.0, 76.0, 58.0, 46.0, 22.0, 21.0, 5.0, 4.0, 9.0, 6.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.01953125, -0.9876251220703125, -0.955718994140625, -0.9238128662109375, -0.89190673828125, -0.8600006103515625, -0.828094482421875, -0.7961883544921875, -0.7642822265625, -0.7323760986328125, -0.700469970703125, -0.6685638427734375, -0.63665771484375, -0.6047515869140625, -0.572845458984375, -0.5409393310546875, -0.509033203125, -0.4771270751953125, -0.445220947265625, -0.4133148193359375, -0.38140869140625, -0.3495025634765625, -0.317596435546875, -0.2856903076171875, -0.2537841796875, -0.2218780517578125, -0.189971923828125, -0.1580657958984375, -0.12615966796875, -0.0942535400390625, -0.062347412109375, -0.0304412841796875, 0.00146484375, 0.0333709716796875, 0.065277099609375, 0.0971832275390625, 0.12908935546875, 0.1609954833984375, 0.192901611328125, 0.2248077392578125, 0.2567138671875, 0.2886199951171875, 0.320526123046875, 0.3524322509765625, 0.38433837890625, 0.4162445068359375, 0.448150634765625, 0.4800567626953125, 0.511962890625, 0.5438690185546875, 0.575775146484375, 0.6076812744140625, 0.63958740234375, 0.6714935302734375, 0.703399658203125, 0.7353057861328125, 0.7672119140625, 0.7991180419921875, 0.831024169921875, 0.8629302978515625, 0.89483642578125, 0.9267425537109375, 0.958648681640625, 0.9905548095703125, 1.0224609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 9.0, 11.0, 7.0, 11.0, 16.0, 15.0, 20.0, 21.0, 24.0, 29.0, 37.0, 27.0, 32.0, 34.0, 36.0, 46.0, 40.0, 46.0, 33.0, 1060.0, 45.0, 42.0, 34.0, 26.0, 32.0, 42.0, 36.0, 24.0, 24.0, 19.0, 30.0, 16.0, 21.0, 23.0, 10.0, 8.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8828125, -5.70599365234375, -5.5291748046875, -5.35235595703125, -5.175537109375, -4.99871826171875, -4.8218994140625, -4.64508056640625, -4.46826171875, -4.29144287109375, -4.1146240234375, -3.93780517578125, -3.760986328125, -3.58416748046875, -3.4073486328125, -3.23052978515625, -3.0537109375, -2.87689208984375, -2.7000732421875, -2.52325439453125, -2.346435546875, -2.16961669921875, -1.9927978515625, -1.81597900390625, -1.63916015625, -1.46234130859375, -1.2855224609375, -1.10870361328125, -0.931884765625, -0.75506591796875, -0.5782470703125, -0.40142822265625, -0.224609375, -0.04779052734375, 0.1290283203125, 0.30584716796875, 0.482666015625, 0.65948486328125, 0.8363037109375, 1.01312255859375, 1.18994140625, 1.36676025390625, 1.5435791015625, 1.72039794921875, 1.897216796875, 2.07403564453125, 2.2508544921875, 2.42767333984375, 2.6044921875, 2.78131103515625, 2.9581298828125, 3.13494873046875, 3.311767578125, 3.48858642578125, 3.6654052734375, 3.84222412109375, 4.01904296875, 4.19586181640625, 4.3726806640625, 4.54949951171875, 4.726318359375, 4.90313720703125, 5.0799560546875, 5.25677490234375, 5.43359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 7.0, 15.0, 19.0, 18.0, 35.0, 44.0, 69.0, 88.0, 125.0, 257.0, 357.0, 606.0, 915.0, 1454.0, 2512.0, 4015.0, 6618.0, 10629.0, 17939.0, 30551.0, 72221.0, 1860196.0, 35766.0, 20952.0, 12518.0, 7479.0, 4482.0, 2736.0, 1673.0, 1038.0, 652.0, 393.0, 269.0, 152.0, 100.0, 71.0, 41.0, 26.0, 20.0, 15.0, 9.0, 9.0, 6.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.07421875, -2.005401611328125, -1.93658447265625, -1.867767333984375, -1.7989501953125, -1.730133056640625, -1.66131591796875, -1.592498779296875, -1.523681640625, -1.454864501953125, -1.38604736328125, -1.317230224609375, -1.2484130859375, -1.179595947265625, -1.11077880859375, -1.041961669921875, -0.97314453125, -0.904327392578125, -0.83551025390625, -0.766693115234375, -0.6978759765625, -0.629058837890625, -0.56024169921875, -0.491424560546875, -0.422607421875, -0.353790283203125, -0.28497314453125, -0.216156005859375, -0.1473388671875, -0.078521728515625, -0.00970458984375, 0.059112548828125, 0.1279296875, 0.196746826171875, 0.26556396484375, 0.334381103515625, 0.4031982421875, 0.472015380859375, 0.54083251953125, 0.609649658203125, 0.678466796875, 0.747283935546875, 0.81610107421875, 0.884918212890625, 0.9537353515625, 1.022552490234375, 1.09136962890625, 1.160186767578125, 1.22900390625, 1.297821044921875, 1.36663818359375, 1.435455322265625, 1.5042724609375, 1.573089599609375, 1.64190673828125, 1.710723876953125, 1.779541015625, 1.848358154296875, 1.91717529296875, 1.985992431640625, 2.0548095703125, 2.123626708984375, 2.19244384765625, 2.261260986328125, 2.330078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 10.0, 14.0, 11.0, 18.0, 28.0, 24.0, 32.0, 35.0, 49.0, 54.0, 47.0, 68.0, 65.0, 62.0, 75.0, 83.0, 39.0, 49.0, 32.0, 38.0, 29.0, 28.0, 19.0, 15.0, 12.0, 10.0, 8.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037841796875, -0.03671121597290039, -0.03558063507080078, -0.03445005416870117, -0.03331947326660156, -0.03218889236450195, -0.031058311462402344, -0.029927730560302734, -0.028797149658203125, -0.027666568756103516, -0.026535987854003906, -0.025405406951904297, -0.024274826049804688, -0.023144245147705078, -0.02201366424560547, -0.02088308334350586, -0.01975250244140625, -0.01862192153930664, -0.01749134063720703, -0.016360759735107422, -0.015230178833007812, -0.014099597930908203, -0.012969017028808594, -0.011838436126708984, -0.010707855224609375, -0.009577274322509766, -0.008446693420410156, -0.007316112518310547, -0.0061855316162109375, -0.005054950714111328, -0.003924369812011719, -0.0027937889099121094, -0.0016632080078125, -0.0005326271057128906, 0.0005979537963867188, 0.0017285346984863281, 0.0028591156005859375, 0.003989696502685547, 0.005120277404785156, 0.006250858306884766, 0.007381439208984375, 0.008512020111083984, 0.009642601013183594, 0.010773181915283203, 0.011903762817382812, 0.013034343719482422, 0.014164924621582031, 0.01529550552368164, 0.01642608642578125, 0.01755666732788086, 0.01868724822998047, 0.019817829132080078, 0.020948410034179688, 0.022078990936279297, 0.023209571838378906, 0.024340152740478516, 0.025470733642578125, 0.026601314544677734, 0.027731895446777344, 0.028862476348876953, 0.029993057250976562, 0.031123638153076172, 0.03225421905517578, 0.03338479995727539, 0.034515380859375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 8.0, 13.0, 17.0, 20.0, 32.0, 43.0, 49.0, 78.0, 96.0, 145.0, 231.0, 474.0, 1512.0, 1027114.0, 16927.0, 730.0, 341.0, 187.0, 138.0, 105.0, 55.0, 47.0, 37.0, 35.0, 20.0, 23.0, 9.0, 15.0, 6.0, 7.0, 8.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71484375, -0.69158935546875, -0.6683349609375, -0.64508056640625, -0.621826171875, -0.59857177734375, -0.5753173828125, -0.55206298828125, -0.52880859375, -0.50555419921875, -0.4822998046875, -0.45904541015625, -0.435791015625, -0.41253662109375, -0.3892822265625, -0.36602783203125, -0.3427734375, -0.31951904296875, -0.2962646484375, -0.27301025390625, -0.249755859375, -0.22650146484375, -0.2032470703125, -0.17999267578125, -0.15673828125, -0.13348388671875, -0.1102294921875, -0.08697509765625, -0.063720703125, -0.04046630859375, -0.0172119140625, 0.00604248046875, 0.029296875, 0.05255126953125, 0.0758056640625, 0.09906005859375, 0.122314453125, 0.14556884765625, 0.1688232421875, 0.19207763671875, 0.21533203125, 0.23858642578125, 0.2618408203125, 0.28509521484375, 0.308349609375, 0.33160400390625, 0.3548583984375, 0.37811279296875, 0.4013671875, 0.42462158203125, 0.4478759765625, 0.47113037109375, 0.494384765625, 0.51763916015625, 0.5408935546875, 0.56414794921875, 0.58740234375, 0.61065673828125, 0.6339111328125, 0.65716552734375, 0.680419921875, 0.70367431640625, 0.7269287109375, 0.75018310546875, 0.7734375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 190.0, 820.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.690528154373169, -0.6748971939086914, -0.6592662334442139, -0.6436353325843811, -0.6280043721199036, -0.612373411655426, -0.5967425107955933, -0.5811115503311157, -0.5654805898666382, -0.5498496294021606, -0.5342186689376831, -0.5185877680778503, -0.5029568076133728, -0.48732584714889526, -0.4716949164867401, -0.45606398582458496, -0.4404330253601074, -0.4248020648956299, -0.40917113423347473, -0.3935402035713196, -0.37790924310684204, -0.3622782826423645, -0.34664735198020935, -0.3310164213180542, -0.31538546085357666, -0.2997545003890991, -0.28412356972694397, -0.2684926390647888, -0.2528616786003113, -0.23723073303699493, -0.2215997874736786, -0.20596884191036224, -0.1903378963470459, -0.17470695078372955, -0.1590760052204132, -0.14344505965709686, -0.12781411409378052, -0.11218316853046417, -0.09655222296714783, -0.08092127740383148, -0.06529033184051514, -0.04965938627719879, -0.034028440713882446, -0.0183974951505661, -0.002766549587249756, 0.01286439597606659, 0.028495341539382935, 0.04412628710269928, 0.059757232666015625, 0.07538817822933197, 0.09101912379264832, 0.10665006935596466, 0.122281014919281, 0.13791196048259735, 0.1535429060459137, 0.16917385160923004, 0.1848047971725464, 0.20043574273586273, 0.21606668829917908, 0.23169763386249542, 0.24732857942581177, 0.2629595398902893, 0.27859047055244446, 0.2942214012145996, 0.30985236167907715]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 5.0, 7.0, 8.0, 11.0, 5.0, 12.0, 14.0, 5.0, 11.0, 15.0, 22.0, 22.0, 29.0, 25.0, 25.0, 31.0, 35.0, 30.0, 33.0, 41.0, 42.0, 34.0, 36.0, 45.0, 38.0, 35.0, 36.0, 33.0, 31.0, 40.0, 35.0, 24.0, 15.0, 21.0, 27.0, 22.0, 15.0, 14.0, 13.0, 12.0, 11.0, 6.0, 9.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04829782247543335, -0.046756841242313385, -0.04521586000919342, -0.043674882501363754, -0.04213390126824379, -0.040592920035123825, -0.03905194252729416, -0.037510961294174194, -0.03596998006105423, -0.034428998827934265, -0.0328880175948143, -0.031347040086984634, -0.02980605885386467, -0.028265077620744705, -0.02672409825026989, -0.025183118879795074, -0.02364213764667511, -0.022101156413555145, -0.02056017704308033, -0.019019197672605515, -0.01747821643948555, -0.015937235206365585, -0.01439625583589077, -0.01285527553409338, -0.01131429523229599, -0.0097733149304986, -0.00823233462870121, -0.00669135432690382, -0.00515037402510643, -0.00360939372330904, -0.00206841342151165, -0.0005274331197142601, 0.0010135471820831299, 0.00255452748388052, 0.00409550778567791, 0.0056364880874753, 0.00717746838927269, 0.00871844869107008, 0.01025942899286747, 0.01180040929466486, 0.01334138959646225, 0.01488236989825964, 0.01642335020005703, 0.017964329570531845, 0.01950531080365181, 0.021046292036771774, 0.02258727140724659, 0.024128250777721405, 0.02566923201084137, 0.027210213243961334, 0.02875119261443615, 0.030292171984910965, 0.03183315321803093, 0.033374134451150894, 0.03491511195898056, 0.036456093192100525, 0.03799707442522049, 0.039538055658340454, 0.04107903689146042, 0.042620014399290085, 0.04416099563241005, 0.045701976865530014, 0.04724295437335968, 0.048783935606479645, 0.05032491683959961]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 4.0, 6.0, 8.0, 7.0, 15.0, 13.0, 11.0, 21.0, 33.0, 23.0, 20.0, 20.0, 31.0, 42.0, 37.0, 33.0, 34.0, 35.0, 39.0, 41.0, 46.0, 47.0, 39.0, 41.0, 43.0, 45.0, 33.0, 33.0, 31.0, 25.0, 24.0, 18.0, 9.0, 11.0, 13.0, 10.0, 9.0, 15.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.9140625, -7.66790771484375, -7.4217529296875, -7.17559814453125, -6.929443359375, -6.68328857421875, -6.4371337890625, -6.19097900390625, -5.94482421875, -5.69866943359375, -5.4525146484375, -5.20635986328125, -4.960205078125, -4.71405029296875, -4.4678955078125, -4.22174072265625, -3.9755859375, -3.72943115234375, -3.4832763671875, -3.23712158203125, -2.990966796875, -2.74481201171875, -2.4986572265625, -2.25250244140625, -2.00634765625, -1.76019287109375, -1.5140380859375, -1.26788330078125, -1.021728515625, -0.77557373046875, -0.5294189453125, -0.28326416015625, -0.037109375, 0.20904541015625, 0.4552001953125, 0.70135498046875, 0.947509765625, 1.19366455078125, 1.4398193359375, 1.68597412109375, 1.93212890625, 2.17828369140625, 2.4244384765625, 2.67059326171875, 2.916748046875, 3.16290283203125, 3.4090576171875, 3.65521240234375, 3.9013671875, 4.14752197265625, 4.3936767578125, 4.63983154296875, 4.885986328125, 5.13214111328125, 5.3782958984375, 5.62445068359375, 5.87060546875, 6.11676025390625, 6.3629150390625, 6.60906982421875, 6.855224609375, 7.10137939453125, 7.3475341796875, 7.59368896484375, 7.83984375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 0.0, 6.0, 3.0, 4.0, 16.0, 22.0, 33.0, 27.0, 35.0, 64.0, 89.0, 158.0, 198.0, 366.0, 694.0, 1371.0, 2809.0, 5873.0, 13071.0, 30147.0, 67032.0, 154932.0, 328009.0, 250053.0, 107339.0, 47373.0, 21014.0, 9328.0, 4210.0, 1919.0, 980.0, 521.0, 270.0, 162.0, 133.0, 89.0, 60.0, 38.0, 30.0, 22.0, 14.0, 8.0, 11.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-11.3203125, -10.9852294921875, -10.650146484375, -10.3150634765625, -9.97998046875, -9.6448974609375, -9.309814453125, -8.9747314453125, -8.6396484375, -8.3045654296875, -7.969482421875, -7.6343994140625, -7.29931640625, -6.9642333984375, -6.629150390625, -6.2940673828125, -5.958984375, -5.6239013671875, -5.288818359375, -4.9537353515625, -4.61865234375, -4.2835693359375, -3.948486328125, -3.6134033203125, -3.2783203125, -2.9432373046875, -2.608154296875, -2.2730712890625, -1.93798828125, -1.6029052734375, -1.267822265625, -0.9327392578125, -0.59765625, -0.2625732421875, 0.072509765625, 0.4075927734375, 0.74267578125, 1.0777587890625, 1.412841796875, 1.7479248046875, 2.0830078125, 2.4180908203125, 2.753173828125, 3.0882568359375, 3.42333984375, 3.7584228515625, 4.093505859375, 4.4285888671875, 4.763671875, 5.0987548828125, 5.433837890625, 5.7689208984375, 6.10400390625, 6.4390869140625, 6.774169921875, 7.1092529296875, 7.4443359375, 7.7794189453125, 8.114501953125, 8.4495849609375, 8.78466796875, 9.1197509765625, 9.454833984375, 9.7899169921875, 10.125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 10.0, 18.0, 9.0, 13.0, 20.0, 26.0, 24.0, 36.0, 46.0, 37.0, 59.0, 59.0, 76.0, 98.0, 162.0, 1333.0, 293.0, 178.0, 92.0, 77.0, 53.0, 42.0, 33.0, 27.0, 30.0, 26.0, 27.0, 26.0, 22.0, 13.0, 7.0, 10.0, 7.0, 9.0, 5.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.953125, -18.273681640625, -17.59423828125, -16.914794921875, -16.2353515625, -15.555908203125, -14.87646484375, -14.197021484375, -13.517578125, -12.838134765625, -12.15869140625, -11.479248046875, -10.7998046875, -10.120361328125, -9.44091796875, -8.761474609375, -8.08203125, -7.402587890625, -6.72314453125, -6.043701171875, -5.3642578125, -4.684814453125, -4.00537109375, -3.325927734375, -2.646484375, -1.967041015625, -1.28759765625, -0.608154296875, 0.0712890625, 0.750732421875, 1.43017578125, 2.109619140625, 2.7890625, 3.468505859375, 4.14794921875, 4.827392578125, 5.5068359375, 6.186279296875, 6.86572265625, 7.545166015625, 8.224609375, 8.904052734375, 9.58349609375, 10.262939453125, 10.9423828125, 11.621826171875, 12.30126953125, 12.980712890625, 13.66015625, 14.339599609375, 15.01904296875, 15.698486328125, 16.3779296875, 17.057373046875, 17.73681640625, 18.416259765625, 19.095703125, 19.775146484375, 20.45458984375, 21.134033203125, 21.8134765625, 22.492919921875, 23.17236328125, 23.851806640625, 24.53125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 8.0, 6.0, 9.0, 10.0, 16.0, 19.0, 32.0, 32.0, 48.0, 79.0, 110.0, 216.0, 295.0, 494.0, 1074.0, 6230.0, 147995.0, 2872184.0, 109508.0, 4955.0, 1019.0, 499.0, 282.0, 177.0, 117.0, 97.0, 45.0, 37.0, 31.0, 16.0, 15.0, 9.0, 5.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.53125, -40.2900390625, -39.048828125, -37.8076171875, -36.56640625, -35.3251953125, -34.083984375, -32.8427734375, -31.6015625, -30.3603515625, -29.119140625, -27.8779296875, -26.63671875, -25.3955078125, -24.154296875, -22.9130859375, -21.671875, -20.4306640625, -19.189453125, -17.9482421875, -16.70703125, -15.4658203125, -14.224609375, -12.9833984375, -11.7421875, -10.5009765625, -9.259765625, -8.0185546875, -6.77734375, -5.5361328125, -4.294921875, -3.0537109375, -1.8125, -0.5712890625, 0.669921875, 1.9111328125, 3.15234375, 4.3935546875, 5.634765625, 6.8759765625, 8.1171875, 9.3583984375, 10.599609375, 11.8408203125, 13.08203125, 14.3232421875, 15.564453125, 16.8056640625, 18.046875, 19.2880859375, 20.529296875, 21.7705078125, 23.01171875, 24.2529296875, 25.494140625, 26.7353515625, 27.9765625, 29.2177734375, 30.458984375, 31.7001953125, 32.94140625, 34.1826171875, 35.423828125, 36.6650390625, 37.90625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 13.0, 14.0, 37.0, 53.0, 96.0, 129.0, 162.0, 154.0, 136.0, 88.0, 48.0, 39.0, 21.0, 12.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-72.81449127197266, -71.19512939453125, -69.57576751708984, -67.95640563964844, -66.33704376220703, -64.71768188476562, -63.09831619262695, -61.47895431518555, -59.85959243774414, -58.240230560302734, -56.62086868286133, -55.00150680541992, -53.38214111328125, -51.762779235839844, -50.14341735839844, -48.52405548095703, -46.904693603515625, -45.28533172607422, -43.66596984863281, -42.046607971191406, -40.42724609375, -38.807884216308594, -37.18851852416992, -35.569156646728516, -33.94979476928711, -32.3304328918457, -30.711071014404297, -29.091707229614258, -27.47234535217285, -25.852983474731445, -24.233619689941406, -22.6142578125, -20.99489974975586, -19.375537872314453, -17.756175994873047, -16.136812210083008, -14.517450332641602, -12.898088455200195, -11.278725624084473, -9.65936279296875, -8.040000915527344, -6.420638561248779, -4.801276206970215, -3.1819138526916504, -1.562551498413086, 0.05681037902832031, 1.676173210144043, 3.2955360412597656, 4.914897918701172, 6.534260272979736, 8.1536226272583, 9.772985458374023, 11.39234733581543, 13.011709213256836, 14.631072044372559, 16.25043487548828, 17.869796752929688, 19.489158630371094, 21.1085205078125, 22.72788429260254, 24.347246170043945, 25.96660804748535, 27.58597183227539, 29.205333709716797, 30.824695587158203]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 0.0, 7.0, 7.0, 7.0, 5.0, 8.0, 20.0, 17.0, 11.0, 16.0, 12.0, 17.0, 17.0, 25.0, 27.0, 31.0, 34.0, 30.0, 25.0, 39.0, 35.0, 30.0, 40.0, 31.0, 32.0, 36.0, 47.0, 40.0, 33.0, 30.0, 21.0, 22.0, 35.0, 29.0, 21.0, 25.0, 21.0, 16.0, 12.0, 18.0, 18.0, 13.0, 8.0, 4.0, 0.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.47837829589844, -42.0676383972168, -40.65690231323242, -39.24616241455078, -37.83542251586914, -36.424686431884766, -35.013946533203125, -33.60321044921875, -32.19247055053711, -30.7817325592041, -29.37099266052246, -27.960254669189453, -26.549516677856445, -25.138778686523438, -23.728038787841797, -22.31730079650879, -20.90656089782715, -19.49582290649414, -18.0850830078125, -16.674345016479492, -15.263607025146484, -13.85286808013916, -12.442129135131836, -11.031391143798828, -9.620652198791504, -8.20991325378418, -6.799175262451172, -5.388436317443848, -3.9776978492736816, -2.5669593811035156, -1.1562204360961914, 0.2545175552368164, 1.6652565002441406, 3.0759949684143066, 4.486733436584473, 5.897472381591797, 7.308210849761963, 8.718949317932129, 10.129688262939453, 11.540426254272461, 12.951165199279785, 14.36190414428711, 15.772642135620117, 17.183380126953125, 18.594120025634766, 20.004858016967773, 21.41559600830078, 22.826335906982422, 24.23707389831543, 25.647811889648438, 27.058551788330078, 28.469289779663086, 29.880027770996094, 31.290767669677734, 32.701507568359375, 34.11224365234375, 35.52298355102539, 36.93372344970703, 38.344459533691406, 39.75519943237305, 41.16593933105469, 42.57667541503906, 43.9874153137207, 45.398155212402344, 46.80889129638672]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 6.0, 11.0, 8.0, 12.0, 14.0, 15.0, 22.0, 29.0, 26.0, 22.0, 28.0, 31.0, 33.0, 45.0, 38.0, 37.0, 48.0, 45.0, 34.0, 49.0, 53.0, 39.0, 37.0, 46.0, 30.0, 38.0, 32.0, 27.0, 27.0, 21.0, 17.0, 21.0, 5.0, 8.0, 7.0, 8.0, 8.0, 5.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.90625, -8.6322021484375, -8.358154296875, -8.0841064453125, -7.81005859375, -7.5360107421875, -7.261962890625, -6.9879150390625, -6.7138671875, -6.4398193359375, -6.165771484375, -5.8917236328125, -5.61767578125, -5.3436279296875, -5.069580078125, -4.7955322265625, -4.521484375, -4.2474365234375, -3.973388671875, -3.6993408203125, -3.42529296875, -3.1512451171875, -2.877197265625, -2.6031494140625, -2.3291015625, -2.0550537109375, -1.781005859375, -1.5069580078125, -1.23291015625, -0.9588623046875, -0.684814453125, -0.4107666015625, -0.13671875, 0.1373291015625, 0.411376953125, 0.6854248046875, 0.95947265625, 1.2335205078125, 1.507568359375, 1.7816162109375, 2.0556640625, 2.3297119140625, 2.603759765625, 2.8778076171875, 3.15185546875, 3.4259033203125, 3.699951171875, 3.9739990234375, 4.248046875, 4.5220947265625, 4.796142578125, 5.0701904296875, 5.34423828125, 5.6182861328125, 5.892333984375, 6.1663818359375, 6.4404296875, 6.7144775390625, 6.988525390625, 7.2625732421875, 7.53662109375, 7.8106689453125, 8.084716796875, 8.3587646484375, 8.6328125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 10.0, 7.0, 14.0, 8.0, 19.0, 16.0, 14.0, 26.0, 27.0, 57.0, 57.0, 70.0, 85.0, 145.0, 199.0, 244.0, 393.0, 1066.0, 62963.0, 4061679.0, 64676.0, 1114.0, 392.0, 247.0, 199.0, 135.0, 99.0, 62.0, 58.0, 42.0, 33.0, 24.0, 16.0, 15.0, 19.0, 13.0, 7.0, 8.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.28125, -59.3359375, -57.390625, -55.4453125, -53.5, -51.5546875, -49.609375, -47.6640625, -45.71875, -43.7734375, -41.828125, -39.8828125, -37.9375, -35.9921875, -34.046875, -32.1015625, -30.15625, -28.2109375, -26.265625, -24.3203125, -22.375, -20.4296875, -18.484375, -16.5390625, -14.59375, -12.6484375, -10.703125, -8.7578125, -6.8125, -4.8671875, -2.921875, -0.9765625, 0.96875, 2.9140625, 4.859375, 6.8046875, 8.75, 10.6953125, 12.640625, 14.5859375, 16.53125, 18.4765625, 20.421875, 22.3671875, 24.3125, 26.2578125, 28.203125, 30.1484375, 32.09375, 34.0390625, 35.984375, 37.9296875, 39.875, 41.8203125, 43.765625, 45.7109375, 47.65625, 49.6015625, 51.546875, 53.4921875, 55.4375, 57.3828125, 59.328125, 61.2734375, 63.21875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 9.0, 5.0, 6.0, 9.0, 10.0, 12.0, 19.0, 25.0, 25.0, 35.0, 46.0, 72.0, 69.0, 117.0, 164.0, 203.0, 283.0, 406.0, 481.0, 484.0, 422.0, 335.0, 238.0, 158.0, 108.0, 88.0, 53.0, 42.0, 33.0, 26.0, 16.0, 15.0, 14.0, 9.0, 10.0, 3.0, 5.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3125, -11.9520263671875, -11.591552734375, -11.2310791015625, -10.87060546875, -10.5101318359375, -10.149658203125, -9.7891845703125, -9.4287109375, -9.0682373046875, -8.707763671875, -8.3472900390625, -7.98681640625, -7.6263427734375, -7.265869140625, -6.9053955078125, -6.544921875, -6.1844482421875, -5.823974609375, -5.4635009765625, -5.10302734375, -4.7425537109375, -4.382080078125, -4.0216064453125, -3.6611328125, -3.3006591796875, -2.940185546875, -2.5797119140625, -2.21923828125, -1.8587646484375, -1.498291015625, -1.1378173828125, -0.77734375, -0.4168701171875, -0.056396484375, 0.3040771484375, 0.66455078125, 1.0250244140625, 1.385498046875, 1.7459716796875, 2.1064453125, 2.4669189453125, 2.827392578125, 3.1878662109375, 3.54833984375, 3.9088134765625, 4.269287109375, 4.6297607421875, 4.990234375, 5.3507080078125, 5.711181640625, 6.0716552734375, 6.43212890625, 6.7926025390625, 7.153076171875, 7.5135498046875, 7.8740234375, 8.2344970703125, 8.594970703125, 8.9554443359375, 9.31591796875, 9.6763916015625, 10.036865234375, 10.3973388671875, 10.7578125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 6.0, 12.0, 8.0, 10.0, 24.0, 35.0, 36.0, 48.0, 80.0, 78.0, 169.0, 242.0, 607.0, 2995.0, 29864.0, 529507.0, 3385016.0, 227275.0, 15234.0, 1853.0, 467.0, 226.0, 114.0, 103.0, 65.0, 55.0, 30.0, 28.0, 24.0, 9.0, 9.0, 7.0, 12.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-35.4375, -34.435546875, -33.43359375, -32.431640625, -31.4296875, -30.427734375, -29.42578125, -28.423828125, -27.421875, -26.419921875, -25.41796875, -24.416015625, -23.4140625, -22.412109375, -21.41015625, -20.408203125, -19.40625, -18.404296875, -17.40234375, -16.400390625, -15.3984375, -14.396484375, -13.39453125, -12.392578125, -11.390625, -10.388671875, -9.38671875, -8.384765625, -7.3828125, -6.380859375, -5.37890625, -4.376953125, -3.375, -2.373046875, -1.37109375, -0.369140625, 0.6328125, 1.634765625, 2.63671875, 3.638671875, 4.640625, 5.642578125, 6.64453125, 7.646484375, 8.6484375, 9.650390625, 10.65234375, 11.654296875, 12.65625, 13.658203125, 14.66015625, 15.662109375, 16.6640625, 17.666015625, 18.66796875, 19.669921875, 20.671875, 21.673828125, 22.67578125, 23.677734375, 24.6796875, 25.681640625, 26.68359375, 27.685546875, 28.6875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 32.0, 374.0, 506.0, 101.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.53179931640625, -72.67732238769531, -63.822837829589844, -54.96835708618164, -46.11387634277344, -37.259395599365234, -28.40491485595703, -19.550434112548828, -10.695953369140625, -1.8414726257324219, 7.013008117675781, 15.867488861083984, 24.721969604492188, 33.57645034790039, 42.430931091308594, 51.2854118347168, 60.139892578125, 68.99436950683594, 77.8488540649414, 86.70333862304688, 95.55781555175781, 104.41229248046875, 113.26677703857422, 122.12126159667969, 130.97573852539062, 139.83021545410156, 148.6846923828125, 157.5391845703125, 166.39366149902344, 175.24813842773438, 184.10263061523438, 192.9571075439453, 201.81158447265625, 210.6660614013672, 219.52053833007812, 228.37503051757812, 237.22950744628906, 246.083984375, 254.9384765625, 263.7929382324219, 272.6474304199219, 281.5019226074219, 290.35638427734375, 299.21087646484375, 308.06536865234375, 316.9198303222656, 325.7743225097656, 334.6287841796875, 343.4832763671875, 352.3377685546875, 361.1922302246094, 370.0467224121094, 378.90118408203125, 387.75567626953125, 396.61016845703125, 405.4646301269531, 414.3191223144531, 423.1736145019531, 432.028076171875, 440.882568359375, 449.737060546875, 458.5915222167969, 467.4460144042969, 476.30047607421875, 485.15496826171875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 8.0, 6.0, 7.0, 5.0, 10.0, 13.0, 11.0, 19.0, 18.0, 24.0, 27.0, 24.0, 30.0, 28.0, 32.0, 25.0, 37.0, 36.0, 32.0, 44.0, 39.0, 44.0, 34.0, 33.0, 34.0, 34.0, 38.0, 37.0, 29.0, 28.0, 24.0, 24.0, 32.0, 20.0, 20.0, 20.0, 8.0, 12.0, 10.0, 13.0, 8.0, 8.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-40.677276611328125, -39.457611083984375, -38.23794937133789, -37.01828384399414, -35.79861831665039, -34.578956604003906, -33.359291076660156, -32.139625549316406, -30.91996192932129, -29.700298309326172, -28.480632781982422, -27.260969161987305, -26.041305541992188, -24.821640014648438, -23.60197639465332, -22.382312774658203, -21.162647247314453, -19.942983627319336, -18.723318099975586, -17.50365447998047, -16.28398895263672, -15.064325332641602, -13.844661712646484, -12.62499713897705, -11.405332565307617, -10.185667991638184, -8.96600341796875, -7.746339797973633, -6.526675224304199, -5.307010650634766, -4.08734655380249, -2.867682456970215, -1.6480140686035156, -0.42834973335266113, 0.7913146018981934, 2.010978937149048, 3.2306432723999023, 4.450307846069336, 5.669971942901611, 6.889636039733887, 8.10930061340332, 9.328965187072754, 10.548629760742188, 11.768293380737305, 12.987957954406738, 14.207622528076172, 15.427286148071289, 16.646949768066406, 17.866615295410156, 19.086278915405273, 20.305944442749023, 21.52560806274414, 22.74527359008789, 23.964937210083008, 25.184600830078125, 26.404266357421875, 27.623929977416992, 28.84359359741211, 30.06325912475586, 31.282922744750977, 32.502586364746094, 33.722251892089844, 34.941917419433594, 36.16157913208008, 37.38124465942383]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 1.0, 4.0, 7.0, 6.0, 8.0, 8.0, 8.0, 15.0, 9.0, 24.0, 13.0, 15.0, 20.0, 25.0, 24.0, 30.0, 34.0, 35.0, 43.0, 32.0, 40.0, 35.0, 37.0, 37.0, 42.0, 55.0, 43.0, 37.0, 32.0, 27.0, 28.0, 25.0, 19.0, 27.0, 27.0, 22.0, 15.0, 16.0, 15.0, 9.0, 14.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.44140625, -7.2091064453125, -6.976806640625, -6.7445068359375, -6.51220703125, -6.2799072265625, -6.047607421875, -5.8153076171875, -5.5830078125, -5.3507080078125, -5.118408203125, -4.8861083984375, -4.65380859375, -4.4215087890625, -4.189208984375, -3.9569091796875, -3.724609375, -3.4923095703125, -3.260009765625, -3.0277099609375, -2.79541015625, -2.5631103515625, -2.330810546875, -2.0985107421875, -1.8662109375, -1.6339111328125, -1.401611328125, -1.1693115234375, -0.93701171875, -0.7047119140625, -0.472412109375, -0.2401123046875, -0.0078125, 0.2244873046875, 0.456787109375, 0.6890869140625, 0.92138671875, 1.1536865234375, 1.385986328125, 1.6182861328125, 1.8505859375, 2.0828857421875, 2.315185546875, 2.5474853515625, 2.77978515625, 3.0120849609375, 3.244384765625, 3.4766845703125, 3.708984375, 3.9412841796875, 4.173583984375, 4.4058837890625, 4.63818359375, 4.8704833984375, 5.102783203125, 5.3350830078125, 5.5673828125, 5.7996826171875, 6.031982421875, 6.2642822265625, 6.49658203125, 6.7288818359375, 6.961181640625, 7.1934814453125, 7.42578125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 5.0, 5.0, 6.0, 13.0, 23.0, 20.0, 49.0, 64.0, 74.0, 149.0, 214.0, 283.0, 419.0, 681.0, 1049.0, 1629.0, 2455.0, 3716.0, 5537.0, 8427.0, 12353.0, 18552.0, 27587.0, 39737.0, 55405.0, 75573.0, 96354.0, 114601.0, 122122.0, 113913.0, 95995.0, 75111.0, 55244.0, 38760.0, 27489.0, 18496.0, 12353.0, 8140.0, 5212.0, 3663.0, 2331.0, 1627.0, 1020.0, 699.0, 460.0, 338.0, 184.0, 134.0, 112.0, 64.0, 41.0, 31.0, 15.0, 15.0, 8.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.80322265625, -0.7777099609375, -0.752197265625, -0.7266845703125, -0.701171875, -0.6756591796875, -0.650146484375, -0.6246337890625, -0.59912109375, -0.5736083984375, -0.548095703125, -0.5225830078125, -0.4970703125, -0.4715576171875, -0.446044921875, -0.4205322265625, -0.39501953125, -0.3695068359375, -0.343994140625, -0.3184814453125, -0.29296875, -0.2674560546875, -0.241943359375, -0.2164306640625, -0.19091796875, -0.1654052734375, -0.139892578125, -0.1143798828125, -0.0888671875, -0.0633544921875, -0.037841796875, -0.0123291015625, 0.01318359375, 0.0386962890625, 0.064208984375, 0.0897216796875, 0.115234375, 0.1407470703125, 0.166259765625, 0.1917724609375, 0.21728515625, 0.2427978515625, 0.268310546875, 0.2938232421875, 0.3193359375, 0.3448486328125, 0.370361328125, 0.3958740234375, 0.42138671875, 0.4468994140625, 0.472412109375, 0.4979248046875, 0.5234375, 0.5489501953125, 0.574462890625, 0.5999755859375, 0.62548828125, 0.6510009765625, 0.676513671875, 0.7020263671875, 0.7275390625, 0.7530517578125, 0.778564453125, 0.8040771484375, 0.82958984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 12.0, 5.0, 10.0, 13.0, 18.0, 12.0, 21.0, 13.0, 9.0, 24.0, 13.0, 28.0, 32.0, 20.0, 35.0, 32.0, 33.0, 33.0, 39.0, 33.0, 1062.0, 31.0, 46.0, 36.0, 31.0, 36.0, 35.0, 31.0, 33.0, 30.0, 22.0, 16.0, 23.0, 16.0, 14.0, 16.0, 11.0, 14.0, 12.0, 10.0, 10.0, 6.0, 3.0, 11.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.0, -4.84722900390625, -4.6944580078125, -4.54168701171875, -4.388916015625, -4.23614501953125, -4.0833740234375, -3.93060302734375, -3.77783203125, -3.62506103515625, -3.4722900390625, -3.31951904296875, -3.166748046875, -3.01397705078125, -2.8612060546875, -2.70843505859375, -2.5556640625, -2.40289306640625, -2.2501220703125, -2.09735107421875, -1.944580078125, -1.79180908203125, -1.6390380859375, -1.48626708984375, -1.33349609375, -1.18072509765625, -1.0279541015625, -0.87518310546875, -0.722412109375, -0.56964111328125, -0.4168701171875, -0.26409912109375, -0.111328125, 0.04144287109375, 0.1942138671875, 0.34698486328125, 0.499755859375, 0.65252685546875, 0.8052978515625, 0.95806884765625, 1.11083984375, 1.26361083984375, 1.4163818359375, 1.56915283203125, 1.721923828125, 1.87469482421875, 2.0274658203125, 2.18023681640625, 2.3330078125, 2.48577880859375, 2.6385498046875, 2.79132080078125, 2.944091796875, 3.09686279296875, 3.2496337890625, 3.40240478515625, 3.55517578125, 3.70794677734375, 3.8607177734375, 4.01348876953125, 4.166259765625, 4.31903076171875, 4.4718017578125, 4.62457275390625, 4.77734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 5.0, 5.0, 11.0, 14.0, 36.0, 43.0, 77.0, 99.0, 171.0, 252.0, 420.0, 695.0, 1034.0, 1812.0, 2914.0, 5052.0, 8425.0, 14703.0, 25525.0, 45060.0, 1886276.0, 44430.0, 24836.0, 14405.0, 8434.0, 4842.0, 2869.0, 1773.0, 1074.0, 669.0, 408.0, 281.0, 171.0, 97.0, 75.0, 46.0, 21.0, 16.0, 14.0, 12.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.17474365234375, -2.1033935546875, -2.03204345703125, -1.960693359375, -1.88934326171875, -1.8179931640625, -1.74664306640625, -1.67529296875, -1.60394287109375, -1.5325927734375, -1.46124267578125, -1.389892578125, -1.31854248046875, -1.2471923828125, -1.17584228515625, -1.1044921875, -1.03314208984375, -0.9617919921875, -0.89044189453125, -0.819091796875, -0.74774169921875, -0.6763916015625, -0.60504150390625, -0.53369140625, -0.46234130859375, -0.3909912109375, -0.31964111328125, -0.248291015625, -0.17694091796875, -0.1055908203125, -0.03424072265625, 0.037109375, 0.10845947265625, 0.1798095703125, 0.25115966796875, 0.322509765625, 0.39385986328125, 0.4652099609375, 0.53656005859375, 0.60791015625, 0.67926025390625, 0.7506103515625, 0.82196044921875, 0.893310546875, 0.96466064453125, 1.0360107421875, 1.10736083984375, 1.1787109375, 1.25006103515625, 1.3214111328125, 1.39276123046875, 1.464111328125, 1.53546142578125, 1.6068115234375, 1.67816162109375, 1.74951171875, 1.82086181640625, 1.8922119140625, 1.96356201171875, 2.034912109375, 2.10626220703125, 2.1776123046875, 2.24896240234375, 2.3203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 5.0, 9.0, 10.0, 14.0, 17.0, 18.0, 28.0, 31.0, 50.0, 58.0, 61.0, 59.0, 59.0, 62.0, 72.0, 58.0, 61.0, 52.0, 52.0, 37.0, 35.0, 25.0, 28.0, 23.0, 10.0, 10.0, 11.0, 9.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.044921875, -0.04382038116455078, -0.04271888732910156, -0.041617393493652344, -0.040515899658203125, -0.039414405822753906, -0.03831291198730469, -0.03721141815185547, -0.03610992431640625, -0.03500843048095703, -0.03390693664550781, -0.032805442810058594, -0.031703948974609375, -0.030602455139160156, -0.029500961303710938, -0.02839946746826172, -0.0272979736328125, -0.02619647979736328, -0.025094985961914062, -0.023993492126464844, -0.022891998291015625, -0.021790504455566406, -0.020689010620117188, -0.01958751678466797, -0.01848602294921875, -0.01738452911376953, -0.016283035278320312, -0.015181541442871094, -0.014080047607421875, -0.012978553771972656, -0.011877059936523438, -0.010775566101074219, -0.009674072265625, -0.008572578430175781, -0.0074710845947265625, -0.006369590759277344, -0.005268096923828125, -0.004166603088378906, -0.0030651092529296875, -0.0019636154174804688, -0.00086212158203125, 0.00023937225341796875, 0.0013408660888671875, 0.0024423599243164062, 0.003543853759765625, 0.004645347595214844, 0.0057468414306640625, 0.006848335266113281, 0.0079498291015625, 0.009051322937011719, 0.010152816772460938, 0.011254310607910156, 0.012355804443359375, 0.013457298278808594, 0.014558792114257812, 0.01566028594970703, 0.01676177978515625, 0.01786327362060547, 0.018964767456054688, 0.020066261291503906, 0.021167755126953125, 0.022269248962402344, 0.023370742797851562, 0.02447223663330078, 0.02557373046875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 6.0, 11.0, 8.0, 17.0, 15.0, 22.0, 30.0, 34.0, 46.0, 70.0, 83.0, 135.0, 167.0, 293.0, 534.0, 1586.0, 758641.0, 284253.0, 1222.0, 468.0, 274.0, 193.0, 121.0, 85.0, 64.0, 41.0, 31.0, 21.0, 22.0, 14.0, 7.0, 3.0, 7.0, 9.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46826171875, -0.4478607177734375, -0.427459716796875, -0.4070587158203125, -0.38665771484375, -0.3662567138671875, -0.345855712890625, -0.3254547119140625, -0.3050537109375, -0.2846527099609375, -0.264251708984375, -0.2438507080078125, -0.22344970703125, -0.2030487060546875, -0.182647705078125, -0.1622467041015625, -0.141845703125, -0.1214447021484375, -0.101043701171875, -0.0806427001953125, -0.06024169921875, -0.0398406982421875, -0.019439697265625, 0.0009613037109375, 0.0213623046875, 0.0417633056640625, 0.062164306640625, 0.0825653076171875, 0.10296630859375, 0.1233673095703125, 0.143768310546875, 0.1641693115234375, 0.1845703125, 0.2049713134765625, 0.225372314453125, 0.2457733154296875, 0.26617431640625, 0.2865753173828125, 0.306976318359375, 0.3273773193359375, 0.3477783203125, 0.3681793212890625, 0.388580322265625, 0.4089813232421875, 0.42938232421875, 0.4497833251953125, 0.470184326171875, 0.4905853271484375, 0.510986328125, 0.5313873291015625, 0.551788330078125, 0.5721893310546875, 0.59259033203125, 0.6129913330078125, 0.633392333984375, 0.6537933349609375, 0.6741943359375, 0.6945953369140625, 0.714996337890625, 0.7353973388671875, 0.75579833984375, 0.7761993408203125, 0.796600341796875, 0.8170013427734375, 0.83740234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 47.0, 718.0, 219.0, 22.0], "bins": [-0.5567181706428528, -0.5477088689804077, -0.5386995673179626, -0.5296902656555176, -0.5206809639930725, -0.5116716623306274, -0.5026623606681824, -0.4936530590057373, -0.48464375734329224, -0.47563445568084717, -0.4666251540184021, -0.45761585235595703, -0.44860655069351196, -0.4395972490310669, -0.4305879473686218, -0.42157864570617676, -0.4125693440437317, -0.4035600423812866, -0.39455074071884155, -0.3855414390563965, -0.3765321373939514, -0.36752283573150635, -0.3585135340690613, -0.3495042324066162, -0.34049490094184875, -0.3314855992794037, -0.3224762976169586, -0.31346699595451355, -0.3044576942920685, -0.2954483926296234, -0.28643909096717834, -0.2774297893047333, -0.2684205174446106, -0.2594112157821655, -0.25040191411972046, -0.2413926124572754, -0.23238331079483032, -0.22337400913238525, -0.21436470746994019, -0.20535540580749512, -0.19634608924388885, -0.1873367875814438, -0.17832748591899872, -0.16931818425655365, -0.16030888259410858, -0.1512995809316635, -0.14229026436805725, -0.13328096270561218, -0.12427166849374771, -0.11526236683130264, -0.10625306516885757, -0.09724375605583191, -0.08823445439338684, -0.07922515273094177, -0.0702158510684967, -0.061206549406051636, -0.05219724774360657, -0.0431879460811615, -0.03417864441871643, -0.025169339030981064, -0.016160037368535995, -0.007150735706090927, 0.0018585696816444397, 0.010867871344089508, 0.019877171143889427]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 7.0, 11.0, 10.0, 12.0, 27.0, 16.0, 22.0, 20.0, 20.0, 25.0, 36.0, 34.0, 41.0, 29.0, 37.0, 41.0, 43.0, 51.0, 50.0, 48.0, 45.0, 43.0, 39.0, 39.0, 34.0, 27.0, 31.0, 31.0, 17.0, 16.0, 17.0, 17.0, 13.0, 9.0, 15.0, 5.0, 6.0, 1.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0532834529876709, -0.051585204899311066, -0.04988695681095123, -0.0481887124478817, -0.046490464359521866, -0.04479221627116203, -0.0430939719080925, -0.041395723819732666, -0.03969747573137283, -0.037999227643013, -0.03630097955465317, -0.03460273519158363, -0.0329044871032238, -0.031206239014863968, -0.029507992789149284, -0.0278097465634346, -0.026111498475074768, -0.024413250386714935, -0.022715004161000252, -0.021016757935285568, -0.019318509846925735, -0.017620261758565903, -0.01592201553285122, -0.014223768375813961, -0.012525521218776703, -0.010827274061739445, -0.009129026904702187, -0.0074307797476649284, -0.00573253259062767, -0.004034285433590412, -0.002336038276553154, -0.0006377911195158958, 0.0010604560375213623, 0.0027587031945586205, 0.004456950351595879, 0.006155197508633137, 0.007853444665670395, 0.009551691822707653, 0.011249938979744911, 0.01294818613678217, 0.014646433293819427, 0.01634468138217926, 0.018042927607893944, 0.019741173833608627, 0.02143942192196846, 0.023137670010328293, 0.024835916236042976, 0.02653416246175766, 0.028232410550117493, 0.029930658638477325, 0.03162890672683716, 0.03332715108990669, 0.035025399178266525, 0.03672364726662636, 0.03842189162969589, 0.040120139718055725, 0.04181838780641556, 0.04351663589477539, 0.04521488398313522, 0.04691312834620476, 0.04861137643456459, 0.05030962452292442, 0.05200786888599396, 0.05370611697435379, 0.05540436506271362]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 8.0, 6.0, 8.0, 11.0, 16.0, 16.0, 17.0, 16.0, 22.0, 20.0, 29.0, 42.0, 33.0, 33.0, 32.0, 45.0, 51.0, 39.0, 45.0, 41.0, 37.0, 57.0, 46.0, 34.0, 37.0, 30.0, 25.0, 23.0, 27.0, 19.0, 21.0, 21.0, 16.0, 16.0, 12.0, 9.0, 5.0, 4.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.72265625, -7.47320556640625, -7.2237548828125, -6.97430419921875, -6.724853515625, -6.47540283203125, -6.2259521484375, -5.97650146484375, -5.72705078125, -5.47760009765625, -5.2281494140625, -4.97869873046875, -4.729248046875, -4.47979736328125, -4.2303466796875, -3.98089599609375, -3.7314453125, -3.48199462890625, -3.2325439453125, -2.98309326171875, -2.733642578125, -2.48419189453125, -2.2347412109375, -1.98529052734375, -1.73583984375, -1.48638916015625, -1.2369384765625, -0.98748779296875, -0.738037109375, -0.48858642578125, -0.2391357421875, 0.01031494140625, 0.259765625, 0.50921630859375, 0.7586669921875, 1.00811767578125, 1.257568359375, 1.50701904296875, 1.7564697265625, 2.00592041015625, 2.25537109375, 2.50482177734375, 2.7542724609375, 3.00372314453125, 3.253173828125, 3.50262451171875, 3.7520751953125, 4.00152587890625, 4.2509765625, 4.50042724609375, 4.7498779296875, 4.99932861328125, 5.248779296875, 5.49822998046875, 5.7476806640625, 5.99713134765625, 6.24658203125, 6.49603271484375, 6.7454833984375, 6.99493408203125, 7.244384765625, 7.49383544921875, 7.7432861328125, 7.99273681640625, 8.2421875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 11.0, 14.0, 12.0, 18.0, 27.0, 23.0, 49.0, 51.0, 92.0, 114.0, 150.0, 263.0, 414.0, 784.0, 1481.0, 3279.0, 6916.0, 14685.0, 32535.0, 72684.0, 171084.0, 342842.0, 227952.0, 94717.0, 41838.0, 19184.0, 8703.0, 4138.0, 1967.0, 976.0, 532.0, 330.0, 208.0, 121.0, 100.0, 78.0, 35.0, 38.0, 27.0, 15.0, 14.0, 19.0, 13.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.5555419921875, -9.243896484375, -8.9322509765625, -8.62060546875, -8.3089599609375, -7.997314453125, -7.6856689453125, -7.3740234375, -7.0623779296875, -6.750732421875, -6.4390869140625, -6.12744140625, -5.8157958984375, -5.504150390625, -5.1925048828125, -4.880859375, -4.5692138671875, -4.257568359375, -3.9459228515625, -3.63427734375, -3.3226318359375, -3.010986328125, -2.6993408203125, -2.3876953125, -2.0760498046875, -1.764404296875, -1.4527587890625, -1.14111328125, -0.8294677734375, -0.517822265625, -0.2061767578125, 0.10546875, 0.4171142578125, 0.728759765625, 1.0404052734375, 1.35205078125, 1.6636962890625, 1.975341796875, 2.2869873046875, 2.5986328125, 2.9102783203125, 3.221923828125, 3.5335693359375, 3.84521484375, 4.1568603515625, 4.468505859375, 4.7801513671875, 5.091796875, 5.4034423828125, 5.715087890625, 6.0267333984375, 6.33837890625, 6.6500244140625, 6.961669921875, 7.2733154296875, 7.5849609375, 7.8966064453125, 8.208251953125, 8.5198974609375, 8.83154296875, 9.1431884765625, 9.454833984375, 9.7664794921875, 10.078125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 7.0, 10.0, 9.0, 15.0, 13.0, 13.0, 16.0, 16.0, 22.0, 18.0, 27.0, 30.0, 28.0, 36.0, 52.0, 43.0, 71.0, 138.0, 246.0, 1371.0, 240.0, 128.0, 74.0, 58.0, 45.0, 34.0, 40.0, 36.0, 31.0, 26.0, 30.0, 9.0, 11.0, 15.0, 10.0, 14.0, 10.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 9.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.627685546875, -16.08349609375, -15.539306640625, -14.9951171875, -14.450927734375, -13.90673828125, -13.362548828125, -12.818359375, -12.274169921875, -11.72998046875, -11.185791015625, -10.6416015625, -10.097412109375, -9.55322265625, -9.009033203125, -8.46484375, -7.920654296875, -7.37646484375, -6.832275390625, -6.2880859375, -5.743896484375, -5.19970703125, -4.655517578125, -4.111328125, -3.567138671875, -3.02294921875, -2.478759765625, -1.9345703125, -1.390380859375, -0.84619140625, -0.302001953125, 0.2421875, 0.786376953125, 1.33056640625, 1.874755859375, 2.4189453125, 2.963134765625, 3.50732421875, 4.051513671875, 4.595703125, 5.139892578125, 5.68408203125, 6.228271484375, 6.7724609375, 7.316650390625, 7.86083984375, 8.405029296875, 8.94921875, 9.493408203125, 10.03759765625, 10.581787109375, 11.1259765625, 11.670166015625, 12.21435546875, 12.758544921875, 13.302734375, 13.846923828125, 14.39111328125, 14.935302734375, 15.4794921875, 16.023681640625, 16.56787109375, 17.112060546875, 17.65625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 5.0, 4.0, 6.0, 4.0, 4.0, 6.0, 6.0, 8.0, 18.0, 15.0, 19.0, 21.0, 30.0, 56.0, 64.0, 101.0, 144.0, 219.0, 318.0, 525.0, 1049.0, 4998.0, 3042133.0, 92322.0, 1634.0, 703.0, 415.0, 268.0, 175.0, 124.0, 80.0, 60.0, 38.0, 21.0, 20.0, 18.0, 6.0, 11.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 10.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.75, -62.6435546875, -60.537109375, -58.4306640625, -56.32421875, -54.2177734375, -52.111328125, -50.0048828125, -47.8984375, -45.7919921875, -43.685546875, -41.5791015625, -39.47265625, -37.3662109375, -35.259765625, -33.1533203125, -31.046875, -28.9404296875, -26.833984375, -24.7275390625, -22.62109375, -20.5146484375, -18.408203125, -16.3017578125, -14.1953125, -12.0888671875, -9.982421875, -7.8759765625, -5.76953125, -3.6630859375, -1.556640625, 0.5498046875, 2.65625, 4.7626953125, 6.869140625, 8.9755859375, 11.08203125, 13.1884765625, 15.294921875, 17.4013671875, 19.5078125, 21.6142578125, 23.720703125, 25.8271484375, 27.93359375, 30.0400390625, 32.146484375, 34.2529296875, 36.359375, 38.4658203125, 40.572265625, 42.6787109375, 44.78515625, 46.8916015625, 48.998046875, 51.1044921875, 53.2109375, 55.3173828125, 57.423828125, 59.5302734375, 61.63671875, 63.7431640625, 65.849609375, 67.9560546875, 70.0625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 16.0, 60.0, 240.0, 396.0, 233.0, 59.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.53961181640625, -64.1181640625, -59.69672393798828, -55.27527618408203, -50.85383224487305, -46.43238830566406, -42.01094055175781, -37.58949661254883, -33.168052673339844, -28.74660873413086, -24.325162887573242, -19.903717041015625, -15.48227310180664, -11.060829162597656, -6.639383316040039, -2.217937469482422, 2.2035064697265625, 6.624951362609863, 11.046396255493164, 15.467841148376465, 19.889286041259766, 24.31072998046875, 28.732175827026367, 33.153621673583984, 37.57506561279297, 41.99650955200195, 46.41795349121094, 50.83940124511719, 55.26084518432617, 59.682289123535156, 64.1037368774414, 68.52517700195312, 72.94662475585938, 77.36807250976562, 81.78951263427734, 86.2109603881836, 90.63240051269531, 95.05384826660156, 99.47529602050781, 103.89674377441406, 108.31818389892578, 112.73963165283203, 117.16107177734375, 121.58251953125, 126.00396728515625, 130.4254150390625, 134.8468475341797, 139.26829528808594, 143.6897430419922, 148.11119079589844, 152.5326385498047, 156.95407104492188, 161.37551879882812, 165.79696655273438, 170.21841430664062, 174.63986206054688, 179.06130981445312, 183.48275756835938, 187.90420532226562, 192.3256378173828, 196.74708557128906, 201.1685333251953, 205.58998107910156, 210.0114288330078, 214.432861328125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 10.0, 9.0, 12.0, 12.0, 13.0, 21.0, 21.0, 20.0, 30.0, 30.0, 33.0, 27.0, 45.0, 33.0, 33.0, 32.0, 40.0, 43.0, 35.0, 50.0, 49.0, 35.0, 41.0, 30.0, 34.0, 36.0, 29.0, 30.0, 22.0, 17.0, 16.0, 12.0, 19.0, 12.0, 8.0, 12.0, 7.0, 6.0, 1.0, 6.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.08631134033203, -47.47657775878906, -45.866844177246094, -44.257110595703125, -42.647377014160156, -41.03764343261719, -39.42790985107422, -37.81817626953125, -36.20844268798828, -34.59870910644531, -32.988975524902344, -31.379241943359375, -29.769508361816406, -28.159774780273438, -26.55004119873047, -24.9403076171875, -23.33057403564453, -21.720840454101562, -20.111106872558594, -18.501373291015625, -16.891639709472656, -15.281906127929688, -13.672172546386719, -12.06243896484375, -10.452705383300781, -8.842971801757812, -7.233238220214844, -5.623504638671875, -4.013771057128906, -2.4040374755859375, -0.7943038940429688, 0.8154296875, 2.4251632690429688, 4.0348968505859375, 5.644630432128906, 7.254364013671875, 8.864097595214844, 10.473831176757812, 12.083564758300781, 13.69329833984375, 15.303031921386719, 16.912765502929688, 18.522499084472656, 20.132232666015625, 21.741966247558594, 23.351699829101562, 24.96143341064453, 26.5711669921875, 28.18090057373047, 29.790634155273438, 31.400367736816406, 33.010101318359375, 34.619834899902344, 36.22956848144531, 37.83930206298828, 39.44903564453125, 41.05876922607422, 42.66850280761719, 44.278236389160156, 45.887969970703125, 47.497703552246094, 49.10743713378906, 50.71717071533203, 52.326904296875, 53.93663787841797]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 6.0, 8.0, 11.0, 15.0, 8.0, 18.0, 27.0, 19.0, 34.0, 34.0, 40.0, 34.0, 36.0, 41.0, 44.0, 41.0, 49.0, 57.0, 44.0, 60.0, 46.0, 43.0, 40.0, 38.0, 35.0, 29.0, 20.0, 27.0, 19.0, 13.0, 19.0, 12.0, 10.0, 3.0, 4.0, 5.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.546875, -8.2547607421875, -7.962646484375, -7.6705322265625, -7.37841796875, -7.0863037109375, -6.794189453125, -6.5020751953125, -6.2099609375, -5.9178466796875, -5.625732421875, -5.3336181640625, -5.04150390625, -4.7493896484375, -4.457275390625, -4.1651611328125, -3.873046875, -3.5809326171875, -3.288818359375, -2.9967041015625, -2.70458984375, -2.4124755859375, -2.120361328125, -1.8282470703125, -1.5361328125, -1.2440185546875, -0.951904296875, -0.6597900390625, -0.36767578125, -0.0755615234375, 0.216552734375, 0.5086669921875, 0.80078125, 1.0928955078125, 1.385009765625, 1.6771240234375, 1.96923828125, 2.2613525390625, 2.553466796875, 2.8455810546875, 3.1376953125, 3.4298095703125, 3.721923828125, 4.0140380859375, 4.30615234375, 4.5982666015625, 4.890380859375, 5.1824951171875, 5.474609375, 5.7667236328125, 6.058837890625, 6.3509521484375, 6.64306640625, 6.9351806640625, 7.227294921875, 7.5194091796875, 7.8115234375, 8.1036376953125, 8.395751953125, 8.6878662109375, 8.97998046875, 9.2720947265625, 9.564208984375, 9.8563232421875, 10.1484375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 11.0, 14.0, 9.0, 20.0, 29.0, 39.0, 64.0, 111.0, 152.0, 243.0, 395.0, 640.0, 1115.0, 1840.0, 3398.0, 6499.0, 13294.0, 29857.0, 75526.0, 198703.0, 496881.0, 1067437.0, 1245544.0, 625186.0, 258541.0, 97018.0, 37865.0, 16385.0, 7855.0, 3980.0, 2261.0, 1228.0, 798.0, 466.0, 268.0, 206.0, 120.0, 78.0, 61.0, 39.0, 30.0, 19.0, 16.0, 6.0, 12.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.1640625, -7.9100341796875, -7.656005859375, -7.4019775390625, -7.14794921875, -6.8939208984375, -6.639892578125, -6.3858642578125, -6.1318359375, -5.8778076171875, -5.623779296875, -5.3697509765625, -5.11572265625, -4.8616943359375, -4.607666015625, -4.3536376953125, -4.099609375, -3.8455810546875, -3.591552734375, -3.3375244140625, -3.08349609375, -2.8294677734375, -2.575439453125, -2.3214111328125, -2.0673828125, -1.8133544921875, -1.559326171875, -1.3052978515625, -1.05126953125, -0.7972412109375, -0.543212890625, -0.2891845703125, -0.03515625, 0.2188720703125, 0.472900390625, 0.7269287109375, 0.98095703125, 1.2349853515625, 1.489013671875, 1.7430419921875, 1.9970703125, 2.2510986328125, 2.505126953125, 2.7591552734375, 3.01318359375, 3.2672119140625, 3.521240234375, 3.7752685546875, 4.029296875, 4.2833251953125, 4.537353515625, 4.7913818359375, 5.04541015625, 5.2994384765625, 5.553466796875, 5.8074951171875, 6.0615234375, 6.3155517578125, 6.569580078125, 6.8236083984375, 7.07763671875, 7.3316650390625, 7.585693359375, 7.8397216796875, 8.09375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 12.0, 15.0, 26.0, 21.0, 20.0, 39.0, 49.0, 66.0, 82.0, 126.0, 128.0, 202.0, 253.0, 349.0, 444.0, 491.0, 436.0, 323.0, 221.0, 186.0, 129.0, 116.0, 77.0, 64.0, 49.0, 33.0, 36.0, 20.0, 18.0, 10.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.6612548828125, -11.236572265625, -10.8118896484375, -10.38720703125, -9.9625244140625, -9.537841796875, -9.1131591796875, -8.6884765625, -8.2637939453125, -7.839111328125, -7.4144287109375, -6.98974609375, -6.5650634765625, -6.140380859375, -5.7156982421875, -5.291015625, -4.8663330078125, -4.441650390625, -4.0169677734375, -3.59228515625, -3.1676025390625, -2.742919921875, -2.3182373046875, -1.8935546875, -1.4688720703125, -1.044189453125, -0.6195068359375, -0.19482421875, 0.2298583984375, 0.654541015625, 1.0792236328125, 1.50390625, 1.9285888671875, 2.353271484375, 2.7779541015625, 3.20263671875, 3.6273193359375, 4.052001953125, 4.4766845703125, 4.9013671875, 5.3260498046875, 5.750732421875, 6.1754150390625, 6.60009765625, 7.0247802734375, 7.449462890625, 7.8741455078125, 8.298828125, 8.7235107421875, 9.148193359375, 9.5728759765625, 9.99755859375, 10.4222412109375, 10.846923828125, 11.2716064453125, 11.6962890625, 12.1209716796875, 12.545654296875, 12.9703369140625, 13.39501953125, 13.8197021484375, 14.244384765625, 14.6690673828125, 15.09375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 7.0, 13.0, 17.0, 27.0, 35.0, 56.0, 83.0, 105.0, 158.0, 269.0, 479.0, 933.0, 1861.0, 5433.0, 28579.0, 243618.0, 2167768.0, 1546332.0, 169399.0, 20998.0, 4488.0, 1639.0, 760.0, 456.0, 278.0, 161.0, 99.0, 65.0, 57.0, 35.0, 20.0, 21.0, 10.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.64990234375, -20.0029296875, -19.35595703125, -18.708984375, -18.06201171875, -17.4150390625, -16.76806640625, -16.12109375, -15.47412109375, -14.8271484375, -14.18017578125, -13.533203125, -12.88623046875, -12.2392578125, -11.59228515625, -10.9453125, -10.29833984375, -9.6513671875, -9.00439453125, -8.357421875, -7.71044921875, -7.0634765625, -6.41650390625, -5.76953125, -5.12255859375, -4.4755859375, -3.82861328125, -3.181640625, -2.53466796875, -1.8876953125, -1.24072265625, -0.59375, 0.05322265625, 0.7001953125, 1.34716796875, 1.994140625, 2.64111328125, 3.2880859375, 3.93505859375, 4.58203125, 5.22900390625, 5.8759765625, 6.52294921875, 7.169921875, 7.81689453125, 8.4638671875, 9.11083984375, 9.7578125, 10.40478515625, 11.0517578125, 11.69873046875, 12.345703125, 12.99267578125, 13.6396484375, 14.28662109375, 14.93359375, 15.58056640625, 16.2275390625, 16.87451171875, 17.521484375, 18.16845703125, 18.8154296875, 19.46240234375, 20.109375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 42.0, 246.0, 449.0, 228.0, 42.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.30906677246094, -136.50979614257812, -128.71054077148438, -120.91127014160156, -113.11201477050781, -105.312744140625, -97.51348114013672, -89.71421813964844, -81.91495513916016, -74.11569213867188, -66.3164291381836, -58.51716232299805, -50.717899322509766, -42.918636322021484, -35.11936950683594, -27.320106506347656, -19.520843505859375, -11.721579551696777, -3.9223155975341797, 3.8769493103027344, 11.676212310791016, 19.475475311279297, 27.274742126464844, 35.074005126953125, 42.873268127441406, 50.67253112792969, 58.47179412841797, 66.27105712890625, 74.07032775878906, 81.86958312988281, 89.66885375976562, 97.4681167602539, 105.26739501953125, 113.06665802001953, 120.86592102050781, 128.66519165039062, 136.46444702148438, 144.2637176513672, 152.06298828125, 159.86224365234375, 167.6614990234375, 175.4607696533203, 183.26002502441406, 191.05929565429688, 198.85855102539062, 206.65782165527344, 214.45709228515625, 222.25634765625, 230.0556182861328, 237.85488891601562, 245.65414428710938, 253.4534149169922, 261.252685546875, 269.05194091796875, 276.8511962890625, 284.65045166015625, 292.4497375488281, 300.2489929199219, 308.04827880859375, 315.8475341796875, 323.64678955078125, 331.446044921875, 339.2453308105469, 347.0445861816406, 354.8438415527344]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 4.0, 6.0, 6.0, 10.0, 11.0, 18.0, 19.0, 16.0, 24.0, 22.0, 29.0, 34.0, 44.0, 41.0, 43.0, 31.0, 48.0, 50.0, 47.0, 42.0, 51.0, 43.0, 55.0, 44.0, 34.0, 31.0, 28.0, 32.0, 18.0, 13.0, 20.0, 19.0, 12.0, 12.0, 11.0, 9.0, 4.0, 4.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-59.576290130615234, -57.73762893676758, -55.89896774291992, -54.06031036376953, -52.221649169921875, -50.38298797607422, -48.54432678222656, -46.705665588378906, -44.86700439453125, -43.028343200683594, -41.18968200683594, -39.35102081298828, -37.51236343383789, -35.673702239990234, -33.83504104614258, -31.996379852294922, -30.15772247314453, -28.319061279296875, -26.48040199279785, -24.641740798950195, -22.803081512451172, -20.964420318603516, -19.12575912475586, -17.287097930908203, -15.44843864440918, -13.60977840423584, -11.7711181640625, -9.932456970214844, -8.093796730041504, -6.255136489868164, -4.416475296020508, -2.577815055847168, -0.7391586303710938, 1.0995018482208252, 2.938162326812744, 4.776823043823242, 6.615483283996582, 8.454143524169922, 10.292804718017578, 12.131464958190918, 13.970125198364258, 15.808785438537598, 17.647445678710938, 19.486106872558594, 21.32476806640625, 23.163427352905273, 25.00208854675293, 26.840747833251953, 28.67940902709961, 30.518070220947266, 32.35673141479492, 34.19538879394531, 36.03404998779297, 37.872711181640625, 39.71137237548828, 41.55003356933594, 43.388694763183594, 45.22735595703125, 47.066017150878906, 48.90467834472656, 50.74333572387695, 52.58199691772461, 54.420658111572266, 56.25931930541992, 58.09797668457031]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 2.0, 8.0, 5.0, 11.0, 15.0, 23.0, 19.0, 20.0, 16.0, 24.0, 29.0, 27.0, 49.0, 44.0, 59.0, 42.0, 45.0, 49.0, 50.0, 35.0, 37.0, 50.0, 41.0, 45.0, 34.0, 27.0, 29.0, 20.0, 22.0, 29.0, 15.0, 14.0, 14.0, 13.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.828125, -7.587646484375, -7.34716796875, -7.106689453125, -6.8662109375, -6.625732421875, -6.38525390625, -6.144775390625, -5.904296875, -5.663818359375, -5.42333984375, -5.182861328125, -4.9423828125, -4.701904296875, -4.46142578125, -4.220947265625, -3.98046875, -3.739990234375, -3.49951171875, -3.259033203125, -3.0185546875, -2.778076171875, -2.53759765625, -2.297119140625, -2.056640625, -1.816162109375, -1.57568359375, -1.335205078125, -1.0947265625, -0.854248046875, -0.61376953125, -0.373291015625, -0.1328125, 0.107666015625, 0.34814453125, 0.588623046875, 0.8291015625, 1.069580078125, 1.31005859375, 1.550537109375, 1.791015625, 2.031494140625, 2.27197265625, 2.512451171875, 2.7529296875, 2.993408203125, 3.23388671875, 3.474365234375, 3.71484375, 3.955322265625, 4.19580078125, 4.436279296875, 4.6767578125, 4.917236328125, 5.15771484375, 5.398193359375, 5.638671875, 5.879150390625, 6.11962890625, 6.360107421875, 6.6005859375, 6.841064453125, 7.08154296875, 7.322021484375, 7.5625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 11.0, 14.0, 18.0, 39.0, 51.0, 77.0, 123.0, 185.0, 330.0, 482.0, 796.0, 1212.0, 1995.0, 3129.0, 5079.0, 7730.0, 12363.0, 18947.0, 28806.0, 41577.0, 59406.0, 81060.0, 102768.0, 120599.0, 125155.0, 114608.0, 94611.0, 71588.0, 51960.0, 35816.0, 24194.0, 15683.0, 10254.0, 6578.0, 4069.0, 2685.0, 1690.0, 1032.0, 688.0, 421.0, 295.0, 166.0, 115.0, 57.0, 33.0, 21.0, 24.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68603515625, -0.6641159057617188, -0.6421966552734375, -0.6202774047851562, -0.598358154296875, -0.5764389038085938, -0.5545196533203125, -0.5326004028320312, -0.51068115234375, -0.48876190185546875, -0.4668426513671875, -0.44492340087890625, -0.423004150390625, -0.40108489990234375, -0.3791656494140625, -0.35724639892578125, -0.3353271484375, -0.31340789794921875, -0.2914886474609375, -0.26956939697265625, -0.247650146484375, -0.22573089599609375, -0.2038116455078125, -0.18189239501953125, -0.15997314453125, -0.13805389404296875, -0.1161346435546875, -0.09421539306640625, -0.072296142578125, -0.05037689208984375, -0.0284576416015625, -0.00653839111328125, 0.015380859375, 0.03730010986328125, 0.0592193603515625, 0.08113861083984375, 0.103057861328125, 0.12497711181640625, 0.1468963623046875, 0.16881561279296875, 0.19073486328125, 0.21265411376953125, 0.2345733642578125, 0.25649261474609375, 0.278411865234375, 0.30033111572265625, 0.3222503662109375, 0.34416961669921875, 0.3660888671875, 0.38800811767578125, 0.4099273681640625, 0.43184661865234375, 0.453765869140625, 0.47568511962890625, 0.4976043701171875, 0.5195236206054688, 0.54144287109375, 0.5633621215820312, 0.5852813720703125, 0.6072006225585938, 0.629119873046875, 0.6510391235351562, 0.6729583740234375, 0.6948776245117188, 0.716796875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 1.0, 7.0, 5.0, 13.0, 9.0, 13.0, 12.0, 17.0, 18.0, 32.0, 24.0, 27.0, 24.0, 27.0, 31.0, 34.0, 51.0, 37.0, 45.0, 33.0, 43.0, 1054.0, 49.0, 35.0, 30.0, 43.0, 40.0, 41.0, 41.0, 34.0, 23.0, 19.0, 13.0, 19.0, 17.0, 9.0, 12.0, 13.0, 7.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.570556640625, -4.41455078125, -4.258544921875, -4.1025390625, -3.946533203125, -3.79052734375, -3.634521484375, -3.478515625, -3.322509765625, -3.16650390625, -3.010498046875, -2.8544921875, -2.698486328125, -2.54248046875, -2.386474609375, -2.23046875, -2.074462890625, -1.91845703125, -1.762451171875, -1.6064453125, -1.450439453125, -1.29443359375, -1.138427734375, -0.982421875, -0.826416015625, -0.67041015625, -0.514404296875, -0.3583984375, -0.202392578125, -0.04638671875, 0.109619140625, 0.265625, 0.421630859375, 0.57763671875, 0.733642578125, 0.8896484375, 1.045654296875, 1.20166015625, 1.357666015625, 1.513671875, 1.669677734375, 1.82568359375, 1.981689453125, 2.1376953125, 2.293701171875, 2.44970703125, 2.605712890625, 2.76171875, 2.917724609375, 3.07373046875, 3.229736328125, 3.3857421875, 3.541748046875, 3.69775390625, 3.853759765625, 4.009765625, 4.165771484375, 4.32177734375, 4.477783203125, 4.6337890625, 4.789794921875, 4.94580078125, 5.101806640625, 5.2578125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 1.0, 4.0, 10.0, 8.0, 10.0, 25.0, 28.0, 29.0, 58.0, 92.0, 127.0, 208.0, 367.0, 538.0, 865.0, 1441.0, 2279.0, 3711.0, 6402.0, 10527.0, 17467.0, 28820.0, 53395.0, 1876720.0, 37643.0, 22373.0, 13464.0, 7901.0, 4876.0, 2914.0, 1774.0, 1111.0, 703.0, 433.0, 280.0, 174.0, 117.0, 79.0, 54.0, 23.0, 22.0, 14.0, 15.0, 8.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8740234375, -1.817657470703125, -1.76129150390625, -1.704925537109375, -1.6485595703125, -1.592193603515625, -1.53582763671875, -1.479461669921875, -1.423095703125, -1.366729736328125, -1.31036376953125, -1.253997802734375, -1.1976318359375, -1.141265869140625, -1.08489990234375, -1.028533935546875, -0.97216796875, -0.915802001953125, -0.85943603515625, -0.803070068359375, -0.7467041015625, -0.690338134765625, -0.63397216796875, -0.577606201171875, -0.521240234375, -0.464874267578125, -0.40850830078125, -0.352142333984375, -0.2957763671875, -0.239410400390625, -0.18304443359375, -0.126678466796875, -0.0703125, -0.013946533203125, 0.04241943359375, 0.098785400390625, 0.1551513671875, 0.211517333984375, 0.26788330078125, 0.324249267578125, 0.380615234375, 0.436981201171875, 0.49334716796875, 0.549713134765625, 0.6060791015625, 0.662445068359375, 0.71881103515625, 0.775177001953125, 0.83154296875, 0.887908935546875, 0.94427490234375, 1.000640869140625, 1.0570068359375, 1.113372802734375, 1.16973876953125, 1.226104736328125, 1.282470703125, 1.338836669921875, 1.39520263671875, 1.451568603515625, 1.5079345703125, 1.564300537109375, 1.62066650390625, 1.677032470703125, 1.7333984375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 7.0, 18.0, 15.0, 17.0, 13.0, 19.0, 21.0, 31.0, 38.0, 30.0, 42.0, 56.0, 58.0, 58.0, 72.0, 67.0, 71.0, 33.0, 43.0, 38.0, 43.0, 27.0, 28.0, 23.0, 23.0, 17.0, 13.0, 13.0, 5.0, 7.0, 6.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208892822265625, -0.020151615142822266, -0.01941394805908203, -0.018676280975341797, -0.017938613891601562, -0.017200946807861328, -0.016463279724121094, -0.01572561264038086, -0.014987945556640625, -0.01425027847290039, -0.013512611389160156, -0.012774944305419922, -0.012037277221679688, -0.011299610137939453, -0.010561943054199219, -0.009824275970458984, -0.00908660888671875, -0.008348941802978516, -0.007611274719238281, -0.006873607635498047, -0.0061359405517578125, -0.005398273468017578, -0.004660606384277344, -0.003922939300537109, -0.003185272216796875, -0.0024476051330566406, -0.0017099380493164062, -0.0009722709655761719, -0.0002346038818359375, 0.0005030632019042969, 0.0012407302856445312, 0.0019783973693847656, 0.002716064453125, 0.0034537315368652344, 0.004191398620605469, 0.004929065704345703, 0.0056667327880859375, 0.006404399871826172, 0.007142066955566406, 0.00787973403930664, 0.008617401123046875, 0.00935506820678711, 0.010092735290527344, 0.010830402374267578, 0.011568069458007812, 0.012305736541748047, 0.013043403625488281, 0.013781070709228516, 0.01451873779296875, 0.015256404876708984, 0.01599407196044922, 0.016731739044189453, 0.017469406127929688, 0.018207073211669922, 0.018944740295410156, 0.01968240737915039, 0.020420074462890625, 0.02115774154663086, 0.021895408630371094, 0.022633075714111328, 0.023370742797851562, 0.024108409881591797, 0.02484607696533203, 0.025583744049072266, 0.0263214111328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 11.0, 8.0, 7.0, 10.0, 8.0, 21.0, 27.0, 28.0, 33.0, 48.0, 60.0, 61.0, 112.0, 149.0, 200.0, 289.0, 524.0, 1062.0, 201150.0, 841832.0, 1254.0, 522.0, 340.0, 213.0, 156.0, 92.0, 71.0, 53.0, 30.0, 42.0, 30.0, 21.0, 17.0, 14.0, 12.0, 10.0, 8.0, 7.0, 4.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.487060546875, -0.473175048828125, -0.45928955078125, -0.445404052734375, -0.4315185546875, -0.417633056640625, -0.40374755859375, -0.389862060546875, -0.3759765625, -0.362091064453125, -0.34820556640625, -0.334320068359375, -0.3204345703125, -0.306549072265625, -0.29266357421875, -0.278778076171875, -0.264892578125, -0.251007080078125, -0.23712158203125, -0.223236083984375, -0.2093505859375, -0.195465087890625, -0.18157958984375, -0.167694091796875, -0.15380859375, -0.139923095703125, -0.12603759765625, -0.112152099609375, -0.0982666015625, -0.084381103515625, -0.07049560546875, -0.056610107421875, -0.042724609375, -0.028839111328125, -0.01495361328125, -0.001068115234375, 0.0128173828125, 0.026702880859375, 0.04058837890625, 0.054473876953125, 0.068359375, 0.082244873046875, 0.09613037109375, 0.110015869140625, 0.1239013671875, 0.137786865234375, 0.15167236328125, 0.165557861328125, 0.179443359375, 0.193328857421875, 0.20721435546875, 0.221099853515625, 0.2349853515625, 0.248870849609375, 0.26275634765625, 0.276641845703125, 0.29052734375, 0.304412841796875, 0.31829833984375, 0.332183837890625, 0.3460693359375, 0.359954833984375, 0.37384033203125, 0.387725830078125, 0.401611328125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 951.0, 53.0], "bins": [-0.7828263640403748, -0.7703506946563721, -0.7578750252723694, -0.7453993558883667, -0.732923686504364, -0.7204480171203613, -0.7079723477363586, -0.695496678352356, -0.6830210089683533, -0.6705453395843506, -0.6580696702003479, -0.6455940008163452, -0.6331183314323425, -0.6206426620483398, -0.6081669926643372, -0.5956913232803345, -0.5832157135009766, -0.5707400441169739, -0.5582643747329712, -0.5457887053489685, -0.5333130359649658, -0.5208373665809631, -0.5083616971969604, -0.49588602781295776, -0.4834103584289551, -0.4709346890449524, -0.4584590196609497, -0.445983350276947, -0.43350768089294434, -0.42103201150894165, -0.40855634212493896, -0.3960806727409363, -0.3836049735546112, -0.3711293041706085, -0.35865363478660583, -0.34617796540260315, -0.33370229601860046, -0.3212266266345978, -0.3087509870529175, -0.2962753176689148, -0.2837996482849121, -0.2713239789009094, -0.25884830951690674, -0.24637264013290405, -0.23389697074890137, -0.22142130136489868, -0.2089456468820572, -0.1964699774980545, -0.18399429321289062, -0.17151862382888794, -0.15904295444488525, -0.14656728506088257, -0.13409161567687988, -0.1216159537434578, -0.1091402918100357, -0.09666462242603302, -0.08418895304203033, -0.07171328365802765, -0.05923761799931526, -0.046761952340602875, -0.03428628295660019, -0.021810613572597504, -0.009334951639175415, 0.0031407177448272705, 0.015616384334862232]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 1.0, 9.0, 13.0, 15.0, 21.0, 13.0, 23.0, 31.0, 33.0, 29.0, 37.0, 44.0, 37.0, 45.0, 44.0, 51.0, 45.0, 46.0, 54.0, 51.0, 39.0, 45.0, 43.0, 31.0, 26.0, 35.0, 22.0, 25.0, 16.0, 19.0, 16.0, 11.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042565882205963135, -0.04116690531373024, -0.039767928421497345, -0.03836895152926445, -0.036969974637031555, -0.03557099774479866, -0.034172020852565765, -0.03277304396033287, -0.031374067068099976, -0.02997509017586708, -0.028576113283634186, -0.02717713639140129, -0.025778159499168396, -0.0243791826069355, -0.022980205714702606, -0.02158122882246971, -0.020182251930236816, -0.01878327503800392, -0.017384298145771027, -0.01598532125353813, -0.014586344361305237, -0.013187367469072342, -0.011788390576839447, -0.010389413684606552, -0.008990436792373657, -0.007591459900140762, -0.006192483007907867, -0.0047935061156749725, -0.0033945292234420776, -0.0019955523312091827, -0.0005965754389762878, 0.0008024014532566071, 0.002201378345489502, 0.003600355237722397, 0.004999332129955292, 0.006398309022188187, 0.0077972859144210815, 0.009196262806653976, 0.010595239698886871, 0.011994216591119766, 0.013393193483352661, 0.014792170375585556, 0.01619114726781845, 0.017590124160051346, 0.01898910105228424, 0.020388077944517136, 0.02178705483675003, 0.023186031728982925, 0.02458500862121582, 0.025983985513448715, 0.02738296240568161, 0.028781939297914505, 0.0301809161901474, 0.031579893082380295, 0.03297886997461319, 0.034377846866846085, 0.03577682375907898, 0.037175800651311874, 0.03857477754354477, 0.039973754435777664, 0.04137273132801056, 0.042771708220243454, 0.04417068511247635, 0.045569662004709244, 0.04696863889694214]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 6.0, 8.0, 14.0, 13.0, 11.0, 14.0, 16.0, 24.0, 20.0, 37.0, 29.0, 43.0, 30.0, 47.0, 45.0, 45.0, 57.0, 38.0, 55.0, 38.0, 46.0, 41.0, 38.0, 31.0, 30.0, 25.0, 28.0, 24.0, 24.0, 19.0, 22.0, 16.0, 18.0, 7.0, 6.0, 9.0, 4.0, 6.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.40625, -7.1748046875, -6.943359375, -6.7119140625, -6.48046875, -6.2490234375, -6.017578125, -5.7861328125, -5.5546875, -5.3232421875, -5.091796875, -4.8603515625, -4.62890625, -4.3974609375, -4.166015625, -3.9345703125, -3.703125, -3.4716796875, -3.240234375, -3.0087890625, -2.77734375, -2.5458984375, -2.314453125, -2.0830078125, -1.8515625, -1.6201171875, -1.388671875, -1.1572265625, -0.92578125, -0.6943359375, -0.462890625, -0.2314453125, 0.0, 0.2314453125, 0.462890625, 0.6943359375, 0.92578125, 1.1572265625, 1.388671875, 1.6201171875, 1.8515625, 2.0830078125, 2.314453125, 2.5458984375, 2.77734375, 3.0087890625, 3.240234375, 3.4716796875, 3.703125, 3.9345703125, 4.166015625, 4.3974609375, 4.62890625, 4.8603515625, 5.091796875, 5.3232421875, 5.5546875, 5.7861328125, 6.017578125, 6.2490234375, 6.48046875, 6.7119140625, 6.943359375, 7.1748046875, 7.40625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 11.0, 13.0, 24.0, 22.0, 38.0, 48.0, 79.0, 97.0, 159.0, 202.0, 266.0, 434.0, 628.0, 1070.0, 1890.0, 4298.0, 10714.0, 30622.0, 99946.0, 386709.0, 367585.0, 95160.0, 29132.0, 10332.0, 4103.0, 1871.0, 1091.0, 630.0, 391.0, 294.0, 202.0, 140.0, 104.0, 60.0, 46.0, 40.0, 29.0, 20.0, 11.0, 11.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.98046875, -10.6015625, -10.22265625, -9.84375, -9.46484375, -9.0859375, -8.70703125, -8.328125, -7.94921875, -7.5703125, -7.19140625, -6.8125, -6.43359375, -6.0546875, -5.67578125, -5.296875, -4.91796875, -4.5390625, -4.16015625, -3.78125, -3.40234375, -3.0234375, -2.64453125, -2.265625, -1.88671875, -1.5078125, -1.12890625, -0.75, -0.37109375, 0.0078125, 0.38671875, 0.765625, 1.14453125, 1.5234375, 1.90234375, 2.28125, 2.66015625, 3.0390625, 3.41796875, 3.796875, 4.17578125, 4.5546875, 4.93359375, 5.3125, 5.69140625, 6.0703125, 6.44921875, 6.828125, 7.20703125, 7.5859375, 7.96484375, 8.34375, 8.72265625, 9.1015625, 9.48046875, 9.859375, 10.23828125, 10.6171875, 10.99609375, 11.375, 11.75390625, 12.1328125, 12.51171875, 12.890625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 10.0, 5.0, 11.0, 8.0, 11.0, 14.0, 15.0, 9.0, 21.0, 27.0, 33.0, 43.0, 42.0, 48.0, 74.0, 115.0, 202.0, 1410.0, 288.0, 177.0, 98.0, 68.0, 53.0, 46.0, 33.0, 36.0, 25.0, 23.0, 20.0, 16.0, 9.0, 16.0, 11.0, 7.0, 6.0, 5.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3046875, -14.7725830078125, -14.240478515625, -13.7083740234375, -13.17626953125, -12.6441650390625, -12.112060546875, -11.5799560546875, -11.0478515625, -10.5157470703125, -9.983642578125, -9.4515380859375, -8.91943359375, -8.3873291015625, -7.855224609375, -7.3231201171875, -6.791015625, -6.2589111328125, -5.726806640625, -5.1947021484375, -4.66259765625, -4.1304931640625, -3.598388671875, -3.0662841796875, -2.5341796875, -2.0020751953125, -1.469970703125, -0.9378662109375, -0.40576171875, 0.1263427734375, 0.658447265625, 1.1905517578125, 1.72265625, 2.2547607421875, 2.786865234375, 3.3189697265625, 3.85107421875, 4.3831787109375, 4.915283203125, 5.4473876953125, 5.9794921875, 6.5115966796875, 7.043701171875, 7.5758056640625, 8.10791015625, 8.6400146484375, 9.172119140625, 9.7042236328125, 10.236328125, 10.7684326171875, 11.300537109375, 11.8326416015625, 12.36474609375, 12.8968505859375, 13.428955078125, 13.9610595703125, 14.4931640625, 15.0252685546875, 15.557373046875, 16.0894775390625, 16.62158203125, 17.1536865234375, 17.685791015625, 18.2178955078125, 18.75]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 14.0, 16.0, 19.0, 23.0, 31.0, 49.0, 47.0, 95.0, 147.0, 204.0, 347.0, 591.0, 1178.0, 6880.0, 3090739.0, 41761.0, 1643.0, 710.0, 411.0, 249.0, 164.0, 117.0, 73.0, 41.0, 31.0, 25.0, 27.0, 10.0, 14.0, 6.0, 5.0, 3.0, 4.0, 1.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.8125, -46.083984375, -44.35546875, -42.626953125, -40.8984375, -39.169921875, -37.44140625, -35.712890625, -33.984375, -32.255859375, -30.52734375, -28.798828125, -27.0703125, -25.341796875, -23.61328125, -21.884765625, -20.15625, -18.427734375, -16.69921875, -14.970703125, -13.2421875, -11.513671875, -9.78515625, -8.056640625, -6.328125, -4.599609375, -2.87109375, -1.142578125, 0.5859375, 2.314453125, 4.04296875, 5.771484375, 7.5, 9.228515625, 10.95703125, 12.685546875, 14.4140625, 16.142578125, 17.87109375, 19.599609375, 21.328125, 23.056640625, 24.78515625, 26.513671875, 28.2421875, 29.970703125, 31.69921875, 33.427734375, 35.15625, 36.884765625, 38.61328125, 40.341796875, 42.0703125, 43.798828125, 45.52734375, 47.255859375, 48.984375, 50.712890625, 52.44140625, 54.169921875, 55.8984375, 57.626953125, 59.35546875, 61.083984375, 62.8125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 15.0, 42.0, 121.0, 283.0, 307.0, 162.0, 64.0, 16.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.35564422607422, -92.37616729736328, -88.39669036865234, -84.4172134399414, -80.43773651123047, -76.45825958251953, -72.47877502441406, -68.49929809570312, -64.51982116699219, -60.54034423828125, -56.56086730957031, -52.581390380859375, -48.60191345214844, -44.6224365234375, -40.6429557800293, -36.66347885131836, -32.68400573730469, -28.70452880859375, -24.725051879882812, -20.745573043823242, -16.766096115112305, -12.786619186401367, -8.807140350341797, -4.827663421630859, -0.8481864929199219, 3.131290912628174, 7.1107683181762695, 11.090246200561523, 15.069723129272461, 19.0492000579834, 23.02867889404297, 27.008155822753906, 30.987640380859375, 34.96711730957031, 38.94659423828125, 42.92607116699219, 46.905548095703125, 50.88502502441406, 54.864505767822266, 58.8439826965332, 62.82345962524414, 66.80294036865234, 70.78241729736328, 74.76189422607422, 78.74137115478516, 82.7208480834961, 86.70032501220703, 90.67980194091797, 94.6592788696289, 98.63875579833984, 102.61823272705078, 106.59770965576172, 110.57718658447266, 114.5566635131836, 118.53614807128906, 122.515625, 126.49510192871094, 130.47457885742188, 134.4540557861328, 138.43353271484375, 142.4130096435547, 146.39248657226562, 150.37196350097656, 154.3514404296875, 158.33091735839844]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 4.0, 10.0, 7.0, 12.0, 16.0, 17.0, 15.0, 17.0, 32.0, 32.0, 33.0, 36.0, 24.0, 32.0, 39.0, 36.0, 38.0, 35.0, 49.0, 32.0, 51.0, 42.0, 36.0, 30.0, 41.0, 32.0, 23.0, 28.0, 32.0, 29.0, 14.0, 20.0, 18.0, 16.0, 14.0, 10.0, 4.0, 8.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-53.585548400878906, -52.10537338256836, -50.62519836425781, -49.14501953125, -47.66484451293945, -46.184669494628906, -44.70449447631836, -43.22431945800781, -41.744144439697266, -40.26396942138672, -38.78379440307617, -37.303619384765625, -35.82344055175781, -34.343265533447266, -32.86309051513672, -31.382915496826172, -29.902738571166992, -28.422563552856445, -26.942386627197266, -25.46221160888672, -23.982036590576172, -22.501861572265625, -21.021684646606445, -19.5415096282959, -18.06133270263672, -16.581157684326172, -15.100981712341309, -13.620805740356445, -12.140630722045898, -10.660454750061035, -9.180278778076172, -7.700103759765625, -6.219928741455078, -4.739753246307373, -3.259577512741089, -1.7794017791748047, -0.2992262840270996, 1.1809492111206055, 2.6611251831054688, 4.141300201416016, 5.621476173400879, 7.101651668548584, 8.581827163696289, 10.062003135681152, 11.542179107666016, 13.022354125976562, 14.502530097961426, 15.982705116271973, 17.462881088256836, 18.943056106567383, 20.423233032226562, 21.90340805053711, 23.383583068847656, 24.863758087158203, 26.343935012817383, 27.82411003112793, 29.30428695678711, 30.784461975097656, 32.2646369934082, 33.74481201171875, 35.22499084472656, 36.70516586303711, 38.185340881347656, 39.6655158996582, 41.14569091796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 11.0, 11.0, 14.0, 17.0, 9.0, 29.0, 20.0, 16.0, 25.0, 28.0, 47.0, 41.0, 37.0, 42.0, 59.0, 52.0, 47.0, 43.0, 42.0, 42.0, 36.0, 33.0, 24.0, 36.0, 29.0, 24.0, 24.0, 20.0, 27.0, 19.0, 14.0, 18.0, 14.0, 9.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1328125, -6.8868408203125, -6.640869140625, -6.3948974609375, -6.14892578125, -5.9029541015625, -5.656982421875, -5.4110107421875, -5.1650390625, -4.9190673828125, -4.673095703125, -4.4271240234375, -4.18115234375, -3.9351806640625, -3.689208984375, -3.4432373046875, -3.197265625, -2.9512939453125, -2.705322265625, -2.4593505859375, -2.21337890625, -1.9674072265625, -1.721435546875, -1.4754638671875, -1.2294921875, -0.9835205078125, -0.737548828125, -0.4915771484375, -0.24560546875, 0.0003662109375, 0.246337890625, 0.4923095703125, 0.73828125, 0.9842529296875, 1.230224609375, 1.4761962890625, 1.72216796875, 1.9681396484375, 2.214111328125, 2.4600830078125, 2.7060546875, 2.9520263671875, 3.197998046875, 3.4439697265625, 3.68994140625, 3.9359130859375, 4.181884765625, 4.4278564453125, 4.673828125, 4.9197998046875, 5.165771484375, 5.4117431640625, 5.65771484375, 5.9036865234375, 6.149658203125, 6.3956298828125, 6.6416015625, 6.8875732421875, 7.133544921875, 7.3795166015625, 7.62548828125, 7.8714599609375, 8.117431640625, 8.3634033203125, 8.609375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 12.0, 10.0, 17.0, 33.0, 58.0, 110.0, 195.0, 422.0, 761.0, 1519.0, 3315.0, 7966.0, 24303.0, 127864.0, 883549.0, 2262698.0, 741292.0, 105061.0, 21979.0, 7248.0, 3032.0, 1429.0, 660.0, 348.0, 175.0, 107.0, 62.0, 29.0, 20.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.90625, -14.4468994140625, -13.987548828125, -13.5281982421875, -13.06884765625, -12.6094970703125, -12.150146484375, -11.6907958984375, -11.2314453125, -10.7720947265625, -10.312744140625, -9.8533935546875, -9.39404296875, -8.9346923828125, -8.475341796875, -8.0159912109375, -7.556640625, -7.0972900390625, -6.637939453125, -6.1785888671875, -5.71923828125, -5.2598876953125, -4.800537109375, -4.3411865234375, -3.8818359375, -3.4224853515625, -2.963134765625, -2.5037841796875, -2.04443359375, -1.5850830078125, -1.125732421875, -0.6663818359375, -0.20703125, 0.2523193359375, 0.711669921875, 1.1710205078125, 1.63037109375, 2.0897216796875, 2.549072265625, 3.0084228515625, 3.4677734375, 3.9271240234375, 4.386474609375, 4.8458251953125, 5.30517578125, 5.7645263671875, 6.223876953125, 6.6832275390625, 7.142578125, 7.6019287109375, 8.061279296875, 8.5206298828125, 8.97998046875, 9.4393310546875, 9.898681640625, 10.3580322265625, 10.8173828125, 11.2767333984375, 11.736083984375, 12.1954345703125, 12.65478515625, 13.1141357421875, 13.573486328125, 14.0328369140625, 14.4921875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 13.0, 10.0, 16.0, 19.0, 35.0, 58.0, 70.0, 74.0, 115.0, 149.0, 169.0, 220.0, 269.0, 368.0, 405.0, 404.0, 366.0, 298.0, 266.0, 190.0, 152.0, 94.0, 85.0, 61.0, 45.0, 33.0, 21.0, 16.0, 14.0, 7.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5, -11.1434326171875, -10.786865234375, -10.4302978515625, -10.07373046875, -9.7171630859375, -9.360595703125, -9.0040283203125, -8.6474609375, -8.2908935546875, -7.934326171875, -7.5777587890625, -7.22119140625, -6.8646240234375, -6.508056640625, -6.1514892578125, -5.794921875, -5.4383544921875, -5.081787109375, -4.7252197265625, -4.36865234375, -4.0120849609375, -3.655517578125, -3.2989501953125, -2.9423828125, -2.5858154296875, -2.229248046875, -1.8726806640625, -1.51611328125, -1.1595458984375, -0.802978515625, -0.4464111328125, -0.08984375, 0.2667236328125, 0.623291015625, 0.9798583984375, 1.33642578125, 1.6929931640625, 2.049560546875, 2.4061279296875, 2.7626953125, 3.1192626953125, 3.475830078125, 3.8323974609375, 4.18896484375, 4.5455322265625, 4.902099609375, 5.2586669921875, 5.615234375, 5.9718017578125, 6.328369140625, 6.6849365234375, 7.04150390625, 7.3980712890625, 7.754638671875, 8.1112060546875, 8.4677734375, 8.8243408203125, 9.180908203125, 9.5374755859375, 9.89404296875, 10.2506103515625, 10.607177734375, 10.9637451171875, 11.3203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 4.0, 9.0, 13.0, 16.0, 15.0, 29.0, 42.0, 50.0, 77.0, 116.0, 178.0, 278.0, 539.0, 1043.0, 2409.0, 7364.0, 56081.0, 1340281.0, 2640659.0, 127531.0, 11350.0, 3217.0, 1276.0, 651.0, 347.0, 228.0, 130.0, 91.0, 70.0, 50.0, 46.0, 22.0, 18.0, 11.0, 7.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.609375, -20.892333984375, -20.17529296875, -19.458251953125, -18.7412109375, -18.024169921875, -17.30712890625, -16.590087890625, -15.873046875, -15.156005859375, -14.43896484375, -13.721923828125, -13.0048828125, -12.287841796875, -11.57080078125, -10.853759765625, -10.13671875, -9.419677734375, -8.70263671875, -7.985595703125, -7.2685546875, -6.551513671875, -5.83447265625, -5.117431640625, -4.400390625, -3.683349609375, -2.96630859375, -2.249267578125, -1.5322265625, -0.815185546875, -0.09814453125, 0.618896484375, 1.3359375, 2.052978515625, 2.77001953125, 3.487060546875, 4.2041015625, 4.921142578125, 5.63818359375, 6.355224609375, 7.072265625, 7.789306640625, 8.50634765625, 9.223388671875, 9.9404296875, 10.657470703125, 11.37451171875, 12.091552734375, 12.80859375, 13.525634765625, 14.24267578125, 14.959716796875, 15.6767578125, 16.393798828125, 17.11083984375, 17.827880859375, 18.544921875, 19.261962890625, 19.97900390625, 20.696044921875, 21.4130859375, 22.130126953125, 22.84716796875, 23.564208984375, 24.28125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 70.0, 415.0, 422.0, 93.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-425.3759460449219, -416.69317626953125, -408.0104064941406, -399.3276062011719, -390.64483642578125, -381.9620666503906, -373.279296875, -364.59649658203125, -355.9137268066406, -347.23095703125, -338.5481872558594, -329.8653869628906, -321.1826171875, -312.4998474121094, -303.81707763671875, -295.13427734375, -286.4515380859375, -277.7687683105469, -269.08599853515625, -260.4031982421875, -251.72042846679688, -243.03765869140625, -234.35488891601562, -225.67210388183594, -216.98931884765625, -208.30654907226562, -199.62376403808594, -190.9409942626953, -182.25820922851562, -173.575439453125, -164.89266967773438, -156.2098846435547, -147.52708435058594, -138.8443145751953, -130.16152954101562, -121.478759765625, -112.79597473144531, -104.11320495605469, -95.43042755126953, -86.74765014648438, -78.06487274169922, -69.38209533691406, -60.699317932128906, -52.016544342041016, -43.33376693725586, -34.6509895324707, -25.968215942382812, -17.285438537597656, -8.6026611328125, 0.08011531829833984, 8.76289176940918, 17.445667266845703, 26.12844467163086, 34.811222076416016, 43.493995666503906, 52.17677307128906, 60.85955047607422, 69.54232788085938, 78.22510528564453, 86.90788269042969, 95.59065246582031, 104.2734375, 112.95620727539062, 121.63898468017578, 130.32176208496094]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 6.0, 8.0, 6.0, 12.0, 17.0, 17.0, 22.0, 25.0, 18.0, 31.0, 26.0, 32.0, 36.0, 25.0, 33.0, 35.0, 43.0, 19.0, 42.0, 44.0, 40.0, 45.0, 49.0, 35.0, 30.0, 37.0, 48.0, 24.0, 26.0, 24.0, 22.0, 24.0, 20.0, 13.0, 12.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-44.3279914855957, -42.986610412597656, -41.645233154296875, -40.303855895996094, -38.96247482299805, -37.62109375, -36.27971649169922, -34.93833923339844, -33.59695816040039, -32.255577087402344, -30.914199829101562, -29.57282066345215, -28.231441497802734, -26.89006233215332, -25.548683166503906, -24.207304000854492, -22.865924835205078, -21.524545669555664, -20.18316650390625, -18.841787338256836, -17.500408172607422, -16.159029006958008, -14.817649841308594, -13.47627067565918, -12.134891510009766, -10.793512344360352, -9.452133178710938, -8.110754013061523, -6.769374847412109, -5.427995681762695, -4.086616516113281, -2.745237350463867, -1.4038543701171875, -0.06247520446777344, 1.2789039611816406, 2.6202831268310547, 3.9616622924804688, 5.303041458129883, 6.644420623779297, 7.985799789428711, 9.327178955078125, 10.668558120727539, 12.009937286376953, 13.351316452026367, 14.692695617675781, 16.034074783325195, 17.37545394897461, 18.716833114624023, 20.058212280273438, 21.39959144592285, 22.740970611572266, 24.08234977722168, 25.423728942871094, 26.765108108520508, 28.106487274169922, 29.447866439819336, 30.78924560546875, 32.13062286376953, 33.47200393676758, 34.813385009765625, 36.154762268066406, 37.49613952636719, 38.837520599365234, 40.17890167236328, 41.52027893066406]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 9.0, 5.0, 6.0, 6.0, 14.0, 9.0, 22.0, 25.0, 34.0, 46.0, 49.0, 42.0, 46.0, 53.0, 52.0, 60.0, 43.0, 44.0, 58.0, 45.0, 61.0, 39.0, 31.0, 35.0, 35.0, 36.0, 28.0, 17.0, 10.0, 11.0, 12.0, 7.0, 11.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.41180419921875, -7.1634521484375, -6.91510009765625, -6.666748046875, -6.41839599609375, -6.1700439453125, -5.92169189453125, -5.67333984375, -5.42498779296875, -5.1766357421875, -4.92828369140625, -4.679931640625, -4.43157958984375, -4.1832275390625, -3.93487548828125, -3.6865234375, -3.43817138671875, -3.1898193359375, -2.94146728515625, -2.693115234375, -2.44476318359375, -2.1964111328125, -1.94805908203125, -1.69970703125, -1.45135498046875, -1.2030029296875, -0.95465087890625, -0.706298828125, -0.45794677734375, -0.2095947265625, 0.03875732421875, 0.287109375, 0.53546142578125, 0.7838134765625, 1.03216552734375, 1.280517578125, 1.52886962890625, 1.7772216796875, 2.02557373046875, 2.27392578125, 2.52227783203125, 2.7706298828125, 3.01898193359375, 3.267333984375, 3.51568603515625, 3.7640380859375, 4.01239013671875, 4.2607421875, 4.50909423828125, 4.7574462890625, 5.00579833984375, 5.254150390625, 5.50250244140625, 5.7508544921875, 5.99920654296875, 6.24755859375, 6.49591064453125, 6.7442626953125, 6.99261474609375, 7.240966796875, 7.48931884765625, 7.7376708984375, 7.98602294921875, 8.234375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 7.0, 19.0, 14.0, 32.0, 50.0, 83.0, 147.0, 206.0, 308.0, 531.0, 809.0, 1268.0, 1922.0, 3023.0, 4597.0, 7017.0, 10637.0, 16149.0, 23760.0, 34396.0, 48937.0, 66248.0, 86316.0, 104386.0, 116355.0, 116433.0, 104187.0, 85162.0, 65137.0, 47993.0, 33593.0, 22987.0, 15750.0, 10416.0, 6821.0, 4539.0, 3006.0, 1896.0, 1241.0, 801.0, 507.0, 326.0, 207.0, 118.0, 72.0, 56.0, 30.0, 26.0, 11.0, 13.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.55517578125, -0.537811279296875, -0.52044677734375, -0.503082275390625, -0.4857177734375, -0.468353271484375, -0.45098876953125, -0.433624267578125, -0.416259765625, -0.398895263671875, -0.38153076171875, -0.364166259765625, -0.3468017578125, -0.329437255859375, -0.31207275390625, -0.294708251953125, -0.27734375, -0.259979248046875, -0.24261474609375, -0.225250244140625, -0.2078857421875, -0.190521240234375, -0.17315673828125, -0.155792236328125, -0.138427734375, -0.121063232421875, -0.10369873046875, -0.086334228515625, -0.0689697265625, -0.051605224609375, -0.03424072265625, -0.016876220703125, 0.00048828125, 0.017852783203125, 0.03521728515625, 0.052581787109375, 0.0699462890625, 0.087310791015625, 0.10467529296875, 0.122039794921875, 0.139404296875, 0.156768798828125, 0.17413330078125, 0.191497802734375, 0.2088623046875, 0.226226806640625, 0.24359130859375, 0.260955810546875, 0.2783203125, 0.295684814453125, 0.31304931640625, 0.330413818359375, 0.3477783203125, 0.365142822265625, 0.38250732421875, 0.399871826171875, 0.417236328125, 0.434600830078125, 0.45196533203125, 0.469329833984375, 0.4866943359375, 0.504058837890625, 0.52142333984375, 0.538787841796875, 0.55615234375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 16.0, 16.0, 18.0, 14.0, 22.0, 21.0, 25.0, 23.0, 22.0, 28.0, 30.0, 38.0, 24.0, 23.0, 39.0, 22.0, 43.0, 1062.0, 38.0, 41.0, 45.0, 29.0, 38.0, 31.0, 24.0, 32.0, 22.0, 32.0, 25.0, 12.0, 24.0, 14.0, 15.0, 12.0, 16.0, 13.0, 7.0, 7.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.603515625, -3.486785888671875, -3.37005615234375, -3.253326416015625, -3.1365966796875, -3.019866943359375, -2.90313720703125, -2.786407470703125, -2.669677734375, -2.552947998046875, -2.43621826171875, -2.319488525390625, -2.2027587890625, -2.086029052734375, -1.96929931640625, -1.852569580078125, -1.73583984375, -1.619110107421875, -1.50238037109375, -1.385650634765625, -1.2689208984375, -1.152191162109375, -1.03546142578125, -0.918731689453125, -0.802001953125, -0.685272216796875, -0.56854248046875, -0.451812744140625, -0.3350830078125, -0.218353271484375, -0.10162353515625, 0.015106201171875, 0.1318359375, 0.248565673828125, 0.36529541015625, 0.482025146484375, 0.5987548828125, 0.715484619140625, 0.83221435546875, 0.948944091796875, 1.065673828125, 1.182403564453125, 1.29913330078125, 1.415863037109375, 1.5325927734375, 1.649322509765625, 1.76605224609375, 1.882781982421875, 1.99951171875, 2.116241455078125, 2.23297119140625, 2.349700927734375, 2.4664306640625, 2.583160400390625, 2.69989013671875, 2.816619873046875, 2.933349609375, 3.050079345703125, 3.16680908203125, 3.283538818359375, 3.4002685546875, 3.516998291015625, 3.63372802734375, 3.750457763671875, 3.8671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 3.0, 14.0, 14.0, 17.0, 41.0, 45.0, 86.0, 145.0, 191.0, 336.0, 541.0, 782.0, 1321.0, 2199.0, 3593.0, 5872.0, 9555.0, 15720.0, 25009.0, 42028.0, 1879638.0, 42996.0, 25897.0, 15869.0, 9710.0, 5916.0, 3744.0, 2228.0, 1383.0, 834.0, 505.0, 321.0, 192.0, 126.0, 76.0, 51.0, 39.0, 30.0, 12.0, 17.0, 13.0, 1.0, 4.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6201171875, -1.57318115234375, -1.5262451171875, -1.47930908203125, -1.432373046875, -1.38543701171875, -1.3385009765625, -1.29156494140625, -1.24462890625, -1.19769287109375, -1.1507568359375, -1.10382080078125, -1.056884765625, -1.00994873046875, -0.9630126953125, -0.91607666015625, -0.869140625, -0.82220458984375, -0.7752685546875, -0.72833251953125, -0.681396484375, -0.63446044921875, -0.5875244140625, -0.54058837890625, -0.49365234375, -0.44671630859375, -0.3997802734375, -0.35284423828125, -0.305908203125, -0.25897216796875, -0.2120361328125, -0.16510009765625, -0.1181640625, -0.07122802734375, -0.0242919921875, 0.02264404296875, 0.069580078125, 0.11651611328125, 0.1634521484375, 0.21038818359375, 0.25732421875, 0.30426025390625, 0.3511962890625, 0.39813232421875, 0.445068359375, 0.49200439453125, 0.5389404296875, 0.58587646484375, 0.6328125, 0.67974853515625, 0.7266845703125, 0.77362060546875, 0.820556640625, 0.86749267578125, 0.9144287109375, 0.96136474609375, 1.00830078125, 1.05523681640625, 1.1021728515625, 1.14910888671875, 1.196044921875, 1.24298095703125, 1.2899169921875, 1.33685302734375, 1.3837890625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 1.0, 7.0, 7.0, 14.0, 21.0, 38.0, 56.0, 98.0, 154.0, 142.0, 152.0, 112.0, 66.0, 49.0, 26.0, 13.0, 7.0, 3.0, 6.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0367431640625, -0.035741329193115234, -0.03473949432373047, -0.0337376594543457, -0.03273582458496094, -0.03173398971557617, -0.030732154846191406, -0.02973031997680664, -0.028728485107421875, -0.02772665023803711, -0.026724815368652344, -0.025722980499267578, -0.024721145629882812, -0.023719310760498047, -0.02271747589111328, -0.021715641021728516, -0.02071380615234375, -0.019711971282958984, -0.01871013641357422, -0.017708301544189453, -0.016706466674804688, -0.015704631805419922, -0.014702796936035156, -0.01370096206665039, -0.012699127197265625, -0.01169729232788086, -0.010695457458496094, -0.009693622589111328, -0.008691787719726562, -0.007689952850341797, -0.006688117980957031, -0.005686283111572266, -0.0046844482421875, -0.0036826133728027344, -0.0026807785034179688, -0.0016789436340332031, -0.0006771087646484375, 0.0003247261047363281, 0.0013265609741210938, 0.0023283958435058594, 0.003330230712890625, 0.004332065582275391, 0.005333900451660156, 0.006335735321044922, 0.0073375701904296875, 0.008339405059814453, 0.009341239929199219, 0.010343074798583984, 0.01134490966796875, 0.012346744537353516, 0.013348579406738281, 0.014350414276123047, 0.015352249145507812, 0.016354084014892578, 0.017355918884277344, 0.01835775375366211, 0.019359588623046875, 0.02036142349243164, 0.021363258361816406, 0.022365093231201172, 0.023366928100585938, 0.024368762969970703, 0.02537059783935547, 0.026372432708740234, 0.027374267578125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 6.0, 8.0, 3.0, 11.0, 17.0, 32.0, 88.0, 205.0, 711.0, 950404.0, 96086.0, 590.0, 184.0, 77.0, 40.0, 15.0, 15.0, 12.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.651123046875, -0.626953125, -0.602783203125, -0.57861328125, -0.554443359375, -0.5302734375, -0.506103515625, -0.48193359375, -0.457763671875, -0.43359375, -0.409423828125, -0.38525390625, -0.361083984375, -0.3369140625, -0.312744140625, -0.28857421875, -0.264404296875, -0.240234375, -0.216064453125, -0.19189453125, -0.167724609375, -0.1435546875, -0.119384765625, -0.09521484375, -0.071044921875, -0.046875, -0.022705078125, 0.00146484375, 0.025634765625, 0.0498046875, 0.073974609375, 0.09814453125, 0.122314453125, 0.146484375, 0.170654296875, 0.19482421875, 0.218994140625, 0.2431640625, 0.267333984375, 0.29150390625, 0.315673828125, 0.33984375, 0.364013671875, 0.38818359375, 0.412353515625, 0.4365234375, 0.460693359375, 0.48486328125, 0.509033203125, 0.533203125, 0.557373046875, 0.58154296875, 0.605712890625, 0.6298828125, 0.654052734375, 0.67822265625, 0.702392578125, 0.7265625, 0.750732421875, 0.77490234375, 0.799072265625, 0.8232421875, 0.847412109375, 0.87158203125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 11.0, 1002.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20539942383766174, -0.19582006335258484, -0.18624070286750793, -0.17666135728359222, -0.16708199679851532, -0.15750263631343842, -0.1479232907295227, -0.1383439302444458, -0.1287645697593689, -0.11918520927429199, -0.10960585623979568, -0.10002650320529938, -0.09044714272022247, -0.08086778223514557, -0.07128842920064926, -0.061709076166152954, -0.05212971568107605, -0.042550358921289444, -0.03297100216150284, -0.023391645401716232, -0.013812288641929626, -0.004232931882143021, 0.005346424877643585, 0.014925777912139893, 0.024505138397216797, 0.0340844951570034, 0.04366385191679001, 0.053243208676576614, 0.06282256543636322, 0.07240192592144012, 0.08198127895593643, 0.09156063199043274, 0.10113999247550964, 0.11071935296058655, 0.12029870599508286, 0.12987805902957916, 0.13945741951465607, 0.14903677999973297, 0.15861612558364868, 0.16819548606872559, 0.1777748465538025, 0.1873542070388794, 0.1969335675239563, 0.206512913107872, 0.2160922735929489, 0.22567163407802582, 0.23525097966194153, 0.24483034014701843, 0.25440970063209534, 0.26398906111717224, 0.27356842160224915, 0.28314778208732605, 0.29272711277008057, 0.30230647325515747, 0.3118858337402344, 0.3214651942253113, 0.3310445547103882, 0.3406239151954651, 0.350203275680542, 0.3597826361656189, 0.3693619966506958, 0.3789413273334503, 0.3885206878185272, 0.3981000483036041, 0.40767940878868103]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 24.0, 21.0, 34.0, 26.0, 42.0, 43.0, 51.0, 49.0, 61.0, 65.0, 60.0, 63.0, 68.0, 62.0, 59.0, 56.0, 36.0, 35.0, 31.0, 27.0, 14.0, 21.0, 7.0, 6.0, 7.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023725152015686035, -0.02281872183084488, -0.021912293508648872, -0.021005865186452866, -0.02009943500161171, -0.019193004816770554, -0.018286576494574547, -0.01738014817237854, -0.016473717987537384, -0.015567288734018803, -0.014660859480500221, -0.01375443022698164, -0.012848000973463058, -0.011941571719944477, -0.011035142466425896, -0.010128713212907314, -0.009222283959388733, -0.008315854705870152, -0.00740942545235157, -0.006502996198832989, -0.005596566945314407, -0.004690137691795826, -0.0037837084382772446, -0.002877279184758663, -0.001970849931240082, -0.0010644206777215004, -0.000157991424202919, 0.0007484378293156624, 0.0016548670828342438, 0.002561296336352825, 0.0034677255898714066, 0.004374154843389988, 0.005280584096908569, 0.006187013350427151, 0.007093442603945732, 0.007999871857464314, 0.008906301110982895, 0.009812730364501476, 0.010719159618020058, 0.011625588871538639, 0.01253201812505722, 0.013438447378575802, 0.014344876632094383, 0.015251305885612965, 0.016157735139131546, 0.017064165323972702, 0.01797059364616871, 0.018877021968364716, 0.01978345215320587, 0.020689882338047028, 0.021596310660243034, 0.02250273898243904, 0.023409169167280197, 0.024315599352121353, 0.02522202767431736, 0.026128455996513367, 0.027034886181354523, 0.02794131636619568, 0.028847744688391685, 0.029754173010587692, 0.03066060319542885, 0.031567033380270004, 0.03247345983982086, 0.03337989002466202, 0.034286320209503174]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 1.0, 2.0, 7.0, 9.0, 13.0, 7.0, 11.0, 21.0, 26.0, 18.0, 30.0, 44.0, 32.0, 40.0, 42.0, 42.0, 43.0, 47.0, 44.0, 40.0, 49.0, 47.0, 47.0, 43.0, 26.0, 33.0, 41.0, 28.0, 28.0, 23.0, 20.0, 22.0, 11.0, 8.0, 12.0, 11.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.40545654296875, -5.1937255859375, -4.98199462890625, -4.770263671875, -4.55853271484375, -4.3468017578125, -4.13507080078125, -3.92333984375, -3.71160888671875, -3.4998779296875, -3.28814697265625, -3.076416015625, -2.86468505859375, -2.6529541015625, -2.44122314453125, -2.2294921875, -2.01776123046875, -1.8060302734375, -1.59429931640625, -1.382568359375, -1.17083740234375, -0.9591064453125, -0.74737548828125, -0.53564453125, -0.32391357421875, -0.1121826171875, 0.09954833984375, 0.311279296875, 0.52301025390625, 0.7347412109375, 0.94647216796875, 1.158203125, 1.36993408203125, 1.5816650390625, 1.79339599609375, 2.005126953125, 2.21685791015625, 2.4285888671875, 2.64031982421875, 2.85205078125, 3.06378173828125, 3.2755126953125, 3.48724365234375, 3.698974609375, 3.91070556640625, 4.1224365234375, 4.33416748046875, 4.5458984375, 4.75762939453125, 4.9693603515625, 5.18109130859375, 5.392822265625, 5.60455322265625, 5.8162841796875, 6.02801513671875, 6.23974609375, 6.45147705078125, 6.6632080078125, 6.87493896484375, 7.086669921875, 7.29840087890625, 7.5101318359375, 7.72186279296875, 7.93359375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 17.0, 16.0, 20.0, 19.0, 43.0, 62.0, 95.0, 117.0, 140.0, 197.0, 311.0, 404.0, 708.0, 1252.0, 2751.0, 7247.0, 24671.0, 108514.0, 430272.0, 358794.0, 81894.0, 19462.0, 6129.0, 2273.0, 1087.0, 653.0, 425.0, 293.0, 183.0, 146.0, 90.0, 82.0, 51.0, 43.0, 28.0, 19.0, 16.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1484375, -7.8665771484375, -7.584716796875, -7.3028564453125, -7.02099609375, -6.7391357421875, -6.457275390625, -6.1754150390625, -5.8935546875, -5.6116943359375, -5.329833984375, -5.0479736328125, -4.76611328125, -4.4842529296875, -4.202392578125, -3.9205322265625, -3.638671875, -3.3568115234375, -3.074951171875, -2.7930908203125, -2.51123046875, -2.2293701171875, -1.947509765625, -1.6656494140625, -1.3837890625, -1.1019287109375, -0.820068359375, -0.5382080078125, -0.25634765625, 0.0255126953125, 0.307373046875, 0.5892333984375, 0.87109375, 1.1529541015625, 1.434814453125, 1.7166748046875, 1.99853515625, 2.2803955078125, 2.562255859375, 2.8441162109375, 3.1259765625, 3.4078369140625, 3.689697265625, 3.9715576171875, 4.25341796875, 4.5352783203125, 4.817138671875, 5.0989990234375, 5.380859375, 5.6627197265625, 5.944580078125, 6.2264404296875, 6.50830078125, 6.7901611328125, 7.072021484375, 7.3538818359375, 7.6357421875, 7.9176025390625, 8.199462890625, 8.4813232421875, 8.76318359375, 9.0450439453125, 9.326904296875, 9.6087646484375, 9.890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 12.0, 11.0, 8.0, 16.0, 16.0, 17.0, 29.0, 36.0, 28.0, 48.0, 59.0, 68.0, 88.0, 159.0, 937.0, 944.0, 151.0, 97.0, 55.0, 37.0, 42.0, 33.0, 29.0, 30.0, 16.0, 14.0, 11.0, 13.0, 10.0, 13.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.431640625, -12.84765625, -12.263671875, -11.6796875, -11.095703125, -10.51171875, -9.927734375, -9.34375, -8.759765625, -8.17578125, -7.591796875, -7.0078125, -6.423828125, -5.83984375, -5.255859375, -4.671875, -4.087890625, -3.50390625, -2.919921875, -2.3359375, -1.751953125, -1.16796875, -0.583984375, 0.0, 0.583984375, 1.16796875, 1.751953125, 2.3359375, 2.919921875, 3.50390625, 4.087890625, 4.671875, 5.255859375, 5.83984375, 6.423828125, 7.0078125, 7.591796875, 8.17578125, 8.759765625, 9.34375, 9.927734375, 10.51171875, 11.095703125, 11.6796875, 12.263671875, 12.84765625, 13.431640625, 14.015625, 14.599609375, 15.18359375, 15.767578125, 16.3515625, 16.935546875, 17.51953125, 18.103515625, 18.6875, 19.271484375, 19.85546875, 20.439453125, 21.0234375, 21.607421875, 22.19140625, 22.775390625, 23.359375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 11.0, 12.0, 13.0, 18.0, 21.0, 29.0, 46.0, 59.0, 88.0, 124.0, 198.0, 338.0, 785.0, 4043.0, 2860429.0, 275822.0, 2138.0, 609.0, 303.0, 185.0, 133.0, 77.0, 63.0, 44.0, 26.0, 34.0, 17.0, 8.0, 13.0, 4.0, 5.0, 6.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.78125, -40.58251953125, -39.3837890625, -38.18505859375, -36.986328125, -35.78759765625, -34.5888671875, -33.39013671875, -32.19140625, -30.99267578125, -29.7939453125, -28.59521484375, -27.396484375, -26.19775390625, -24.9990234375, -23.80029296875, -22.6015625, -21.40283203125, -20.2041015625, -19.00537109375, -17.806640625, -16.60791015625, -15.4091796875, -14.21044921875, -13.01171875, -11.81298828125, -10.6142578125, -9.41552734375, -8.216796875, -7.01806640625, -5.8193359375, -4.62060546875, -3.421875, -2.22314453125, -1.0244140625, 0.17431640625, 1.373046875, 2.57177734375, 3.7705078125, 4.96923828125, 6.16796875, 7.36669921875, 8.5654296875, 9.76416015625, 10.962890625, 12.16162109375, 13.3603515625, 14.55908203125, 15.7578125, 16.95654296875, 18.1552734375, 19.35400390625, 20.552734375, 21.75146484375, 22.9501953125, 24.14892578125, 25.34765625, 26.54638671875, 27.7451171875, 28.94384765625, 30.142578125, 31.34130859375, 32.5400390625, 33.73876953125, 34.9375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 113.0, 796.0, 96.0, 1.0, 1.0], "bins": [-476.4843444824219, -468.6148986816406, -460.74542236328125, -452.8759765625, -445.00653076171875, -437.1370544433594, -429.2676086425781, -421.3981628417969, -413.5286865234375, -405.65924072265625, -397.7897644042969, -389.9203186035156, -382.0508728027344, -374.181396484375, -366.31195068359375, -358.4425048828125, -350.57305908203125, -342.70361328125, -334.8341369628906, -326.9646911621094, -319.0952453613281, -311.22576904296875, -303.3563232421875, -295.48687744140625, -287.6174011230469, -279.7479553222656, -271.87847900390625, -264.009033203125, -256.13958740234375, -248.27012634277344, -240.40066528320312, -232.53121948242188, -224.66177368164062, -216.7923126220703, -208.92286682128906, -201.05340576171875, -193.18394470214844, -185.3144989013672, -177.44503784179688, -169.57559204101562, -161.70611572265625, -153.83665466308594, -145.9672088623047, -138.09774780273438, -130.22828674316406, -122.35884094238281, -114.4893798828125, -106.61992645263672, -98.75047302246094, -90.88101959228516, -83.01155853271484, -75.14210510253906, -67.27265167236328, -59.403194427490234, -51.53373718261719, -43.664283752441406, -35.794830322265625, -27.92537498474121, -20.055919647216797, -12.18646240234375, -4.317007064819336, 3.552448272705078, 11.421905517578125, 19.291358947753906, 27.160818099975586]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 11.0, 13.0, 7.0, 16.0, 12.0, 15.0, 9.0, 29.0, 28.0, 25.0, 31.0, 25.0, 33.0, 23.0, 37.0, 45.0, 46.0, 36.0, 48.0, 46.0, 38.0, 39.0, 49.0, 36.0, 36.0, 26.0, 45.0, 26.0, 24.0, 24.0, 20.0, 12.0, 11.0, 5.0, 14.0, 8.0, 12.0, 3.0, 3.0, 9.0, 7.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.25749206542969, -33.1310920715332, -32.00469207763672, -30.878293991088867, -29.751893997192383, -28.6254940032959, -27.499095916748047, -26.372695922851562, -25.246295928955078, -24.119895935058594, -22.99349594116211, -21.867097854614258, -20.740697860717773, -19.61429786682129, -18.487899780273438, -17.361499786376953, -16.23509979248047, -15.108699798583984, -13.982300758361816, -12.855901718139648, -11.729501724243164, -10.60310173034668, -9.476702690124512, -8.350303649902344, -7.223903656005859, -6.097504138946533, -4.971104621887207, -3.844705104827881, -2.7183055877685547, -1.5919060707092285, -0.46550655364990234, 0.6608929634094238, 1.7872962951660156, 2.913695812225342, 4.040095329284668, 5.166494846343994, 6.29289436340332, 7.4192938804626465, 8.545693397521973, 9.67209243774414, 10.798492431640625, 11.92489242553711, 13.051291465759277, 14.177690505981445, 15.30409049987793, 16.430490493774414, 17.556888580322266, 18.68328857421875, 19.809688568115234, 20.93608856201172, 22.062488555908203, 23.188886642456055, 24.31528663635254, 25.441686630249023, 26.568084716796875, 27.69448471069336, 28.820884704589844, 29.947284698486328, 31.073684692382812, 32.2000846862793, 33.32648468017578, 34.452880859375, 35.579280853271484, 36.70568084716797, 37.83208084106445]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 10.0, 11.0, 11.0, 14.0, 14.0, 28.0, 23.0, 38.0, 37.0, 54.0, 56.0, 50.0, 50.0, 46.0, 68.0, 61.0, 52.0, 56.0, 57.0, 29.0, 48.0, 29.0, 26.0, 30.0, 21.0, 24.0, 13.0, 9.0, 10.0, 13.0, 6.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5234375, -9.233642578125, -8.94384765625, -8.654052734375, -8.3642578125, -8.074462890625, -7.78466796875, -7.494873046875, -7.205078125, -6.915283203125, -6.62548828125, -6.335693359375, -6.0458984375, -5.756103515625, -5.46630859375, -5.176513671875, -4.88671875, -4.596923828125, -4.30712890625, -4.017333984375, -3.7275390625, -3.437744140625, -3.14794921875, -2.858154296875, -2.568359375, -2.278564453125, -1.98876953125, -1.698974609375, -1.4091796875, -1.119384765625, -0.82958984375, -0.539794921875, -0.25, 0.039794921875, 0.32958984375, 0.619384765625, 0.9091796875, 1.198974609375, 1.48876953125, 1.778564453125, 2.068359375, 2.358154296875, 2.64794921875, 2.937744140625, 3.2275390625, 3.517333984375, 3.80712890625, 4.096923828125, 4.38671875, 4.676513671875, 4.96630859375, 5.256103515625, 5.5458984375, 5.835693359375, 6.12548828125, 6.415283203125, 6.705078125, 6.994873046875, 7.28466796875, 7.574462890625, 7.8642578125, 8.154052734375, 8.44384765625, 8.733642578125, 9.0234375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 13.0, 13.0, 24.0, 21.0, 38.0, 61.0, 72.0, 138.0, 165.0, 298.0, 412.0, 769.0, 1387.0, 4432.0, 86201.0, 2974533.0, 1098863.0, 21402.0, 2578.0, 1023.0, 590.0, 399.0, 305.0, 186.0, 88.0, 76.0, 54.0, 39.0, 30.0, 15.0, 7.0, 12.0, 14.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.46875, -35.28515625, -34.1015625, -32.91796875, -31.734375, -30.55078125, -29.3671875, -28.18359375, -27.0, -25.81640625, -24.6328125, -23.44921875, -22.265625, -21.08203125, -19.8984375, -18.71484375, -17.53125, -16.34765625, -15.1640625, -13.98046875, -12.796875, -11.61328125, -10.4296875, -9.24609375, -8.0625, -6.87890625, -5.6953125, -4.51171875, -3.328125, -2.14453125, -0.9609375, 0.22265625, 1.40625, 2.58984375, 3.7734375, 4.95703125, 6.140625, 7.32421875, 8.5078125, 9.69140625, 10.875, 12.05859375, 13.2421875, 14.42578125, 15.609375, 16.79296875, 17.9765625, 19.16015625, 20.34375, 21.52734375, 22.7109375, 23.89453125, 25.078125, 26.26171875, 27.4453125, 28.62890625, 29.8125, 30.99609375, 32.1796875, 33.36328125, 34.546875, 35.73046875, 36.9140625, 38.09765625, 39.28125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 15.0, 17.0, 34.0, 58.0, 88.0, 124.0, 192.0, 312.0, 437.0, 607.0, 649.0, 489.0, 358.0, 246.0, 161.0, 108.0, 83.0, 34.0, 16.0, 14.0, 9.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.09375, -23.4951171875, -22.896484375, -22.2978515625, -21.69921875, -21.1005859375, -20.501953125, -19.9033203125, -19.3046875, -18.7060546875, -18.107421875, -17.5087890625, -16.91015625, -16.3115234375, -15.712890625, -15.1142578125, -14.515625, -13.9169921875, -13.318359375, -12.7197265625, -12.12109375, -11.5224609375, -10.923828125, -10.3251953125, -9.7265625, -9.1279296875, -8.529296875, -7.9306640625, -7.33203125, -6.7333984375, -6.134765625, -5.5361328125, -4.9375, -4.3388671875, -3.740234375, -3.1416015625, -2.54296875, -1.9443359375, -1.345703125, -0.7470703125, -0.1484375, 0.4501953125, 1.048828125, 1.6474609375, 2.24609375, 2.8447265625, 3.443359375, 4.0419921875, 4.640625, 5.2392578125, 5.837890625, 6.4365234375, 7.03515625, 7.6337890625, 8.232421875, 8.8310546875, 9.4296875, 10.0283203125, 10.626953125, 11.2255859375, 11.82421875, 12.4228515625, 13.021484375, 13.6201171875, 14.21875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 3.0, 19.0, 16.0, 37.0, 60.0, 102.0, 172.0, 397.0, 758.0, 1735.0, 4541.0, 14656.0, 66041.0, 355167.0, 1538170.0, 1692693.0, 417288.0, 77266.0, 16688.0, 4921.0, 1899.0, 791.0, 396.0, 217.0, 91.0, 54.0, 36.0, 17.0, 15.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.25, -12.86083984375, -12.4716796875, -12.08251953125, -11.693359375, -11.30419921875, -10.9150390625, -10.52587890625, -10.13671875, -9.74755859375, -9.3583984375, -8.96923828125, -8.580078125, -8.19091796875, -7.8017578125, -7.41259765625, -7.0234375, -6.63427734375, -6.2451171875, -5.85595703125, -5.466796875, -5.07763671875, -4.6884765625, -4.29931640625, -3.91015625, -3.52099609375, -3.1318359375, -2.74267578125, -2.353515625, -1.96435546875, -1.5751953125, -1.18603515625, -0.796875, -0.40771484375, -0.0185546875, 0.37060546875, 0.759765625, 1.14892578125, 1.5380859375, 1.92724609375, 2.31640625, 2.70556640625, 3.0947265625, 3.48388671875, 3.873046875, 4.26220703125, 4.6513671875, 5.04052734375, 5.4296875, 5.81884765625, 6.2080078125, 6.59716796875, 6.986328125, 7.37548828125, 7.7646484375, 8.15380859375, 8.54296875, 8.93212890625, 9.3212890625, 9.71044921875, 10.099609375, 10.48876953125, 10.8779296875, 11.26708984375, 11.65625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 8.0, 10.0, 14.0, 18.0, 17.0, 18.0, 23.0, 30.0, 28.0, 47.0, 40.0, 50.0, 51.0, 52.0, 52.0, 65.0, 43.0, 51.0, 61.0, 42.0, 38.0, 40.0, 20.0, 23.0, 29.0, 22.0, 19.0, 20.0, 9.0, 10.0, 11.0, 6.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.954532623291016, -51.15250015258789, -49.3504638671875, -47.548431396484375, -45.74639892578125, -43.944366455078125, -42.142330169677734, -40.34029769897461, -38.53826141357422, -36.736228942871094, -34.9341926574707, -33.13216018676758, -31.330127716064453, -29.528093338012695, -27.726058959960938, -25.924026489257812, -24.121994018554688, -22.31995964050293, -20.517927169799805, -18.715892791748047, -16.913860321044922, -15.111825942993164, -13.309791564941406, -11.507758140563965, -9.705724716186523, -7.903691291809082, -6.101657390594482, -4.299623489379883, -2.4975900650024414, -0.695556640625, 1.1064777374267578, 2.908511161804199, 4.710540771484375, 6.512574195861816, 8.314607620239258, 10.116641998291016, 11.918675422668457, 13.720708847045898, 15.522743225097656, 17.32477569580078, 19.12681007385254, 20.928844451904297, 22.730876922607422, 24.53291130065918, 26.334945678710938, 28.136978149414062, 29.93901252746582, 31.741046905517578, 33.5430793762207, 35.34511184692383, 37.14714813232422, 38.949180603027344, 40.75121307373047, 42.553245544433594, 44.355281829833984, 46.15731430053711, 47.9593505859375, 49.761383056640625, 51.563419342041016, 53.36545181274414, 55.167484283447266, 56.969520568847656, 58.77155303955078, 60.573585510253906, 62.37561798095703]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 5.0, 12.0, 6.0, 12.0, 13.0, 17.0, 19.0, 30.0, 27.0, 30.0, 25.0, 31.0, 38.0, 28.0, 32.0, 31.0, 47.0, 43.0, 39.0, 43.0, 32.0, 36.0, 36.0, 40.0, 35.0, 41.0, 42.0, 29.0, 17.0, 22.0, 15.0, 19.0, 14.0, 11.0, 20.0, 3.0, 8.0, 9.0, 6.0, 10.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-57.087806701660156, -55.41359329223633, -53.7393798828125, -52.06516647338867, -50.390953063964844, -48.71673583984375, -47.04252243041992, -45.368309020996094, -43.694095611572266, -42.01988220214844, -40.34566879272461, -38.67145538330078, -36.99723815917969, -35.323028564453125, -33.64881134033203, -31.974597930908203, -30.300384521484375, -28.626171112060547, -26.95195770263672, -25.277742385864258, -23.60352897644043, -21.9293155670166, -20.25510025024414, -18.580886840820312, -16.906673431396484, -15.232460021972656, -13.558245658874512, -11.884031295776367, -10.209817886352539, -8.535604476928711, -6.861390113830566, -5.187175750732422, -3.5129623413085938, -1.8387484550476074, -0.1645345687866211, 1.5096793174743652, 3.1838932037353516, 4.85810661315918, 6.532320976257324, 8.206535339355469, 9.880748748779297, 11.554962158203125, 13.22917652130127, 14.903390884399414, 16.577604293823242, 18.25181770324707, 19.92603302001953, 21.60024642944336, 23.274459838867188, 24.948673248291016, 26.622886657714844, 28.297101974487305, 29.971315383911133, 31.64552879333496, 33.31974411010742, 34.99395751953125, 36.66817092895508, 38.342384338378906, 40.016597747802734, 41.69081115722656, 43.365028381347656, 45.03923797607422, 46.71345520019531, 48.38766860961914, 50.06188201904297]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 1.0, 4.0, 12.0, 11.0, 9.0, 10.0, 22.0, 20.0, 19.0, 30.0, 23.0, 28.0, 44.0, 39.0, 45.0, 38.0, 53.0, 45.0, 49.0, 48.0, 45.0, 40.0, 28.0, 37.0, 40.0, 31.0, 32.0, 29.0, 23.0, 26.0, 23.0, 15.0, 18.0, 15.0, 9.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.8125, -106.4921875, -103.171875, -99.8515625, -96.53125, -93.2109375, -89.890625, -86.5703125, -83.25, -79.9296875, -76.609375, -73.2890625, -69.96875, -66.6484375, -63.328125, -60.0078125, -56.6875, -53.3671875, -50.046875, -46.7265625, -43.40625, -40.0859375, -36.765625, -33.4453125, -30.125, -26.8046875, -23.484375, -20.1640625, -16.84375, -13.5234375, -10.203125, -6.8828125, -3.5625, -0.2421875, 3.078125, 6.3984375, 9.71875, 13.0390625, 16.359375, 19.6796875, 23.0, 26.3203125, 29.640625, 32.9609375, 36.28125, 39.6015625, 42.921875, 46.2421875, 49.5625, 52.8828125, 56.203125, 59.5234375, 62.84375, 66.1640625, 69.484375, 72.8046875, 76.125, 79.4453125, 82.765625, 86.0859375, 89.40625, 92.7265625, 96.046875, 99.3671875, 102.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 5.0, 16.0, 17.0, 28.0, 48.0, 56.0, 101.0, 130.0, 218.0, 358.0, 616.0, 920.0, 1494.0, 2348.0, 3661.0, 5831.0, 9289.0, 14467.0, 22402.0, 33689.0, 50544.0, 72283.0, 97998.0, 122410.0, 135794.0, 128003.0, 104790.0, 78563.0, 55446.0, 37745.0, 25155.0, 16115.0, 10195.0, 6655.0, 4060.0, 2616.0, 1659.0, 1027.0, 659.0, 419.0, 260.0, 147.0, 110.0, 82.0, 52.0, 25.0, 24.0, 15.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8046875, -6.58953857421875, -6.3743896484375, -6.15924072265625, -5.944091796875, -5.72894287109375, -5.5137939453125, -5.29864501953125, -5.08349609375, -4.86834716796875, -4.6531982421875, -4.43804931640625, -4.222900390625, -4.00775146484375, -3.7926025390625, -3.57745361328125, -3.3623046875, -3.14715576171875, -2.9320068359375, -2.71685791015625, -2.501708984375, -2.28656005859375, -2.0714111328125, -1.85626220703125, -1.64111328125, -1.42596435546875, -1.2108154296875, -0.99566650390625, -0.780517578125, -0.56536865234375, -0.3502197265625, -0.13507080078125, 0.080078125, 0.29522705078125, 0.5103759765625, 0.72552490234375, 0.940673828125, 1.15582275390625, 1.3709716796875, 1.58612060546875, 1.80126953125, 2.01641845703125, 2.2315673828125, 2.44671630859375, 2.661865234375, 2.87701416015625, 3.0921630859375, 3.30731201171875, 3.5224609375, 3.73760986328125, 3.9527587890625, 4.16790771484375, 4.383056640625, 4.59820556640625, 4.8133544921875, 5.02850341796875, 5.24365234375, 5.45880126953125, 5.6739501953125, 5.88909912109375, 6.104248046875, 6.31939697265625, 6.5345458984375, 6.74969482421875, 6.96484375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 9.0, 5.0, 9.0, 4.0, 5.0, 16.0, 17.0, 14.0, 16.0, 26.0, 30.0, 36.0, 22.0, 32.0, 37.0, 35.0, 30.0, 44.0, 52.0, 34.0, 47.0, 1060.0, 41.0, 36.0, 32.0, 27.0, 33.0, 27.0, 26.0, 23.0, 33.0, 25.0, 24.0, 18.0, 11.0, 14.0, 11.0, 11.0, 6.0, 9.0, 11.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-58.375, -56.50244140625, -54.6298828125, -52.75732421875, -50.884765625, -49.01220703125, -47.1396484375, -45.26708984375, -43.39453125, -41.52197265625, -39.6494140625, -37.77685546875, -35.904296875, -34.03173828125, -32.1591796875, -30.28662109375, -28.4140625, -26.54150390625, -24.6689453125, -22.79638671875, -20.923828125, -19.05126953125, -17.1787109375, -15.30615234375, -13.43359375, -11.56103515625, -9.6884765625, -7.81591796875, -5.943359375, -4.07080078125, -2.1982421875, -0.32568359375, 1.546875, 3.41943359375, 5.2919921875, 7.16455078125, 9.037109375, 10.90966796875, 12.7822265625, 14.65478515625, 16.52734375, 18.39990234375, 20.2724609375, 22.14501953125, 24.017578125, 25.89013671875, 27.7626953125, 29.63525390625, 31.5078125, 33.38037109375, 35.2529296875, 37.12548828125, 38.998046875, 40.87060546875, 42.7431640625, 44.61572265625, 46.48828125, 48.36083984375, 50.2333984375, 52.10595703125, 53.978515625, 55.85107421875, 57.7236328125, 59.59619140625, 61.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 11.0, 15.0, 17.0, 22.0, 37.0, 50.0, 63.0, 86.0, 119.0, 181.0, 297.0, 433.0, 670.0, 1013.0, 1682.0, 2583.0, 4019.0, 6329.0, 9800.0, 15191.0, 23288.0, 36163.0, 1870557.0, 46397.0, 27407.0, 18048.0, 11619.0, 7584.0, 4679.0, 3105.0, 1947.0, 1268.0, 823.0, 536.0, 343.0, 246.0, 145.0, 108.0, 73.0, 45.0, 25.0, 25.0, 25.0, 12.0, 13.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.921875, -17.318359375, -16.71484375, -16.111328125, -15.5078125, -14.904296875, -14.30078125, -13.697265625, -13.09375, -12.490234375, -11.88671875, -11.283203125, -10.6796875, -10.076171875, -9.47265625, -8.869140625, -8.265625, -7.662109375, -7.05859375, -6.455078125, -5.8515625, -5.248046875, -4.64453125, -4.041015625, -3.4375, -2.833984375, -2.23046875, -1.626953125, -1.0234375, -0.419921875, 0.18359375, 0.787109375, 1.390625, 1.994140625, 2.59765625, 3.201171875, 3.8046875, 4.408203125, 5.01171875, 5.615234375, 6.21875, 6.822265625, 7.42578125, 8.029296875, 8.6328125, 9.236328125, 9.83984375, 10.443359375, 11.046875, 11.650390625, 12.25390625, 12.857421875, 13.4609375, 14.064453125, 14.66796875, 15.271484375, 15.875, 16.478515625, 17.08203125, 17.685546875, 18.2890625, 18.892578125, 19.49609375, 20.099609375, 20.703125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 8.0, 14.0, 29.0, 26.0, 31.0, 38.0, 41.0, 43.0, 56.0, 60.0, 69.0, 68.0, 74.0, 68.0, 46.0, 46.0, 50.0, 39.0, 38.0, 28.0, 25.0, 18.0, 10.0, 12.0, 8.0, 8.0, 8.0, 8.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.142333984375, -0.13824462890625, -0.1341552734375, -0.13006591796875, -0.1259765625, -0.12188720703125, -0.1177978515625, -0.11370849609375, -0.109619140625, -0.10552978515625, -0.1014404296875, -0.09735107421875, -0.09326171875, -0.08917236328125, -0.0850830078125, -0.08099365234375, -0.076904296875, -0.07281494140625, -0.0687255859375, -0.06463623046875, -0.060546875, -0.05645751953125, -0.0523681640625, -0.04827880859375, -0.044189453125, -0.04010009765625, -0.0360107421875, -0.03192138671875, -0.02783203125, -0.02374267578125, -0.0196533203125, -0.01556396484375, -0.011474609375, -0.00738525390625, -0.0032958984375, 0.00079345703125, 0.0048828125, 0.00897216796875, 0.0130615234375, 0.01715087890625, 0.021240234375, 0.02532958984375, 0.0294189453125, 0.03350830078125, 0.03759765625, 0.04168701171875, 0.0457763671875, 0.04986572265625, 0.053955078125, 0.05804443359375, 0.0621337890625, 0.06622314453125, 0.0703125, 0.07440185546875, 0.0784912109375, 0.08258056640625, 0.086669921875, 0.09075927734375, 0.0948486328125, 0.09893798828125, 0.10302734375, 0.10711669921875, 0.1112060546875, 0.11529541015625, 0.119384765625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 11.0, 9.0, 12.0, 16.0, 25.0, 55.0, 64.0, 95.0, 147.0, 237.0, 403.0, 698.0, 1444.0, 3494.0, 8777.0, 24649.0, 72491.0, 201998.0, 355433.0, 239974.0, 89343.0, 30328.0, 10876.0, 4168.0, 1759.0, 843.0, 505.0, 265.0, 150.0, 80.0, 67.0, 44.0, 20.0, 14.0, 21.0, 14.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6376953125, -0.618133544921875, -0.59857177734375, -0.579010009765625, -0.5594482421875, -0.539886474609375, -0.52032470703125, -0.500762939453125, -0.481201171875, -0.461639404296875, -0.44207763671875, -0.422515869140625, -0.4029541015625, -0.383392333984375, -0.36383056640625, -0.344268798828125, -0.32470703125, -0.305145263671875, -0.28558349609375, -0.266021728515625, -0.2464599609375, -0.226898193359375, -0.20733642578125, -0.187774658203125, -0.168212890625, -0.148651123046875, -0.12908935546875, -0.109527587890625, -0.0899658203125, -0.070404052734375, -0.05084228515625, -0.031280517578125, -0.01171875, 0.007843017578125, 0.02740478515625, 0.046966552734375, 0.0665283203125, 0.086090087890625, 0.10565185546875, 0.125213623046875, 0.144775390625, 0.164337158203125, 0.18389892578125, 0.203460693359375, 0.2230224609375, 0.242584228515625, 0.26214599609375, 0.281707763671875, 0.30126953125, 0.320831298828125, 0.34039306640625, 0.359954833984375, 0.3795166015625, 0.399078369140625, 0.41864013671875, 0.438201904296875, 0.457763671875, 0.477325439453125, 0.49688720703125, 0.516448974609375, 0.5360107421875, 0.555572509765625, 0.57513427734375, 0.594696044921875, 0.6142578125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 8.0, 19.0, 16.0, 26.0, 32.0, 43.0, 47.0, 49.0, 64.0, 65.0, 69.0, 61.0, 71.0, 76.0, 62.0, 58.0, 49.0, 47.0, 18.0, 19.0, 19.0, 14.0, 17.0, 9.0, 11.0, 7.0, 4.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1294659823179245, -0.12472700327634811, -0.11998803168535233, -0.11524905264377594, -0.11051008105278015, -0.10577110201120377, -0.10103212296962738, -0.09629315137863159, -0.0915541723370552, -0.08681519329547882, -0.08207622170448303, -0.07733724266290665, -0.07259826362133026, -0.06785929203033447, -0.06312031298875809, -0.058381337672472, -0.05364236235618591, -0.048903387039899826, -0.04416441172361374, -0.039425432682037354, -0.034686457365751266, -0.02994748204946518, -0.025208504870533943, -0.020469527691602707, -0.01573055237531662, -0.010991576127707958, -0.006252599880099297, -0.001513623632490635, 0.0032253526151180267, 0.007964327931404114, 0.01270330511033535, 0.017442282289266586, 0.022181257605552673, 0.02692023292183876, 0.03165920823812485, 0.03639818727970123, 0.04113716259598732, 0.04587613791227341, 0.05061511695384979, 0.05535409227013588, 0.06009306758642197, 0.06483204662799835, 0.06957101821899414, 0.07430999726057053, 0.07904897630214691, 0.0837879478931427, 0.08852692693471909, 0.09326590597629547, 0.09800487756729126, 0.10274385660886765, 0.10748282819986343, 0.11222180724143982, 0.11696077883243561, 0.121699757874012, 0.12643873691558838, 0.13117770850658417, 0.13591668009757996, 0.14065565168857574, 0.14539463818073273, 0.15013360977172852, 0.1548725813627243, 0.1596115529537201, 0.16435053944587708, 0.16908951103687286, 0.17382849752902985]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 3.0, 4.0, 9.0, 13.0, 7.0, 13.0, 17.0, 18.0, 23.0, 28.0, 16.0, 26.0, 30.0, 32.0, 41.0, 33.0, 42.0, 44.0, 39.0, 41.0, 47.0, 33.0, 34.0, 42.0, 39.0, 43.0, 38.0, 36.0, 22.0, 26.0, 15.0, 17.0, 16.0, 20.0, 10.0, 11.0, 15.0, 10.0, 6.0, 9.0, 7.0, 8.0, 3.0, 0.0, 4.0], "bins": [-0.0986703634262085, -0.0961313396692276, -0.0935923159122467, -0.09105329215526581, -0.08851426839828491, -0.08597523719072342, -0.08343621343374252, -0.08089718967676163, -0.07835816591978073, -0.07581914216279984, -0.07328011840581894, -0.07074109464883804, -0.06820206344127655, -0.06566303968429565, -0.06312401592731476, -0.06058499217033386, -0.058045968413352966, -0.05550694465637207, -0.052967920899391174, -0.05042889341711998, -0.047889869660139084, -0.04535084590315819, -0.04281181842088699, -0.0402727946639061, -0.0377337709069252, -0.035194747149944305, -0.03265572339296341, -0.030116695910692215, -0.02757767215371132, -0.025038648396730423, -0.022499622777104378, -0.019960597157478333, -0.017421573400497437, -0.014882548712193966, -0.012343524023890495, -0.009804499335587025, -0.007265474647283554, -0.0047264499589800835, -0.002187425270676613, 0.0003516003489494324, 0.0028906241059303284, 0.005429648794233799, 0.00796867348253727, 0.01050769817084074, 0.01304672285914421, 0.015585747547447681, 0.018124772235751152, 0.020663797855377197, 0.023202821612358093, 0.02574184536933899, 0.028280870988965034, 0.03081989660859108, 0.033358920365571976, 0.03589794412255287, 0.038436971604824066, 0.04097599536180496, 0.04351501911878586, 0.046054042875766754, 0.04859306663274765, 0.051132094115018845, 0.05367111787199974, 0.05621014162898064, 0.05874916911125183, 0.06128819286823273, 0.06382721662521362]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 10.0, 13.0, 21.0, 12.0, 18.0, 19.0, 28.0, 25.0, 33.0, 30.0, 41.0, 38.0, 40.0, 53.0, 36.0, 32.0, 56.0, 39.0, 44.0, 38.0, 39.0, 42.0, 42.0, 34.0, 39.0, 24.0, 24.0, 13.0, 23.0, 18.0, 6.0, 12.0, 7.0, 12.0, 9.0, 5.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-110.0625, -106.8056640625, -103.548828125, -100.2919921875, -97.03515625, -93.7783203125, -90.521484375, -87.2646484375, -84.0078125, -80.7509765625, -77.494140625, -74.2373046875, -70.98046875, -67.7236328125, -64.466796875, -61.2099609375, -57.953125, -54.6962890625, -51.439453125, -48.1826171875, -44.92578125, -41.6689453125, -38.412109375, -35.1552734375, -31.8984375, -28.6416015625, -25.384765625, -22.1279296875, -18.87109375, -15.6142578125, -12.357421875, -9.1005859375, -5.84375, -2.5869140625, 0.669921875, 3.9267578125, 7.18359375, 10.4404296875, 13.697265625, 16.9541015625, 20.2109375, 23.4677734375, 26.724609375, 29.9814453125, 33.23828125, 36.4951171875, 39.751953125, 43.0087890625, 46.265625, 49.5224609375, 52.779296875, 56.0361328125, 59.29296875, 62.5498046875, 65.806640625, 69.0634765625, 72.3203125, 75.5771484375, 78.833984375, 82.0908203125, 85.34765625, 88.6044921875, 91.861328125, 95.1181640625, 98.375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 9.0, 6.0, 12.0, 19.0, 22.0, 21.0, 27.0, 29.0, 53.0, 60.0, 96.0, 140.0, 264.0, 604.0, 2139.0, 11399.0, 95916.0, 532565.0, 350692.0, 45918.0, 6133.0, 1324.0, 449.0, 217.0, 124.0, 65.0, 50.0, 40.0, 26.0, 24.0, 22.0, 19.0, 7.0, 13.0, 4.0, 10.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.375, -20.7431640625, -20.111328125, -19.4794921875, -18.84765625, -18.2158203125, -17.583984375, -16.9521484375, -16.3203125, -15.6884765625, -15.056640625, -14.4248046875, -13.79296875, -13.1611328125, -12.529296875, -11.8974609375, -11.265625, -10.6337890625, -10.001953125, -9.3701171875, -8.73828125, -8.1064453125, -7.474609375, -6.8427734375, -6.2109375, -5.5791015625, -4.947265625, -4.3154296875, -3.68359375, -3.0517578125, -2.419921875, -1.7880859375, -1.15625, -0.5244140625, 0.107421875, 0.7392578125, 1.37109375, 2.0029296875, 2.634765625, 3.2666015625, 3.8984375, 4.5302734375, 5.162109375, 5.7939453125, 6.42578125, 7.0576171875, 7.689453125, 8.3212890625, 8.953125, 9.5849609375, 10.216796875, 10.8486328125, 11.48046875, 12.1123046875, 12.744140625, 13.3759765625, 14.0078125, 14.6396484375, 15.271484375, 15.9033203125, 16.53515625, 17.1669921875, 17.798828125, 18.4306640625, 19.0625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 12.0, 14.0, 18.0, 21.0, 22.0, 15.0, 33.0, 27.0, 42.0, 45.0, 55.0, 60.0, 51.0, 101.0, 2070.0, 62.0, 43.0, 50.0, 42.0, 32.0, 40.0, 39.0, 29.0, 24.0, 19.0, 13.0, 7.0, 8.0, 19.0, 11.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-189.625, -184.5234375, -179.421875, -174.3203125, -169.21875, -164.1171875, -159.015625, -153.9140625, -148.8125, -143.7109375, -138.609375, -133.5078125, -128.40625, -123.3046875, -118.203125, -113.1015625, -108.0, -102.8984375, -97.796875, -92.6953125, -87.59375, -82.4921875, -77.390625, -72.2890625, -67.1875, -62.0859375, -56.984375, -51.8828125, -46.78125, -41.6796875, -36.578125, -31.4765625, -26.375, -21.2734375, -16.171875, -11.0703125, -5.96875, -0.8671875, 4.234375, 9.3359375, 14.4375, 19.5390625, 24.640625, 29.7421875, 34.84375, 39.9453125, 45.046875, 50.1484375, 55.25, 60.3515625, 65.453125, 70.5546875, 75.65625, 80.7578125, 85.859375, 90.9609375, 96.0625, 101.1640625, 106.265625, 111.3671875, 116.46875, 121.5703125, 126.671875, 131.7734375, 136.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 12.0, 17.0, 34.0, 46.0, 47.0, 85.0, 119.0, 214.0, 284.0, 526.0, 933.0, 2214.0, 7413.0, 69830.0, 2695338.0, 334703.0, 26213.0, 4230.0, 1517.0, 744.0, 408.0, 276.0, 169.0, 115.0, 62.0, 50.0, 31.0, 16.0, 13.0, 5.0, 5.0, 10.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.14306640625, -19.4892578125, -18.83544921875, -18.181640625, -17.52783203125, -16.8740234375, -16.22021484375, -15.56640625, -14.91259765625, -14.2587890625, -13.60498046875, -12.951171875, -12.29736328125, -11.6435546875, -10.98974609375, -10.3359375, -9.68212890625, -9.0283203125, -8.37451171875, -7.720703125, -7.06689453125, -6.4130859375, -5.75927734375, -5.10546875, -4.45166015625, -3.7978515625, -3.14404296875, -2.490234375, -1.83642578125, -1.1826171875, -0.52880859375, 0.125, 0.77880859375, 1.4326171875, 2.08642578125, 2.740234375, 3.39404296875, 4.0478515625, 4.70166015625, 5.35546875, 6.00927734375, 6.6630859375, 7.31689453125, 7.970703125, 8.62451171875, 9.2783203125, 9.93212890625, 10.5859375, 11.23974609375, 11.8935546875, 12.54736328125, 13.201171875, 13.85498046875, 14.5087890625, 15.16259765625, 15.81640625, 16.47021484375, 17.1240234375, 17.77783203125, 18.431640625, 19.08544921875, 19.7392578125, 20.39306640625, 21.046875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 14.0, 13.0, 20.0, 27.0, 35.0, 63.0, 109.0, 113.0, 142.0, 121.0, 126.0, 72.0, 42.0, 24.0, 26.0, 11.0, 7.0, 4.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-230.87667846679688, -224.71714782714844, -218.5576171875, -212.3980712890625, -206.23854064941406, -200.07901000976562, -193.91946411132812, -187.7599334716797, -181.60040283203125, -175.4408721923828, -169.28134155273438, -163.12179565429688, -156.96226501464844, -150.802734375, -144.6431884765625, -138.48365783691406, -132.32412719726562, -126.16459655761719, -120.00505828857422, -113.84552001953125, -107.68598937988281, -101.52645874023438, -95.3669204711914, -89.20738220214844, -83.0478515625, -76.88832092285156, -70.7287826538086, -64.56924438476562, -58.40971374511719, -52.250179290771484, -46.09064483642578, -39.93111038208008, -33.771575927734375, -27.612041473388672, -21.45250701904297, -15.292972564697266, -9.133438110351562, -2.9739036560058594, 3.1856307983398438, 9.345165252685547, 15.50469970703125, 21.664234161376953, 27.823768615722656, 33.98330307006836, 40.14283752441406, 46.302371978759766, 52.46190643310547, 58.62144088745117, 64.78097534179688, 70.94050598144531, 77.10004425048828, 83.25958251953125, 89.41911315917969, 95.57864379882812, 101.7381820678711, 107.89772033691406, 114.0572509765625, 120.21678161621094, 126.3763198852539, 132.53585815429688, 138.6953887939453, 144.85491943359375, 151.01446533203125, 157.1739959716797, 163.33352661132812]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 1.0, 10.0, 14.0, 8.0, 12.0, 14.0, 22.0, 13.0, 31.0, 29.0, 29.0, 46.0, 41.0, 44.0, 51.0, 40.0, 42.0, 38.0, 57.0, 50.0, 34.0, 44.0, 39.0, 32.0, 37.0, 42.0, 32.0, 28.0, 25.0, 23.0, 11.0, 9.0, 10.0, 12.0, 7.0, 5.0, 7.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-219.067626953125, -212.6111602783203, -206.1547088623047, -199.6982421875, -193.24179077148438, -186.7853240966797, -180.32887268066406, -173.87240600585938, -167.41595458984375, -160.95948791503906, -154.50303649902344, -148.04656982421875, -141.59011840820312, -135.13365173339844, -128.6772003173828, -122.22073364257812, -115.76427459716797, -109.30781555175781, -102.85135650634766, -96.3948974609375, -89.93843841552734, -83.48197937011719, -77.0255126953125, -70.56906127929688, -64.11259460449219, -57.65613555908203, -51.199676513671875, -44.74321746826172, -38.28675842285156, -31.83029556274414, -25.373836517333984, -18.917377471923828, -12.460922241210938, -6.004462718963623, 0.4519968032836914, 6.908456802368164, 13.36491584777832, 19.82137680053711, 26.277835845947266, 32.73429489135742, 39.19075393676758, 45.647212982177734, 52.10367202758789, 58.56013488769531, 65.01659393310547, 71.47305297851562, 77.92951202392578, 84.38597106933594, 90.8424301147461, 97.29888916015625, 103.7553482055664, 110.21180725097656, 116.66826629638672, 123.12472534179688, 129.58119201660156, 136.0376434326172, 142.49411010742188, 148.95057678222656, 155.4070281982422, 161.86349487304688, 168.3199462890625, 174.7764129638672, 181.2328643798828, 187.6893310546875, 194.14578247070312]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 9.0, 4.0, 8.0, 10.0, 17.0, 31.0, 21.0, 56.0, 63.0, 74.0, 126.0, 176.0, 256.0, 368.0, 482.0, 647.0, 847.0, 1212.0, 1916.0, 2570.0, 3698.0, 5105.0, 1006064.0, 7723.0, 5004.0, 3614.0, 2476.0, 1709.0, 1217.0, 813.0, 653.0, 403.0, 340.0, 235.0, 155.0, 122.0, 74.0, 56.0, 58.0, 34.0, 32.0, 13.0, 21.0, 15.0, 7.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0], "bins": [-33.72859191894531, -32.76339340209961, -31.79819679260254, -30.832998275756836, -29.867801666259766, -28.902603149414062, -27.93740463256836, -26.972206115722656, -26.007009506225586, -25.041810989379883, -24.076614379882812, -23.11141586303711, -22.146217346191406, -21.181020736694336, -20.215822219848633, -19.250625610351562, -18.28542709350586, -17.320228576660156, -16.355031967163086, -15.389833450317383, -14.424635887145996, -13.45943832397461, -12.494239807128906, -11.52904224395752, -10.563844680786133, -9.598647117614746, -8.63344955444336, -7.668251037597656, -6.7030534744262695, -5.737855911254883, -4.772657871246338, -3.807459831237793, -2.8422622680664062, -1.8770644664764404, -0.9118666648864746, 0.05333113670349121, 1.018528938293457, 1.9837265014648438, 2.9489245414733887, 3.9141225814819336, 4.87932014465332, 5.844517707824707, 6.809715747833252, 7.774913787841797, 8.740111351013184, 9.70530891418457, 10.670507431030273, 11.63570499420166, 12.600902557373047, 13.566100120544434, 14.53129768371582, 15.496496200561523, 16.461692810058594, 17.426891326904297, 18.39208984375, 19.357288360595703, 20.322484970092773, 21.287683486938477, 22.252880096435547, 23.21807861328125, 24.183277130126953, 25.148473739624023, 26.113672256469727, 27.078868865966797, 28.0440673828125]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 6.0, 11.0, 17.0, 15.0, 39.0, 39.0, 59.0, 102.0, 287.0, 64026.0, 51398048.0, 331.0, 77.0, 40.0, 31.0, 18.0, 11.0, 10.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2062.07421875, -1999.68798828125, -1937.3016357421875, -1874.915283203125, -1812.529052734375, -1750.142822265625, -1687.7564697265625, -1625.3701171875, -1562.98388671875, -1500.59765625, -1438.2113037109375, -1375.824951171875, -1313.438720703125, -1251.052490234375, -1188.6661376953125, -1126.27978515625, -1063.8935546875, -1001.5072631835938, -939.1209716796875, -876.7346801757812, -814.348388671875, -751.9620971679688, -689.5758056640625, -627.1895141601562, -564.80322265625, -502.41693115234375, -440.0306396484375, -377.64434814453125, -315.258056640625, -252.87176513671875, -190.4854736328125, -128.09918212890625, -65.712890625, -3.32659912109375, 59.0596923828125, 121.44598388671875, 183.832275390625, 246.21856689453125, 308.6048583984375, 370.99114990234375, 433.37744140625, 495.76373291015625, 558.1500244140625, 620.5363159179688, 682.922607421875, 745.3088989257812, 807.6951904296875, 870.0814819335938, 932.4677734375, 994.8540649414062, 1057.2403564453125, 1119.626708984375, 1182.012939453125, 1244.399169921875, 1306.7855224609375, 1369.171875, 1431.55810546875, 1493.9443359375, 1556.3306884765625, 1618.717041015625, 1681.103271484375, 1743.489501953125, 1805.8758544921875, 1868.26220703125, 1930.6484375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 6.0, 22.0, 39.0, 81.0, 169.0, 253.0, 194.0, 100.0, 46.0, 28.0, 17.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.88494873046875, -108.74992370605469, -105.61489868164062, -102.47987365722656, -99.34484100341797, -96.2098159790039, -93.07479095458984, -89.93976593017578, -86.80474090576172, -83.66971588134766, -80.5346908569336, -77.399658203125, -74.26463317871094, -71.12960815429688, -67.99458312988281, -64.85955810546875, -61.72452926635742, -58.58950424194336, -55.45447540283203, -52.31945037841797, -49.184425354003906, -46.049400329589844, -42.914371490478516, -39.77934646606445, -36.644317626953125, -33.50929260253906, -30.374265670776367, -27.239238739013672, -24.10421371459961, -20.969186782836914, -17.83415985107422, -14.699134826660156, -11.564109802246094, -8.429083824157715, -5.294057369232178, -2.1590309143066406, 0.9759950637817383, 4.111021041870117, 7.2460479736328125, 10.381072998046875, 13.51609992980957, 16.651126861572266, 19.786151885986328, 22.921178817749023, 26.05620574951172, 29.19123077392578, 32.326255798339844, 35.461280822753906, 38.596309661865234, 41.7313346862793, 44.866363525390625, 48.00138854980469, 51.13641357421875, 54.27143859863281, 57.40646743774414, 60.5414924621582, 63.67652130126953, 66.8115463256836, 69.94657135009766, 73.08160400390625, 76.21662902832031, 79.35165405273438, 82.48667907714844, 85.6217041015625, 88.75672912597656]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 1.0, 5.0, 9.0, 7.0, 5.0, 12.0, 19.0, 24.0, 30.0, 41.0, 56.0, 58.0, 83.0, 88.0, 64.0, 86.0, 82.0, 65.0, 57.0, 47.0, 27.0, 28.0, 18.0, 17.0, 16.0, 11.0, 7.0, 5.0, 6.0, 3.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.47213745117188, -92.94001007080078, -89.40788269042969, -85.87574768066406, -82.34362030029297, -78.81149291992188, -75.27936553955078, -71.74723815917969, -68.21510314941406, -64.68297576904297, -61.15084457397461, -57.618717193603516, -54.086585998535156, -50.55445861816406, -47.02233123779297, -43.49020004272461, -39.958072662353516, -36.42594528198242, -32.89381408691406, -29.36168670654297, -25.82955551147461, -22.297428131103516, -18.76529884338379, -15.233169555664062, -11.701040267944336, -8.16891098022461, -4.636782169342041, -1.1046533584594727, 2.427475929260254, 5.959604263305664, 9.49173355102539, 13.023862838745117, 16.555992126464844, 20.08812141418457, 23.620250701904297, 27.15237808227539, 30.68450927734375, 34.216636657714844, 37.74876403808594, 41.2808952331543, 44.813026428222656, 48.34515380859375, 51.87728500366211, 55.4094123840332, 58.94154357910156, 62.473670959472656, 66.00579833984375, 69.53793334960938, 73.07005310058594, 76.60218048095703, 80.13430786132812, 83.66644287109375, 87.19857025146484, 90.73069763183594, 94.26282501220703, 97.79495239257812, 101.32708740234375, 104.85921478271484, 108.39134216308594, 111.92347717285156, 115.45560455322266, 118.98773193359375, 122.51985931396484, 126.05198669433594, 129.58412170410156]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 2.0, 12.0, 10.0, 15.0, 18.0, 18.0, 20.0, 27.0, 33.0, 33.0, 65.0, 78.0, 116.0, 168.0, 207.0, 348.0, 509.0, 816.0, 1497.0, 2716.0, 6039.0, 16112.0, 73541.0, 4002815.0, 62293.0, 14561.0, 5709.0, 2633.0, 1437.0, 844.0, 456.0, 323.0, 233.0, 147.0, 108.0, 77.0, 51.0, 40.0, 24.0, 30.0, 17.0, 20.0, 20.0, 11.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.8671875, -1.8114013671875, -1.755615234375, -1.6998291015625, -1.64404296875, -1.5882568359375, -1.532470703125, -1.4766845703125, -1.4208984375, -1.3651123046875, -1.309326171875, -1.2535400390625, -1.19775390625, -1.1419677734375, -1.086181640625, -1.0303955078125, -0.974609375, -0.9188232421875, -0.863037109375, -0.8072509765625, -0.75146484375, -0.6956787109375, -0.639892578125, -0.5841064453125, -0.5283203125, -0.4725341796875, -0.416748046875, -0.3609619140625, -0.30517578125, -0.2493896484375, -0.193603515625, -0.1378173828125, -0.08203125, -0.0262451171875, 0.029541015625, 0.0853271484375, 0.14111328125, 0.1968994140625, 0.252685546875, 0.3084716796875, 0.3642578125, 0.4200439453125, 0.475830078125, 0.5316162109375, 0.58740234375, 0.6431884765625, 0.698974609375, 0.7547607421875, 0.810546875, 0.8663330078125, 0.922119140625, 0.9779052734375, 1.03369140625, 1.0894775390625, 1.145263671875, 1.2010498046875, 1.2568359375, 1.3126220703125, 1.368408203125, 1.4241943359375, 1.47998046875, 1.5357666015625, 1.591552734375, 1.6473388671875, 1.703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 4.0, 6.0, 7.0, 12.0, 13.0, 16.0, 12.0, 25.0, 767.0, 29.0, 17.0, 6.0, 6.0, 9.0, 7.0, 6.0, 3.0, 9.0, 6.0, 3.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6494140625, -0.628204345703125, -0.60699462890625, -0.585784912109375, -0.5645751953125, -0.543365478515625, -0.52215576171875, -0.500946044921875, -0.479736328125, -0.458526611328125, -0.43731689453125, -0.416107177734375, -0.3948974609375, -0.373687744140625, -0.35247802734375, -0.331268310546875, -0.31005859375, -0.288848876953125, -0.26763916015625, -0.246429443359375, -0.2252197265625, -0.204010009765625, -0.18280029296875, -0.161590576171875, -0.140380859375, -0.119171142578125, -0.09796142578125, -0.076751708984375, -0.0555419921875, -0.034332275390625, -0.01312255859375, 0.008087158203125, 0.029296875, 0.050506591796875, 0.07171630859375, 0.092926025390625, 0.1141357421875, 0.135345458984375, 0.15655517578125, 0.177764892578125, 0.198974609375, 0.220184326171875, 0.24139404296875, 0.262603759765625, 0.2838134765625, 0.305023193359375, 0.32623291015625, 0.347442626953125, 0.36865234375, 0.389862060546875, 0.41107177734375, 0.432281494140625, 0.4534912109375, 0.474700927734375, 0.49591064453125, 0.517120361328125, 0.538330078125, 0.559539794921875, 0.58074951171875, 0.601959228515625, 0.6231689453125, 0.644378662109375, 0.66558837890625, 0.686798095703125, 0.7080078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 10.0, 19.0, 24.0, 26.0, 47.0, 57.0, 76.0, 146.0, 226.0, 374.0, 722.0, 1280.0, 2437.0, 5466.0, 13229.0, 38534.0, 161037.0, 3154451.0, 689442.0, 85527.0, 24421.0, 9016.0, 3721.0, 1791.0, 909.0, 527.0, 255.0, 155.0, 118.0, 88.0, 52.0, 30.0, 19.0, 16.0, 5.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0], "bins": [-1.109375, -1.0815048217773438, -1.0536346435546875, -1.0257644653320312, -0.997894287109375, -0.9700241088867188, -0.9421539306640625, -0.9142837524414062, -0.88641357421875, -0.8585433959960938, -0.8306732177734375, -0.8028030395507812, -0.774932861328125, -0.7470626831054688, -0.7191925048828125, -0.6913223266601562, -0.6634521484375, -0.6355819702148438, -0.6077117919921875, -0.5798416137695312, -0.551971435546875, -0.5241012573242188, -0.4962310791015625, -0.46836090087890625, -0.44049072265625, -0.41262054443359375, -0.3847503662109375, -0.35688018798828125, -0.329010009765625, -0.30113983154296875, -0.2732696533203125, -0.24539947509765625, -0.217529296875, -0.18965911865234375, -0.1617889404296875, -0.13391876220703125, -0.106048583984375, -0.07817840576171875, -0.0503082275390625, -0.02243804931640625, 0.00543212890625, 0.03330230712890625, 0.0611724853515625, 0.08904266357421875, 0.116912841796875, 0.14478302001953125, 0.1726531982421875, 0.20052337646484375, 0.2283935546875, 0.25626373291015625, 0.2841339111328125, 0.31200408935546875, 0.339874267578125, 0.36774444580078125, 0.3956146240234375, 0.42348480224609375, 0.45135498046875, 0.47922515869140625, 0.5070953369140625, 0.5349655151367188, 0.562835693359375, 0.5907058715820312, 0.6185760498046875, 0.6464462280273438, 0.67431640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 7.0, 12.0, 22.0, 23.0, 31.0, 41.0, 53.0, 91.0, 121.0, 222.0, 547.0, 1590.0, 590.0, 243.0, 151.0, 91.0, 58.0, 40.0, 37.0, 19.0, 15.0, 15.0, 7.0, 9.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.492431640625, -0.4781837463378906, -0.46393585205078125, -0.4496879577636719, -0.4354400634765625, -0.4211921691894531, -0.40694427490234375, -0.3926963806152344, -0.378448486328125, -0.3642005920410156, -0.34995269775390625, -0.3357048034667969, -0.3214569091796875, -0.3072090148925781, -0.29296112060546875, -0.2787132263183594, -0.26446533203125, -0.2502174377441406, -0.23596954345703125, -0.22172164916992188, -0.2074737548828125, -0.19322586059570312, -0.17897796630859375, -0.16473007202148438, -0.150482177734375, -0.13623428344726562, -0.12198638916015625, -0.10773849487304688, -0.0934906005859375, -0.07924270629882812, -0.06499481201171875, -0.050746917724609375, -0.0364990234375, -0.022251129150390625, -0.00800323486328125, 0.006244659423828125, 0.0204925537109375, 0.034740447998046875, 0.04898834228515625, 0.06323623657226562, 0.077484130859375, 0.09173202514648438, 0.10597991943359375, 0.12022781372070312, 0.1344757080078125, 0.14872360229492188, 0.16297149658203125, 0.17721939086914062, 0.19146728515625, 0.20571517944335938, 0.21996307373046875, 0.23421096801757812, 0.2484588623046875, 0.2627067565917969, 0.27695465087890625, 0.2912025451660156, 0.305450439453125, 0.3196983337402344, 0.33394622802734375, 0.3481941223144531, 0.3624420166015625, 0.3766899108886719, 0.39093780517578125, 0.4051856994628906, 0.41943359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 17.0, 142.0, 687.0, 144.0, 18.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.129505634307861, -4.852033615112305, -4.57456111907959, -4.297088623046875, -4.019616603851318, -3.7421443462371826, -3.464672088623047, -3.187199831008911, -2.9097275733947754, -2.6322553157806396, -2.354783058166504, -2.077310800552368, -1.7998385429382324, -1.5223662853240967, -1.244894027709961, -0.9674217700958252, -0.6899495124816895, -0.4124772548675537, -0.13500499725341797, 0.14246726036071777, 0.4199395179748535, 0.6974117755889893, 0.974884033203125, 1.2523562908172607, 1.5298285484313965, 1.8073008060455322, 2.084773063659668, 2.3622453212738037, 2.6397175788879395, 2.917189836502075, 3.194662094116211, 3.4721343517303467, 3.749606132507324, 4.027078628540039, 4.304550647735596, 4.582022666931152, 4.859495162963867, 5.136967658996582, 5.414439678192139, 5.691911697387695, 5.96938419342041, 6.246856689453125, 6.524328708648682, 6.801800727844238, 7.079273223876953, 7.356745719909668, 7.634217739105225, 7.911689758300781, 8.189162254333496, 8.466634750366211, 8.74410629272461, 9.021578788757324, 9.299051284790039, 9.576523780822754, 9.853996276855469, 10.131467819213867, 10.408940315246582, 10.686412811279297, 10.963884353637695, 11.24135684967041, 11.518829345703125, 11.79630184173584, 12.073774337768555, 12.351245880126953, 12.628718376159668]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 5.0, 13.0, 8.0, 10.0, 24.0, 17.0, 24.0, 32.0, 37.0, 46.0, 47.0, 68.0, 63.0, 68.0, 65.0, 58.0, 79.0, 51.0, 58.0, 40.0, 31.0, 30.0, 27.0, 23.0, 22.0, 10.0, 13.0, 9.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1734901666641235, -1.1189178228378296, -1.0643454790115356, -1.0097731351852417, -0.9552008509635925, -0.9006285071372986, -0.8460562229156494, -0.7914838790893555, -0.7369115352630615, -0.6823391914367676, -0.6277668476104736, -0.5731945633888245, -0.5186222195625305, -0.4640498757362366, -0.409477561712265, -0.35490524768829346, -0.3003329038619995, -0.24576057493686676, -0.191188246011734, -0.13661591708660126, -0.0820435881614685, -0.02747124433517456, 0.027101069688796997, 0.08167338371276855, 0.1362457275390625, 0.19081805646419525, 0.245390385389328, 0.29996269941329956, 0.3545350432395935, 0.40910738706588745, 0.463679701089859, 0.5182520151138306, 0.5728244781494141, 0.627396821975708, 0.681969165802002, 0.7365414500236511, 0.7911137938499451, 0.845686137676239, 0.9002584218978882, 0.9548307657241821, 1.009403109550476, 1.06397545337677, 1.118547797203064, 1.173120141029358, 1.2276923656463623, 1.2822647094726562, 1.3368370532989502, 1.3914093971252441, 1.445981740951538, 1.500554084777832, 1.555126428604126, 1.60969877243042, 1.6642711162567139, 1.7188434600830078, 1.7734156847000122, 1.8279880285263062, 1.8825603723526, 1.937132716178894, 1.991705060005188, 2.0462772846221924, 2.1008496284484863, 2.1554219722747803, 2.209994316101074, 2.264566659927368, 2.319139003753662]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 10.0, 11.0, 7.0, 11.0, 23.0, 32.0, 40.0, 60.0, 91.0, 110.0, 151.0, 228.0, 352.0, 439.0, 748.0, 1030.0, 1592.0, 2460.0, 3627.0, 5864.0, 9544.0, 16538.0, 29240.0, 134620.0, 759137.0, 33485.0, 18934.0, 11092.0, 6652.0, 4229.0, 2742.0, 1767.0, 1166.0, 736.0, 486.0, 370.0, 271.0, 192.0, 148.0, 87.0, 62.0, 47.0, 26.0, 27.0, 17.0, 12.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.5771484375, -1.5247955322265625, -1.472442626953125, -1.4200897216796875, -1.36773681640625, -1.3153839111328125, -1.263031005859375, -1.2106781005859375, -1.1583251953125, -1.1059722900390625, -1.053619384765625, -1.0012664794921875, -0.94891357421875, -0.8965606689453125, -0.844207763671875, -0.7918548583984375, -0.739501953125, -0.6871490478515625, -0.634796142578125, -0.5824432373046875, -0.53009033203125, -0.4777374267578125, -0.425384521484375, -0.3730316162109375, -0.3206787109375, -0.2683258056640625, -0.215972900390625, -0.1636199951171875, -0.11126708984375, -0.0589141845703125, -0.006561279296875, 0.0457916259765625, 0.09814453125, 0.1504974365234375, 0.202850341796875, 0.2552032470703125, 0.30755615234375, 0.3599090576171875, 0.412261962890625, 0.4646148681640625, 0.5169677734375, 0.5693206787109375, 0.621673583984375, 0.6740264892578125, 0.72637939453125, 0.7787322998046875, 0.831085205078125, 0.8834381103515625, 0.935791015625, 0.9881439208984375, 1.040496826171875, 1.0928497314453125, 1.14520263671875, 1.1975555419921875, 1.249908447265625, 1.3022613525390625, 1.3546142578125, 1.4069671630859375, 1.459320068359375, 1.5116729736328125, 1.56402587890625, 1.6163787841796875, 1.668731689453125, 1.7210845947265625, 1.7734375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 4.0, 7.0, 11.0, 15.0, 13.0, 13.0, 21.0, 334.0, 469.0, 12.0, 8.0, 10.0, 3.0, 9.0, 10.0, 4.0, 4.0, 6.0, 6.0, 3.0, 12.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.650390625, -0.6294174194335938, -0.6084442138671875, -0.5874710083007812, -0.566497802734375, -0.5455245971679688, -0.5245513916015625, -0.5035781860351562, -0.48260498046875, -0.46163177490234375, -0.4406585693359375, -0.41968536376953125, -0.398712158203125, -0.37773895263671875, -0.3567657470703125, -0.33579254150390625, -0.3148193359375, -0.29384613037109375, -0.2728729248046875, -0.25189971923828125, -0.230926513671875, -0.20995330810546875, -0.1889801025390625, -0.16800689697265625, -0.14703369140625, -0.12606048583984375, -0.1050872802734375, -0.08411407470703125, -0.063140869140625, -0.04216766357421875, -0.0211944580078125, -0.00022125244140625, 0.020751953125, 0.04172515869140625, 0.0626983642578125, 0.08367156982421875, 0.104644775390625, 0.12561798095703125, 0.1465911865234375, 0.16756439208984375, 0.18853759765625, 0.20951080322265625, 0.2304840087890625, 0.25145721435546875, 0.272430419921875, 0.29340362548828125, 0.3143768310546875, 0.33535003662109375, 0.3563232421875, 0.37729644775390625, 0.3982696533203125, 0.41924285888671875, 0.440216064453125, 0.46118927001953125, 0.4821624755859375, 0.5031356811523438, 0.52410888671875, 0.5450820922851562, 0.5660552978515625, 0.5870285034179688, 0.608001708984375, 0.6289749145507812, 0.6499481201171875, 0.6709213256835938, 0.69189453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 13.0, 10.0, 14.0, 20.0, 27.0, 35.0, 59.0, 89.0, 124.0, 202.0, 343.0, 540.0, 966.0, 1827.0, 3751.0, 8372.0, 20830.0, 67603.0, 270417.0, 466108.0, 143627.0, 38546.0, 13275.0, 5655.0, 2698.0, 1400.0, 782.0, 451.0, 284.0, 163.0, 104.0, 65.0, 42.0, 36.0, 22.0, 20.0, 8.0, 9.0, 8.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.943359375, -1.8912200927734375, -1.839080810546875, -1.7869415283203125, -1.73480224609375, -1.6826629638671875, -1.630523681640625, -1.5783843994140625, -1.5262451171875, -1.4741058349609375, -1.421966552734375, -1.3698272705078125, -1.31768798828125, -1.2655487060546875, -1.213409423828125, -1.1612701416015625, -1.109130859375, -1.0569915771484375, -1.004852294921875, -0.9527130126953125, -0.90057373046875, -0.8484344482421875, -0.796295166015625, -0.7441558837890625, -0.6920166015625, -0.6398773193359375, -0.587738037109375, -0.5355987548828125, -0.48345947265625, -0.4313201904296875, -0.379180908203125, -0.3270416259765625, -0.27490234375, -0.2227630615234375, -0.170623779296875, -0.1184844970703125, -0.06634521484375, -0.0142059326171875, 0.037933349609375, 0.0900726318359375, 0.1422119140625, 0.1943511962890625, 0.246490478515625, 0.2986297607421875, 0.35076904296875, 0.4029083251953125, 0.455047607421875, 0.5071868896484375, 0.559326171875, 0.6114654541015625, 0.663604736328125, 0.7157440185546875, 0.76788330078125, 0.8200225830078125, 0.872161865234375, 0.9243011474609375, 0.9764404296875, 1.0285797119140625, 1.080718994140625, 1.1328582763671875, 1.18499755859375, 1.2371368408203125, 1.289276123046875, 1.3414154052734375, 1.3935546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 15.0, 9.0, 15.0, 17.0, 18.0, 17.0, 25.0, 19.0, 22.0, 33.0, 35.0, 33.0, 27.0, 32.0, 46.0, 35.0, 41.0, 38.0, 33.0, 45.0, 40.0, 36.0, 40.0, 43.0, 33.0, 30.0, 27.0, 23.0, 23.0, 18.0, 22.0, 13.0, 11.0, 16.0, 12.0, 7.0, 7.0, 8.0, 5.0, 7.0, 2.0, 4.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.912109375, -1.8547210693359375, -1.797332763671875, -1.7399444580078125, -1.68255615234375, -1.6251678466796875, -1.567779541015625, -1.5103912353515625, -1.4530029296875, -1.3956146240234375, -1.338226318359375, -1.2808380126953125, -1.22344970703125, -1.1660614013671875, -1.108673095703125, -1.0512847900390625, -0.993896484375, -0.9365081787109375, -0.879119873046875, -0.8217315673828125, -0.76434326171875, -0.7069549560546875, -0.649566650390625, -0.5921783447265625, -0.5347900390625, -0.4774017333984375, -0.420013427734375, -0.3626251220703125, -0.30523681640625, -0.2478485107421875, -0.190460205078125, -0.1330718994140625, -0.07568359375, -0.0182952880859375, 0.039093017578125, 0.0964813232421875, 0.15386962890625, 0.2112579345703125, 0.268646240234375, 0.3260345458984375, 0.3834228515625, 0.4408111572265625, 0.498199462890625, 0.5555877685546875, 0.61297607421875, 0.6703643798828125, 0.727752685546875, 0.7851409912109375, 0.842529296875, 0.8999176025390625, 0.957305908203125, 1.0146942138671875, 1.07208251953125, 1.1294708251953125, 1.186859130859375, 1.2442474365234375, 1.3016357421875, 1.3590240478515625, 1.416412353515625, 1.4738006591796875, 1.53118896484375, 1.5885772705078125, 1.645965576171875, 1.7033538818359375, 1.7607421875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 3.0, 4.0, 3.0, 9.0, 8.0, 6.0, 14.0, 17.0, 25.0, 58.0, 81.0, 143.0, 268.0, 603.0, 1577.0, 5515.0, 47985.0, 959031.0, 26725.0, 4135.0, 1281.0, 516.0, 205.0, 117.0, 85.0, 40.0, 21.0, 19.0, 17.0, 16.0, 9.0, 8.0, 2.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.54296875, -7.29486083984375, -7.0467529296875, -6.79864501953125, -6.550537109375, -6.30242919921875, -6.0543212890625, -5.80621337890625, -5.55810546875, -5.30999755859375, -5.0618896484375, -4.81378173828125, -4.565673828125, -4.31756591796875, -4.0694580078125, -3.82135009765625, -3.5732421875, -3.32513427734375, -3.0770263671875, -2.82891845703125, -2.580810546875, -2.33270263671875, -2.0845947265625, -1.83648681640625, -1.58837890625, -1.34027099609375, -1.0921630859375, -0.84405517578125, -0.595947265625, -0.34783935546875, -0.0997314453125, 0.14837646484375, 0.396484375, 0.64459228515625, 0.8927001953125, 1.14080810546875, 1.388916015625, 1.63702392578125, 1.8851318359375, 2.13323974609375, 2.38134765625, 2.62945556640625, 2.8775634765625, 3.12567138671875, 3.373779296875, 3.62188720703125, 3.8699951171875, 4.11810302734375, 4.3662109375, 4.61431884765625, 4.8624267578125, 5.11053466796875, 5.358642578125, 5.60675048828125, 5.8548583984375, 6.10296630859375, 6.35107421875, 6.59918212890625, 6.8472900390625, 7.09539794921875, 7.343505859375, 7.59161376953125, 7.8397216796875, 8.08782958984375, 8.3359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 11.0, 15.0, 19.0, 25.0, 59.0, 126.0, 255.0, 225.0, 124.0, 54.0, 27.0, 23.0, 15.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019621849060058594, -0.00018835067749023438, -0.0001804828643798828, -0.00017261505126953125, -0.0001647472381591797, -0.00015687942504882812, -0.00014901161193847656, -0.000141143798828125, -0.00013327598571777344, -0.00012540817260742188, -0.00011754035949707031, -0.00010967254638671875, -0.00010180473327636719, -9.393692016601562e-05, -8.606910705566406e-05, -7.82012939453125e-05, -7.033348083496094e-05, -6.246566772460938e-05, -5.459785461425781e-05, -4.673004150390625e-05, -3.886222839355469e-05, -3.0994415283203125e-05, -2.3126602172851562e-05, -1.52587890625e-05, -7.3909759521484375e-06, 4.76837158203125e-07, 8.344650268554688e-06, 1.621246337890625e-05, 2.4080276489257812e-05, 3.1948089599609375e-05, 3.981590270996094e-05, 4.76837158203125e-05, 5.555152893066406e-05, 6.341934204101562e-05, 7.128715515136719e-05, 7.915496826171875e-05, 8.702278137207031e-05, 9.489059448242188e-05, 0.00010275840759277344, 0.000110626220703125, 0.00011849403381347656, 0.00012636184692382812, 0.0001342296600341797, 0.00014209747314453125, 0.0001499652862548828, 0.00015783309936523438, 0.00016570091247558594, 0.0001735687255859375, 0.00018143653869628906, 0.00018930435180664062, 0.0001971721649169922, 0.00020503997802734375, 0.0002129077911376953, 0.00022077560424804688, 0.00022864341735839844, 0.00023651123046875, 0.00024437904357910156, 0.0002522468566894531, 0.0002601146697998047, 0.00026798248291015625, 0.0002758502960205078, 0.0002837181091308594, 0.00029158592224121094, 0.0002994537353515625, 0.00030732154846191406]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 11.0, 12.0, 17.0, 28.0, 62.0, 82.0, 128.0, 236.0, 470.0, 877.0, 2038.0, 5382.0, 18027.0, 108406.0, 792638.0, 94824.0, 16582.0, 4856.0, 1916.0, 890.0, 449.0, 231.0, 131.0, 86.0, 48.0, 39.0, 25.0, 11.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.859375, -2.765533447265625, -2.67169189453125, -2.577850341796875, -2.4840087890625, -2.390167236328125, -2.29632568359375, -2.202484130859375, -2.108642578125, -2.014801025390625, -1.92095947265625, -1.827117919921875, -1.7332763671875, -1.639434814453125, -1.54559326171875, -1.451751708984375, -1.35791015625, -1.264068603515625, -1.17022705078125, -1.076385498046875, -0.9825439453125, -0.888702392578125, -0.79486083984375, -0.701019287109375, -0.607177734375, -0.513336181640625, -0.41949462890625, -0.325653076171875, -0.2318115234375, -0.137969970703125, -0.04412841796875, 0.049713134765625, 0.1435546875, 0.237396240234375, 0.33123779296875, 0.425079345703125, 0.5189208984375, 0.612762451171875, 0.70660400390625, 0.800445556640625, 0.894287109375, 0.988128662109375, 1.08197021484375, 1.175811767578125, 1.2696533203125, 1.363494873046875, 1.45733642578125, 1.551177978515625, 1.64501953125, 1.738861083984375, 1.83270263671875, 1.926544189453125, 2.0203857421875, 2.114227294921875, 2.20806884765625, 2.301910400390625, 2.395751953125, 2.489593505859375, 2.58343505859375, 2.677276611328125, 2.7711181640625, 2.864959716796875, 2.95880126953125, 3.052642822265625, 3.146484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 12.0, 14.0, 11.0, 19.0, 22.0, 21.0, 32.0, 59.0, 85.0, 86.0, 119.0, 106.0, 108.0, 59.0, 55.0, 38.0, 25.0, 20.0, 17.0, 17.0, 11.0, 10.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.73828125, -2.658355712890625, -2.57843017578125, -2.498504638671875, -2.4185791015625, -2.338653564453125, -2.25872802734375, -2.178802490234375, -2.098876953125, -2.018951416015625, -1.93902587890625, -1.859100341796875, -1.7791748046875, -1.699249267578125, -1.61932373046875, -1.539398193359375, -1.45947265625, -1.379547119140625, -1.29962158203125, -1.219696044921875, -1.1397705078125, -1.059844970703125, -0.97991943359375, -0.899993896484375, -0.820068359375, -0.740142822265625, -0.66021728515625, -0.580291748046875, -0.5003662109375, -0.420440673828125, -0.34051513671875, -0.260589599609375, -0.1806640625, -0.100738525390625, -0.02081298828125, 0.059112548828125, 0.1390380859375, 0.218963623046875, 0.29888916015625, 0.378814697265625, 0.458740234375, 0.538665771484375, 0.61859130859375, 0.698516845703125, 0.7784423828125, 0.858367919921875, 0.93829345703125, 1.018218994140625, 1.09814453125, 1.178070068359375, 1.25799560546875, 1.337921142578125, 1.4178466796875, 1.497772216796875, 1.57769775390625, 1.657623291015625, 1.737548828125, 1.817474365234375, 1.89739990234375, 1.977325439453125, 2.0572509765625, 2.137176513671875, 2.21710205078125, 2.297027587890625, 2.376953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 5.0, 7.0, 15.0, 17.0, 40.0, 102.0, 205.0, 266.0, 180.0, 76.0, 26.0, 17.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-35.24612808227539, -34.39177322387695, -33.53741455078125, -32.68305969238281, -31.828704833984375, -30.974348068237305, -30.119991302490234, -29.265636444091797, -28.411279678344727, -27.556922912597656, -26.70256805419922, -25.84821128845215, -24.99385643005371, -24.13949966430664, -23.285144805908203, -22.430788040161133, -21.576431274414062, -20.722074508666992, -19.867719650268555, -19.013362884521484, -18.159008026123047, -17.304651260375977, -16.450294494628906, -15.595939636230469, -14.741584777832031, -13.887228965759277, -13.032873153686523, -12.178516387939453, -11.3241605758667, -10.469804763793945, -9.615448951721191, -8.761093139648438, -7.906736373901367, -7.052380561828613, -6.198024272918701, -5.343668460845947, -4.489312171936035, -3.6349563598632812, -2.7806005477905273, -1.9262442588806152, -1.0718884468078613, -0.2175324559211731, 0.6368235349655151, 1.4911794662475586, 2.3455355167388916, 3.1998915672302246, 4.0542473793029785, 4.908603668212891, 5.7629594802856445, 6.617315292358398, 7.4716715812683105, 8.326026916503906, 9.180383682250977, 10.03473949432373, 10.889095306396484, 11.743452072143555, 12.597806930541992, 13.452162742614746, 14.3065185546875, 15.16087532043457, 16.015230178833008, 16.869586944580078, 17.723941802978516, 18.578298568725586, 19.432655334472656]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 9.0, 10.0, 7.0, 10.0, 33.0, 53.0, 85.0, 146.0, 204.0, 167.0, 101.0, 47.0, 28.0, 15.0, 13.0, 12.0, 8.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.9422607421875, -47.48849105834961, -46.034725189208984, -44.580955505371094, -43.12718963623047, -41.67341995239258, -40.21965026855469, -38.76588439941406, -37.31211471557617, -35.85834503173828, -34.404579162597656, -32.950809478759766, -31.497041702270508, -30.04327392578125, -28.589506149291992, -27.135738372802734, -25.681970596313477, -24.22820281982422, -22.77443504333496, -21.320667266845703, -19.866897583007812, -18.413129806518555, -16.959362030029297, -15.505593299865723, -14.051825523376465, -12.598057746887207, -11.144289016723633, -9.690521240234375, -8.236753463745117, -6.782984733581543, -5.329216957092285, -3.875448226928711, -2.421680450439453, -0.9679123163223267, 0.4858558177947998, 1.9396238327026367, 3.3933920860290527, 4.847160339355469, 6.300928115844727, 7.754696846008301, 9.208464622497559, 10.662232398986816, 12.11600112915039, 13.569768905639648, 15.023536682128906, 16.477306365966797, 17.931072235107422, 19.384841918945312, 20.83860969543457, 22.292377471923828, 23.746145248413086, 25.199913024902344, 26.653682708740234, 28.107450485229492, 29.56121826171875, 31.01498794555664, 32.468753814697266, 33.922523498535156, 35.37628936767578, 36.83005905151367, 38.2838249206543, 39.73759460449219, 41.19136047363281, 42.6451301574707, 44.098899841308594]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 7.0, 8.0, 19.0, 19.0, 22.0, 32.0, 44.0, 79.0, 101.0, 147.0, 221.0, 354.0, 661.0, 1170.0, 2628.0, 6315.0, 23525.0, 462209.0, 3645925.0, 33938.0, 8913.0, 3466.0, 1756.0, 1008.0, 567.0, 345.0, 224.0, 147.0, 109.0, 76.0, 68.0, 46.0, 25.0, 19.0, 25.0, 17.0, 11.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.69921875, -5.51593017578125, -5.3326416015625, -5.14935302734375, -4.966064453125, -4.78277587890625, -4.5994873046875, -4.41619873046875, -4.23291015625, -4.04962158203125, -3.8663330078125, -3.68304443359375, -3.499755859375, -3.31646728515625, -3.1331787109375, -2.94989013671875, -2.7666015625, -2.58331298828125, -2.4000244140625, -2.21673583984375, -2.033447265625, -1.85015869140625, -1.6668701171875, -1.48358154296875, -1.30029296875, -1.11700439453125, -0.9337158203125, -0.75042724609375, -0.567138671875, -0.38385009765625, -0.2005615234375, -0.01727294921875, 0.166015625, 0.34930419921875, 0.5325927734375, 0.71588134765625, 0.899169921875, 1.08245849609375, 1.2657470703125, 1.44903564453125, 1.63232421875, 1.81561279296875, 1.9989013671875, 2.18218994140625, 2.365478515625, 2.54876708984375, 2.7320556640625, 2.91534423828125, 3.0986328125, 3.28192138671875, 3.4652099609375, 3.64849853515625, 3.831787109375, 4.01507568359375, 4.1983642578125, 4.38165283203125, 4.56494140625, 4.74822998046875, 4.9315185546875, 5.11480712890625, 5.298095703125, 5.48138427734375, 5.6646728515625, 5.84796142578125, 6.03125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 5.0, 15.0, 15.0, 13.0, 22.0, 24.0, 42.0, 234.0, 368.0, 120.0, 27.0, 19.0, 15.0, 3.0, 9.0, 10.0, 7.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6072845458984375, -0.589080810546875, -0.5708770751953125, -0.55267333984375, -0.5344696044921875, -0.516265869140625, -0.4980621337890625, -0.4798583984375, -0.4616546630859375, -0.443450927734375, -0.4252471923828125, -0.40704345703125, -0.3888397216796875, -0.370635986328125, -0.3524322509765625, -0.334228515625, -0.3160247802734375, -0.297821044921875, -0.2796173095703125, -0.26141357421875, -0.2432098388671875, -0.225006103515625, -0.2068023681640625, -0.1885986328125, -0.1703948974609375, -0.152191162109375, -0.1339874267578125, -0.11578369140625, -0.0975799560546875, -0.079376220703125, -0.0611724853515625, -0.04296875, -0.0247650146484375, -0.006561279296875, 0.0116424560546875, 0.02984619140625, 0.0480499267578125, 0.066253662109375, 0.0844573974609375, 0.1026611328125, 0.1208648681640625, 0.139068603515625, 0.1572723388671875, 0.17547607421875, 0.1936798095703125, 0.211883544921875, 0.2300872802734375, 0.248291015625, 0.2664947509765625, 0.284698486328125, 0.3029022216796875, 0.32110595703125, 0.3393096923828125, 0.357513427734375, 0.3757171630859375, 0.3939208984375, 0.4121246337890625, 0.430328369140625, 0.4485321044921875, 0.46673583984375, 0.4849395751953125, 0.503143310546875, 0.5213470458984375, 0.53955078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 8.0, 10.0, 9.0, 18.0, 12.0, 30.0, 22.0, 40.0, 71.0, 89.0, 150.0, 214.0, 362.0, 614.0, 1199.0, 2323.0, 4866.0, 13228.0, 47362.0, 445253.0, 3497569.0, 139010.0, 26078.0, 8597.0, 3408.0, 1600.0, 833.0, 473.0, 270.0, 166.0, 128.0, 71.0, 44.0, 41.0, 25.0, 23.0, 22.0, 9.0, 6.0, 5.0, 4.0, 0.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.2618408203125, -2.181884765625, -2.1019287109375, -2.02197265625, -1.9420166015625, -1.862060546875, -1.7821044921875, -1.7021484375, -1.6221923828125, -1.542236328125, -1.4622802734375, -1.38232421875, -1.3023681640625, -1.222412109375, -1.1424560546875, -1.0625, -0.9825439453125, -0.902587890625, -0.8226318359375, -0.74267578125, -0.6627197265625, -0.582763671875, -0.5028076171875, -0.4228515625, -0.3428955078125, -0.262939453125, -0.1829833984375, -0.10302734375, -0.0230712890625, 0.056884765625, 0.1368408203125, 0.216796875, 0.2967529296875, 0.376708984375, 0.4566650390625, 0.53662109375, 0.6165771484375, 0.696533203125, 0.7764892578125, 0.8564453125, 0.9364013671875, 1.016357421875, 1.0963134765625, 1.17626953125, 1.2562255859375, 1.336181640625, 1.4161376953125, 1.49609375, 1.5760498046875, 1.656005859375, 1.7359619140625, 1.81591796875, 1.8958740234375, 1.975830078125, 2.0557861328125, 2.1357421875, 2.2156982421875, 2.295654296875, 2.3756103515625, 2.45556640625, 2.5355224609375, 2.615478515625, 2.6954345703125, 2.775390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 12.0, 13.0, 13.0, 12.0, 23.0, 47.0, 96.0, 222.0, 597.0, 1955.0, 602.0, 201.0, 97.0, 63.0, 25.0, 24.0, 14.0, 15.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76171875, -0.73828125, -0.71484375, -0.69140625, -0.66796875, -0.64453125, -0.62109375, -0.59765625, -0.57421875, -0.55078125, -0.52734375, -0.50390625, -0.48046875, -0.45703125, -0.43359375, -0.41015625, -0.38671875, -0.36328125, -0.33984375, -0.31640625, -0.29296875, -0.26953125, -0.24609375, -0.22265625, -0.19921875, -0.17578125, -0.15234375, -0.12890625, -0.10546875, -0.08203125, -0.05859375, -0.03515625, -0.01171875, 0.01171875, 0.03515625, 0.05859375, 0.08203125, 0.10546875, 0.12890625, 0.15234375, 0.17578125, 0.19921875, 0.22265625, 0.24609375, 0.26953125, 0.29296875, 0.31640625, 0.33984375, 0.36328125, 0.38671875, 0.41015625, 0.43359375, 0.45703125, 0.48046875, 0.50390625, 0.52734375, 0.55078125, 0.57421875, 0.59765625, 0.62109375, 0.64453125, 0.66796875, 0.69140625, 0.71484375, 0.73828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 8.0, 13.0, 35.0, 174.0, 518.0, 204.0, 31.0, 13.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.266407012939453, -11.038909912109375, -10.811412811279297, -10.583915710449219, -10.35641860961914, -10.128921508789062, -9.901424407958984, -9.67392635345459, -9.446429252624512, -9.218932151794434, -8.991435050964355, -8.763937950134277, -8.5364408493042, -8.308942794799805, -8.081445693969727, -7.853949069976807, -7.6264519691467285, -7.39895486831665, -7.171457767486572, -6.943960189819336, -6.716463088989258, -6.48896598815918, -6.261468887329102, -6.033971786499023, -5.806474685668945, -5.578977584838867, -5.351480484008789, -5.123983383178711, -4.896485805511475, -4.6689887046813965, -4.441491603851318, -4.21399450302124, -3.986496925354004, -3.758999824523926, -3.5315024852752686, -3.3040053844451904, -3.076508045196533, -2.849010944366455, -2.621513843536377, -2.394016742706299, -2.1665194034576416, -1.939022183418274, -1.7115249633789062, -1.4840278625488281, -1.2565306425094604, -1.0290334224700928, -0.8015363216400146, -0.574039101600647, -0.3465418815612793, -0.11904469132423401, 0.10845249891281128, 0.3359496593475342, 0.5634468793869019, 0.7909440994262695, 1.0184412002563477, 1.2459384202957153, 1.473435640335083, 1.7009328603744507, 1.9284300804138184, 2.1559271812438965, 2.3834242820739746, 2.610921621322632, 2.83841872215271, 3.065916061401367, 3.2934131622314453]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 4.0, 5.0, 10.0, 13.0, 27.0, 35.0, 42.0, 41.0, 84.0, 98.0, 107.0, 108.0, 113.0, 77.0, 64.0, 44.0, 35.0, 26.0, 17.0, 11.0, 5.0, 3.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.386098861694336, -3.2672908306121826, -3.1484830379486084, -3.029675006866455, -2.9108669757843018, -2.7920589447021484, -2.673251152038574, -2.554443120956421, -2.4356350898742676, -2.3168270587921143, -2.19801926612854, -2.0792112350463867, -1.9604032039642334, -1.8415952920913696, -1.7227873802185059, -1.6039793491363525, -1.4851715564727783, -1.3663636445999146, -1.2475556135177612, -1.1287477016448975, -1.0099396705627441, -0.8911317586898804, -0.7723238468170166, -0.6535158753395081, -0.5347079038619995, -0.41589993238449097, -0.2970919907093048, -0.17828404903411865, -0.05947607755661011, 0.05933189392089844, 0.1781398057937622, 0.29694777727127075, 0.4157557487487793, 0.5345637202262878, 0.6533716917037964, 0.7721796035766602, 0.8909875750541687, 1.0097955465316772, 1.128603458404541, 1.2474114894866943, 1.366219401359558, 1.4850273132324219, 1.6038353443145752, 1.722643256187439, 1.8414511680603027, 1.960259199142456, 2.0790672302246094, 2.1978750228881836, 2.316683053970337, 2.4354910850524902, 2.5542988777160645, 2.6731069087982178, 2.791914939880371, 2.9107227325439453, 3.0295307636260986, 3.148338794708252, 3.267146587371826, 3.3859546184539795, 3.5047624111175537, 3.623570442199707, 3.7423784732818604, 3.8611865043640137, 3.979994297027588, 4.098802089691162, 4.2176103591918945]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 10.0, 11.0, 19.0, 18.0, 28.0, 62.0, 96.0, 156.0, 251.0, 473.0, 950.0, 2023.0, 5448.0, 17809.0, 97815.0, 860427.0, 44791.0, 11226.0, 3728.0, 1532.0, 738.0, 355.0, 210.0, 132.0, 71.0, 58.0, 29.0, 26.0, 13.0, 22.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94921875, -5.77587890625, -5.6025390625, -5.42919921875, -5.255859375, -5.08251953125, -4.9091796875, -4.73583984375, -4.5625, -4.38916015625, -4.2158203125, -4.04248046875, -3.869140625, -3.69580078125, -3.5224609375, -3.34912109375, -3.17578125, -3.00244140625, -2.8291015625, -2.65576171875, -2.482421875, -2.30908203125, -2.1357421875, -1.96240234375, -1.7890625, -1.61572265625, -1.4423828125, -1.26904296875, -1.095703125, -0.92236328125, -0.7490234375, -0.57568359375, -0.40234375, -0.22900390625, -0.0556640625, 0.11767578125, 0.291015625, 0.46435546875, 0.6376953125, 0.81103515625, 0.984375, 1.15771484375, 1.3310546875, 1.50439453125, 1.677734375, 1.85107421875, 2.0244140625, 2.19775390625, 2.37109375, 2.54443359375, 2.7177734375, 2.89111328125, 3.064453125, 3.23779296875, 3.4111328125, 3.58447265625, 3.7578125, 3.93115234375, 4.1044921875, 4.27783203125, 4.451171875, 4.62451171875, 4.7978515625, 4.97119140625, 5.14453125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 0.0, 3.0, 8.0, 7.0, 6.0, 18.0, 9.0, 15.0, 27.0, 57.0, 171.0, 325.0, 201.0, 59.0, 19.0, 9.0, 12.0, 11.0, 13.0, 3.0, 10.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.513671875, -0.4951019287109375, -0.476531982421875, -0.4579620361328125, -0.43939208984375, -0.4208221435546875, -0.402252197265625, -0.3836822509765625, -0.3651123046875, -0.3465423583984375, -0.327972412109375, -0.3094024658203125, -0.29083251953125, -0.2722625732421875, -0.253692626953125, -0.2351226806640625, -0.216552734375, -0.1979827880859375, -0.179412841796875, -0.1608428955078125, -0.14227294921875, -0.1237030029296875, -0.105133056640625, -0.0865631103515625, -0.0679931640625, -0.0494232177734375, -0.030853271484375, -0.0122833251953125, 0.00628662109375, 0.0248565673828125, 0.043426513671875, 0.0619964599609375, 0.08056640625, 0.0991363525390625, 0.117706298828125, 0.1362762451171875, 0.15484619140625, 0.1734161376953125, 0.191986083984375, 0.2105560302734375, 0.2291259765625, 0.2476959228515625, 0.266265869140625, 0.2848358154296875, 0.30340576171875, 0.3219757080078125, 0.340545654296875, 0.3591156005859375, 0.377685546875, 0.3962554931640625, 0.414825439453125, 0.4333953857421875, 0.45196533203125, 0.4705352783203125, 0.489105224609375, 0.5076751708984375, 0.5262451171875, 0.5448150634765625, 0.563385009765625, 0.5819549560546875, 0.60052490234375, 0.6190948486328125, 0.637664794921875, 0.6562347412109375, 0.6748046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 5.0, 6.0, 14.0, 16.0, 35.0, 47.0, 78.0, 141.0, 236.0, 463.0, 851.0, 2123.0, 6628.0, 27681.0, 165447.0, 582026.0, 214861.0, 35289.0, 7897.0, 2504.0, 1001.0, 529.0, 293.0, 143.0, 81.0, 40.0, 29.0, 27.0, 17.0, 13.0, 8.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.27203369140625, -2.2022705078125, -2.13250732421875, -2.062744140625, -1.99298095703125, -1.9232177734375, -1.85345458984375, -1.78369140625, -1.71392822265625, -1.6441650390625, -1.57440185546875, -1.504638671875, -1.43487548828125, -1.3651123046875, -1.29534912109375, -1.2255859375, -1.15582275390625, -1.0860595703125, -1.01629638671875, -0.946533203125, -0.87677001953125, -0.8070068359375, -0.73724365234375, -0.66748046875, -0.59771728515625, -0.5279541015625, -0.45819091796875, -0.388427734375, -0.31866455078125, -0.2489013671875, -0.17913818359375, -0.109375, -0.03961181640625, 0.0301513671875, 0.09991455078125, 0.169677734375, 0.23944091796875, 0.3092041015625, 0.37896728515625, 0.44873046875, 0.51849365234375, 0.5882568359375, 0.65802001953125, 0.727783203125, 0.79754638671875, 0.8673095703125, 0.93707275390625, 1.0068359375, 1.07659912109375, 1.1463623046875, 1.21612548828125, 1.285888671875, 1.35565185546875, 1.4254150390625, 1.49517822265625, 1.56494140625, 1.63470458984375, 1.7044677734375, 1.77423095703125, 1.843994140625, 1.91375732421875, 1.9835205078125, 2.05328369140625, 2.123046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 4.0, 9.0, 8.0, 10.0, 11.0, 11.0, 9.0, 21.0, 20.0, 22.0, 29.0, 24.0, 31.0, 37.0, 30.0, 34.0, 34.0, 29.0, 44.0, 40.0, 35.0, 40.0, 31.0, 44.0, 34.0, 37.0, 27.0, 22.0, 31.0, 32.0, 24.0, 28.0, 16.0, 21.0, 16.0, 21.0, 20.0, 16.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.1585235595703125, -1.119781494140625, -1.0810394287109375, -1.04229736328125, -1.0035552978515625, -0.964813232421875, -0.9260711669921875, -0.8873291015625, -0.8485870361328125, -0.809844970703125, -0.7711029052734375, -0.73236083984375, -0.6936187744140625, -0.654876708984375, -0.6161346435546875, -0.577392578125, -0.5386505126953125, -0.499908447265625, -0.4611663818359375, -0.42242431640625, -0.3836822509765625, -0.344940185546875, -0.3061981201171875, -0.2674560546875, -0.2287139892578125, -0.189971923828125, -0.1512298583984375, -0.11248779296875, -0.0737457275390625, -0.035003662109375, 0.0037384033203125, 0.04248046875, 0.0812225341796875, 0.119964599609375, 0.1587066650390625, 0.19744873046875, 0.2361907958984375, 0.274932861328125, 0.3136749267578125, 0.3524169921875, 0.3911590576171875, 0.429901123046875, 0.4686431884765625, 0.50738525390625, 0.5461273193359375, 0.584869384765625, 0.6236114501953125, 0.662353515625, 0.7010955810546875, 0.739837646484375, 0.7785797119140625, 0.81732177734375, 0.8560638427734375, 0.894805908203125, 0.9335479736328125, 0.9722900390625, 1.0110321044921875, 1.049774169921875, 1.0885162353515625, 1.12725830078125, 1.1660003662109375, 1.204742431640625, 1.2434844970703125, 1.2822265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 10.0, 9.0, 11.0, 26.0, 38.0, 57.0, 115.0, 197.0, 547.0, 3042.0, 684673.0, 356064.0, 2689.0, 584.0, 206.0, 116.0, 53.0, 34.0, 13.0, 20.0, 12.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.921875, -19.4107666015625, -18.899658203125, -18.3885498046875, -17.87744140625, -17.3663330078125, -16.855224609375, -16.3441162109375, -15.8330078125, -15.3218994140625, -14.810791015625, -14.2996826171875, -13.78857421875, -13.2774658203125, -12.766357421875, -12.2552490234375, -11.744140625, -11.2330322265625, -10.721923828125, -10.2108154296875, -9.69970703125, -9.1885986328125, -8.677490234375, -8.1663818359375, -7.6552734375, -7.1441650390625, -6.633056640625, -6.1219482421875, -5.61083984375, -5.0997314453125, -4.588623046875, -4.0775146484375, -3.56640625, -3.0552978515625, -2.544189453125, -2.0330810546875, -1.52197265625, -1.0108642578125, -0.499755859375, 0.0113525390625, 0.5224609375, 1.0335693359375, 1.544677734375, 2.0557861328125, 2.56689453125, 3.0780029296875, 3.589111328125, 4.1002197265625, 4.611328125, 5.1224365234375, 5.633544921875, 6.1446533203125, 6.65576171875, 7.1668701171875, 7.677978515625, 8.1890869140625, 8.7001953125, 9.2113037109375, 9.722412109375, 10.2335205078125, 10.74462890625, 11.2557373046875, 11.766845703125, 12.2779541015625, 12.7890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 11.0, 7.0, 11.0, 13.0, 35.0, 70.0, 196.0, 348.0, 184.0, 67.0, 22.0, 15.0, 12.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031828880310058594, -0.00030576810240745544, -0.00029324740171432495, -0.00028072670102119446, -0.00026820600032806396, -0.00025568529963493347, -0.00024316459894180298, -0.00023064389824867249, -0.000218123197555542, -0.0002056024968624115, -0.000193081796169281, -0.0001805610954761505, -0.00016804039478302002, -0.00015551969408988953, -0.00014299899339675903, -0.00013047829270362854, -0.00011795759201049805, -0.00010543689131736755, -9.291619062423706e-05, -8.039548993110657e-05, -6.787478923797607e-05, -5.535408854484558e-05, -4.283338785171509e-05, -3.0312687158584595e-05, -1.77919864654541e-05, -5.271285772323608e-06, 7.249414920806885e-06, 1.9770115613937378e-05, 3.229081630706787e-05, 4.4811517000198364e-05, 5.733221769332886e-05, 6.985291838645935e-05, 8.237361907958984e-05, 9.489431977272034e-05, 0.00010741502046585083, 0.00011993572115898132, 0.00013245642185211182, 0.0001449771225452423, 0.0001574978232383728, 0.0001700185239315033, 0.0001825392246246338, 0.00019505992531776428, 0.00020758062601089478, 0.00022010132670402527, 0.00023262202739715576, 0.00024514272809028625, 0.00025766342878341675, 0.00027018412947654724, 0.00028270483016967773, 0.00029522553086280823, 0.0003077462315559387, 0.0003202669322490692, 0.0003327876329421997, 0.0003453083336353302, 0.0003578290343284607, 0.0003703497350215912, 0.0003828704357147217, 0.00039539113640785217, 0.00040791183710098267, 0.00042043253779411316, 0.00043295323848724365, 0.00044547393918037415, 0.00045799463987350464, 0.00047051534056663513, 0.0004830360412597656]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 7.0, 16.0, 21.0, 48.0, 93.0, 207.0, 375.0, 1183.0, 5021.0, 66180.0, 943635.0, 27304.0, 3095.0, 772.0, 296.0, 138.0, 66.0, 34.0, 27.0, 16.0, 12.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1015625, -5.878662109375, -5.65576171875, -5.432861328125, -5.2099609375, -4.987060546875, -4.76416015625, -4.541259765625, -4.318359375, -4.095458984375, -3.87255859375, -3.649658203125, -3.4267578125, -3.203857421875, -2.98095703125, -2.758056640625, -2.53515625, -2.312255859375, -2.08935546875, -1.866455078125, -1.6435546875, -1.420654296875, -1.19775390625, -0.974853515625, -0.751953125, -0.529052734375, -0.30615234375, -0.083251953125, 0.1396484375, 0.362548828125, 0.58544921875, 0.808349609375, 1.03125, 1.254150390625, 1.47705078125, 1.699951171875, 1.9228515625, 2.145751953125, 2.36865234375, 2.591552734375, 2.814453125, 3.037353515625, 3.26025390625, 3.483154296875, 3.7060546875, 3.928955078125, 4.15185546875, 4.374755859375, 4.59765625, 4.820556640625, 5.04345703125, 5.266357421875, 5.4892578125, 5.712158203125, 5.93505859375, 6.157958984375, 6.380859375, 6.603759765625, 6.82666015625, 7.049560546875, 7.2724609375, 7.495361328125, 7.71826171875, 7.941162109375, 8.1640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 7.0, 9.0, 10.0, 24.0, 34.0, 55.0, 140.0, 330.0, 212.0, 78.0, 38.0, 18.0, 16.0, 8.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2265625, -6.0361328125, -5.845703125, -5.6552734375, -5.46484375, -5.2744140625, -5.083984375, -4.8935546875, -4.703125, -4.5126953125, -4.322265625, -4.1318359375, -3.94140625, -3.7509765625, -3.560546875, -3.3701171875, -3.1796875, -2.9892578125, -2.798828125, -2.6083984375, -2.41796875, -2.2275390625, -2.037109375, -1.8466796875, -1.65625, -1.4658203125, -1.275390625, -1.0849609375, -0.89453125, -0.7041015625, -0.513671875, -0.3232421875, -0.1328125, 0.0576171875, 0.248046875, 0.4384765625, 0.62890625, 0.8193359375, 1.009765625, 1.2001953125, 1.390625, 1.5810546875, 1.771484375, 1.9619140625, 2.15234375, 2.3427734375, 2.533203125, 2.7236328125, 2.9140625, 3.1044921875, 3.294921875, 3.4853515625, 3.67578125, 3.8662109375, 4.056640625, 4.2470703125, 4.4375, 4.6279296875, 4.818359375, 5.0087890625, 5.19921875, 5.3896484375, 5.580078125, 5.7705078125, 5.9609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 9.0, 49.0, 280.0, 493.0, 129.0, 22.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.675430297851562, -30.18354606628418, -28.691661834716797, -27.199777603149414, -25.70789337158203, -24.21600914001465, -22.724124908447266, -21.23223876953125, -19.7403564453125, -18.248472213745117, -16.756587982177734, -15.264703750610352, -13.772819519042969, -12.280935287475586, -10.789050102233887, -9.297165870666504, -7.805280685424805, -6.313396453857422, -4.821512222290039, -3.329627513885498, -1.8377432823181152, -0.3458590507507324, 1.1460256576538086, 2.6379098892211914, 4.129794120788574, 5.621678352355957, 7.11356258392334, 8.605447769165039, 10.097332000732422, 11.589216232299805, 13.081100463867188, 14.57298469543457, 16.064868927001953, 17.556753158569336, 19.04863739013672, 20.5405216217041, 22.032405853271484, 23.524290084838867, 25.01617431640625, 26.508060455322266, 27.999942779541016, 29.4918270111084, 30.98371124267578, 32.4755973815918, 33.96747970581055, 35.45936584472656, 36.95124816894531, 38.44313430786133, 39.935020446777344, 41.42690658569336, 42.91878890991211, 44.410675048828125, 45.902557373046875, 47.39444351196289, 48.88632583618164, 50.378211975097656, 51.870094299316406, 53.36198043823242, 54.85386276245117, 56.34574890136719, 57.83763122558594, 59.32951736450195, 60.8213996887207, 62.31328582763672, 63.80516815185547]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 2.0, 6.0, 5.0, 11.0, 14.0, 28.0, 32.0, 35.0, 68.0, 91.0, 110.0, 124.0, 118.0, 118.0, 85.0, 45.0, 36.0, 19.0, 10.0, 10.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.536174774169922, -30.676769256591797, -29.817365646362305, -28.95796012878418, -28.098556518554688, -27.239151000976562, -26.379745483398438, -25.520339965820312, -24.66093635559082, -23.801530838012695, -22.942127227783203, -22.082721710205078, -21.223316192626953, -20.36391258239746, -19.504507064819336, -18.645103454589844, -17.78569793701172, -16.926292419433594, -16.0668888092041, -15.207483291625977, -14.348078727722168, -13.48867416381836, -12.629268646240234, -11.769864082336426, -10.910459518432617, -10.051054954528809, -9.191650390625, -8.332244873046875, -7.472840309143066, -6.613435745239258, -5.754030704498291, -4.894625663757324, -4.035221099853516, -3.175816297531128, -2.3164114952087402, -1.4570066928863525, -0.5976018905639648, 0.26180267333984375, 1.1212077140808105, 1.9806127548217773, 2.840017318725586, 3.6994221210479736, 4.558826923370361, 5.418231964111328, 6.277636528015137, 7.137041091918945, 7.996446132659912, 8.855851173400879, 9.715255737304688, 10.574660301208496, 11.434064865112305, 12.29347038269043, 13.152874946594238, 14.012279510498047, 14.871685028076172, 15.73108959197998, 16.59049415588379, 17.449899673461914, 18.309303283691406, 19.16870880126953, 20.028114318847656, 20.88751792907715, 21.746923446655273, 22.606327056884766, 23.46573257446289]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 5.0, 16.0, 25.0, 35.0, 47.0, 57.0, 91.0, 109.0, 164.0, 269.0, 471.0, 845.0, 1465.0, 3328.0, 11649.0, 184617.0, 3955035.0, 25713.0, 5300.0, 1956.0, 1052.0, 614.0, 403.0, 270.0, 187.0, 125.0, 97.0, 64.0, 66.0, 42.0, 24.0, 21.0, 21.0, 19.0, 16.0, 11.0, 7.0, 15.0, 7.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.19921875, -6.93463134765625, -6.6700439453125, -6.40545654296875, -6.140869140625, -5.87628173828125, -5.6116943359375, -5.34710693359375, -5.08251953125, -4.81793212890625, -4.5533447265625, -4.28875732421875, -4.024169921875, -3.75958251953125, -3.4949951171875, -3.23040771484375, -2.9658203125, -2.70123291015625, -2.4366455078125, -2.17205810546875, -1.907470703125, -1.64288330078125, -1.3782958984375, -1.11370849609375, -0.84912109375, -0.58453369140625, -0.3199462890625, -0.05535888671875, 0.209228515625, 0.47381591796875, 0.7384033203125, 1.00299072265625, 1.267578125, 1.53216552734375, 1.7967529296875, 2.06134033203125, 2.325927734375, 2.59051513671875, 2.8551025390625, 3.11968994140625, 3.38427734375, 3.64886474609375, 3.9134521484375, 4.17803955078125, 4.442626953125, 4.70721435546875, 4.9718017578125, 5.23638916015625, 5.5009765625, 5.76556396484375, 6.0301513671875, 6.29473876953125, 6.559326171875, 6.82391357421875, 7.0885009765625, 7.35308837890625, 7.61767578125, 7.88226318359375, 8.1468505859375, 8.41143798828125, 8.676025390625, 8.94061279296875, 9.2052001953125, 9.46978759765625, 9.734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 5.0, 9.0, 11.0, 15.0, 21.0, 35.0, 66.0, 140.0, 189.0, 199.0, 130.0, 54.0, 38.0, 19.0, 14.0, 11.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3662109375, -0.35034942626953125, -0.3344879150390625, -0.31862640380859375, -0.302764892578125, -0.28690338134765625, -0.2710418701171875, -0.25518035888671875, -0.23931884765625, -0.22345733642578125, -0.2075958251953125, -0.19173431396484375, -0.175872802734375, -0.16001129150390625, -0.1441497802734375, -0.12828826904296875, -0.1124267578125, -0.09656524658203125, -0.0807037353515625, -0.06484222412109375, -0.048980712890625, -0.03311920166015625, -0.0172576904296875, -0.00139617919921875, 0.01446533203125, 0.03032684326171875, 0.0461883544921875, 0.06204986572265625, 0.077911376953125, 0.09377288818359375, 0.1096343994140625, 0.12549591064453125, 0.141357421875, 0.15721893310546875, 0.1730804443359375, 0.18894195556640625, 0.204803466796875, 0.22066497802734375, 0.2365264892578125, 0.25238800048828125, 0.26824951171875, 0.28411102294921875, 0.2999725341796875, 0.31583404541015625, 0.331695556640625, 0.34755706787109375, 0.3634185791015625, 0.37928009033203125, 0.3951416015625, 0.41100311279296875, 0.4268646240234375, 0.44272613525390625, 0.458587646484375, 0.47444915771484375, 0.4903106689453125, 0.5061721801757812, 0.52203369140625, 0.5378952026367188, 0.5537567138671875, 0.5696182250976562, 0.585479736328125, 0.6013412475585938, 0.6172027587890625, 0.6330642700195312, 0.64892578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 13.0, 11.0, 17.0, 27.0, 42.0, 100.0, 264.0, 1388.0, 17252.0, 4117145.0, 54827.0, 2467.0, 434.0, 133.0, 57.0, 27.0, 19.0, 15.0, 14.0, 7.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.2718505859375, -10.926513671875, -10.5811767578125, -10.23583984375, -9.8905029296875, -9.545166015625, -9.1998291015625, -8.8544921875, -8.5091552734375, -8.163818359375, -7.8184814453125, -7.47314453125, -7.1278076171875, -6.782470703125, -6.4371337890625, -6.091796875, -5.7464599609375, -5.401123046875, -5.0557861328125, -4.71044921875, -4.3651123046875, -4.019775390625, -3.6744384765625, -3.3291015625, -2.9837646484375, -2.638427734375, -2.2930908203125, -1.94775390625, -1.6024169921875, -1.257080078125, -0.9117431640625, -0.56640625, -0.2210693359375, 0.124267578125, 0.4696044921875, 0.81494140625, 1.1602783203125, 1.505615234375, 1.8509521484375, 2.1962890625, 2.5416259765625, 2.886962890625, 3.2322998046875, 3.57763671875, 3.9229736328125, 4.268310546875, 4.6136474609375, 4.958984375, 5.3043212890625, 5.649658203125, 5.9949951171875, 6.34033203125, 6.6856689453125, 7.031005859375, 7.3763427734375, 7.7216796875, 8.0670166015625, 8.412353515625, 8.7576904296875, 9.10302734375, 9.4483642578125, 9.793701171875, 10.1390380859375, 10.484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 3.0, 9.0, 15.0, 12.0, 32.0, 39.0, 57.0, 132.0, 312.0, 923.0, 1721.0, 433.0, 175.0, 73.0, 31.0, 24.0, 19.0, 15.0, 12.0, 5.0, 4.0, 2.0, 5.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77734375, -0.7532119750976562, -0.7290802001953125, -0.7049484252929688, -0.680816650390625, -0.6566848754882812, -0.6325531005859375, -0.6084213256835938, -0.58428955078125, -0.5601577758789062, -0.5360260009765625, -0.5118942260742188, -0.487762451171875, -0.46363067626953125, -0.4394989013671875, -0.41536712646484375, -0.3912353515625, -0.36710357666015625, -0.3429718017578125, -0.31884002685546875, -0.294708251953125, -0.27057647705078125, -0.2464447021484375, -0.22231292724609375, -0.19818115234375, -0.17404937744140625, -0.1499176025390625, -0.12578582763671875, -0.101654052734375, -0.07752227783203125, -0.0533905029296875, -0.02925872802734375, -0.005126953125, 0.01900482177734375, 0.0431365966796875, 0.06726837158203125, 0.091400146484375, 0.11553192138671875, 0.1396636962890625, 0.16379547119140625, 0.18792724609375, 0.21205902099609375, 0.2361907958984375, 0.26032257080078125, 0.284454345703125, 0.30858612060546875, 0.3327178955078125, 0.35684967041015625, 0.3809814453125, 0.40511322021484375, 0.4292449951171875, 0.45337677001953125, 0.477508544921875, 0.5016403198242188, 0.5257720947265625, 0.5499038696289062, 0.57403564453125, 0.5981674194335938, 0.6222991943359375, 0.6464309692382812, 0.670562744140625, 0.6946945190429688, 0.7188262939453125, 0.7429580688476562, 0.76708984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 15.0, 33.0, 310.0, 523.0, 101.0, 17.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.32281494140625, -12.009095191955566, -11.695374488830566, -11.381654739379883, -11.067934036254883, -10.7542142868042, -10.4404935836792, -10.126773834228516, -9.813053131103516, -9.499333381652832, -9.185612678527832, -8.871892929077148, -8.558172225952148, -8.244452476501465, -7.930731773376465, -7.617012023925781, -7.3032917976379395, -6.989571571350098, -6.675851345062256, -6.362131118774414, -6.048410892486572, -5.7346906661987305, -5.420970916748047, -5.107250213623047, -4.793530464172363, -4.4798102378845215, -4.16609001159668, -3.852369785308838, -3.538649559020996, -3.2249293327331543, -2.9112093448638916, -2.59748911857605, -2.283769130706787, -1.9700489044189453, -1.6563286781311035, -1.3426085710525513, -1.0288883447647095, -0.7151681184768677, -0.40144801139831543, -0.08772778511047363, 0.22599244117736816, 0.53971266746521, 0.853432834148407, 1.167153000831604, 1.4808732271194458, 1.7945934534072876, 2.10831356048584, 2.4220337867736816, 2.7357540130615234, 3.0494742393493652, 3.363194465637207, 3.676914691925049, 3.9906349182128906, 4.304355144500732, 4.618075370788574, 4.931795120239258, 5.245515823364258, 5.5592360496521, 5.872956275939941, 6.186676502227783, 6.500396728515625, 6.814116954803467, 7.127837181091309, 7.441556930541992, 7.755277156829834]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 6.0, 5.0, 7.0, 10.0, 12.0, 19.0, 26.0, 38.0, 37.0, 57.0, 66.0, 91.0, 84.0, 90.0, 70.0, 76.0, 77.0, 44.0, 44.0, 46.0, 32.0, 17.0, 15.0, 13.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0142822265625, -2.9110467433929443, -2.8078110218048096, -2.704575538635254, -2.601339817047119, -2.4981043338775635, -2.394868850708008, -2.291633129119873, -2.1883976459503174, -2.0851621627807617, -1.981926441192627, -1.8786909580230713, -1.775455355644226, -1.6722197532653809, -1.5689841508865356, -1.4657485485076904, -1.3625129461288452, -1.25927734375, -1.1560417413711548, -1.0528061389923096, -0.9495706558227539, -0.8463350534439087, -0.7430994510650635, -0.639863908290863, -0.5366283059120178, -0.433392733335495, -0.33015716075897217, -0.22692155838012695, -0.12368598580360413, -0.0204504132270813, 0.08278518915176392, 0.18602073192596436, 0.28925633430480957, 0.3924919068813324, 0.4957274794578552, 0.5989630818367004, 0.7021986246109009, 0.8054342269897461, 0.9086698293685913, 1.0119054317474365, 1.1151409149169922, 1.2183765172958374, 1.3216121196746826, 1.4248476028442383, 1.5280832052230835, 1.6313188076019287, 1.734554409980774, 1.8377900123596191, 1.9410256147384644, 2.0442612171173096, 2.1474967002868652, 2.250732421875, 2.3539679050445557, 2.4572033882141113, 2.560439109802246, 2.6636745929718018, 2.7669103145599365, 2.870145797729492, 2.973381519317627, 3.0766170024871826, 3.1798527240753174, 3.283088207244873, 3.386323928833008, 3.4895594120025635, 3.592794895172119]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 10.0, 7.0, 14.0, 20.0, 33.0, 41.0, 62.0, 81.0, 181.0, 239.0, 451.0, 938.0, 1929.0, 5117.0, 18909.0, 197293.0, 751639.0, 55747.0, 9909.0, 3046.0, 1301.0, 694.0, 355.0, 215.0, 107.0, 81.0, 34.0, 33.0, 19.0, 13.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.734375, -3.61102294921875, -3.4876708984375, -3.36431884765625, -3.240966796875, -3.11761474609375, -2.9942626953125, -2.87091064453125, -2.74755859375, -2.62420654296875, -2.5008544921875, -2.37750244140625, -2.254150390625, -2.13079833984375, -2.0074462890625, -1.88409423828125, -1.7607421875, -1.63739013671875, -1.5140380859375, -1.39068603515625, -1.267333984375, -1.14398193359375, -1.0206298828125, -0.89727783203125, -0.77392578125, -0.65057373046875, -0.5272216796875, -0.40386962890625, -0.280517578125, -0.15716552734375, -0.0338134765625, 0.08953857421875, 0.212890625, 0.33624267578125, 0.4595947265625, 0.58294677734375, 0.706298828125, 0.82965087890625, 0.9530029296875, 1.07635498046875, 1.19970703125, 1.32305908203125, 1.4464111328125, 1.56976318359375, 1.693115234375, 1.81646728515625, 1.9398193359375, 2.06317138671875, 2.1865234375, 2.30987548828125, 2.4332275390625, 2.55657958984375, 2.679931640625, 2.80328369140625, 2.9266357421875, 3.04998779296875, 3.17333984375, 3.29669189453125, 3.4200439453125, 3.54339599609375, 3.666748046875, 3.79010009765625, 3.9134521484375, 4.03680419921875, 4.16015625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 12.0, 16.0, 21.0, 51.0, 80.0, 132.0, 181.0, 165.0, 135.0, 83.0, 32.0, 21.0, 22.0, 8.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.3116264343261719, -0.29683685302734375, -0.2820472717285156, -0.2672576904296875, -0.2524681091308594, -0.23767852783203125, -0.22288894653320312, -0.208099365234375, -0.19330978393554688, -0.17852020263671875, -0.16373062133789062, -0.1489410400390625, -0.13415145874023438, -0.11936187744140625, -0.10457229614257812, -0.08978271484375, -0.07499313354492188, -0.06020355224609375, -0.045413970947265625, -0.0306243896484375, -0.015834808349609375, -0.00104522705078125, 0.013744354248046875, 0.028533935546875, 0.043323516845703125, 0.05811309814453125, 0.07290267944335938, 0.0876922607421875, 0.10248184204101562, 0.11727142333984375, 0.13206100463867188, 0.1468505859375, 0.16164016723632812, 0.17642974853515625, 0.19121932983398438, 0.2060089111328125, 0.22079849243164062, 0.23558807373046875, 0.2503776550292969, 0.265167236328125, 0.2799568176269531, 0.29474639892578125, 0.3095359802246094, 0.3243255615234375, 0.3391151428222656, 0.35390472412109375, 0.3686943054199219, 0.38348388671875, 0.3982734680175781, 0.41306304931640625, 0.4278526306152344, 0.4426422119140625, 0.4574317932128906, 0.47222137451171875, 0.4870109558105469, 0.501800537109375, 0.5165901184082031, 0.5313796997070312, 0.5461692810058594, 0.5609588623046875, 0.5757484436035156, 0.5905380249023438, 0.6053276062011719, 0.6201171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 0.0, 4.0, 7.0, 7.0, 7.0, 9.0, 18.0, 19.0, 28.0, 38.0, 58.0, 102.0, 160.0, 257.0, 455.0, 833.0, 1970.0, 6246.0, 30321.0, 198763.0, 602223.0, 171036.0, 26585.0, 5670.0, 1781.0, 799.0, 433.0, 236.0, 163.0, 101.0, 60.0, 58.0, 36.0, 21.0, 18.0, 13.0, 2.0, 5.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.394378662109375, -2.31024169921875, -2.226104736328125, -2.1419677734375, -2.057830810546875, -1.97369384765625, -1.889556884765625, -1.805419921875, -1.721282958984375, -1.63714599609375, -1.553009033203125, -1.4688720703125, -1.384735107421875, -1.30059814453125, -1.216461181640625, -1.13232421875, -1.048187255859375, -0.96405029296875, -0.879913330078125, -0.7957763671875, -0.711639404296875, -0.62750244140625, -0.543365478515625, -0.459228515625, -0.375091552734375, -0.29095458984375, -0.206817626953125, -0.1226806640625, -0.038543701171875, 0.04559326171875, 0.129730224609375, 0.2138671875, 0.298004150390625, 0.38214111328125, 0.466278076171875, 0.5504150390625, 0.634552001953125, 0.71868896484375, 0.802825927734375, 0.886962890625, 0.971099853515625, 1.05523681640625, 1.139373779296875, 1.2235107421875, 1.307647705078125, 1.39178466796875, 1.475921630859375, 1.56005859375, 1.644195556640625, 1.72833251953125, 1.812469482421875, 1.8966064453125, 1.980743408203125, 2.06488037109375, 2.149017333984375, 2.233154296875, 2.317291259765625, 2.40142822265625, 2.485565185546875, 2.5697021484375, 2.653839111328125, 2.73797607421875, 2.822113037109375, 2.90625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 5.0, 1.0, 4.0, 8.0, 11.0, 7.0, 11.0, 9.0, 21.0, 20.0, 21.0, 18.0, 19.0, 33.0, 38.0, 39.0, 41.0, 30.0, 58.0, 43.0, 64.0, 37.0, 56.0, 44.0, 32.0, 39.0, 37.0, 41.0, 35.0, 45.0, 21.0, 20.0, 24.0, 15.0, 9.0, 4.0, 13.0, 9.0, 4.0, 2.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.4235382080078125, -1.374420166015625, -1.3253021240234375, -1.27618408203125, -1.2270660400390625, -1.177947998046875, -1.1288299560546875, -1.0797119140625, -1.0305938720703125, -0.981475830078125, -0.9323577880859375, -0.88323974609375, -0.8341217041015625, -0.785003662109375, -0.7358856201171875, -0.686767578125, -0.6376495361328125, -0.588531494140625, -0.5394134521484375, -0.49029541015625, -0.4411773681640625, -0.392059326171875, -0.3429412841796875, -0.2938232421875, -0.2447052001953125, -0.195587158203125, -0.1464691162109375, -0.09735107421875, -0.0482330322265625, 0.000885009765625, 0.0500030517578125, 0.09912109375, 0.1482391357421875, 0.197357177734375, 0.2464752197265625, 0.29559326171875, 0.3447113037109375, 0.393829345703125, 0.4429473876953125, 0.4920654296875, 0.5411834716796875, 0.590301513671875, 0.6394195556640625, 0.68853759765625, 0.7376556396484375, 0.786773681640625, 0.8358917236328125, 0.885009765625, 0.9341278076171875, 0.983245849609375, 1.0323638916015625, 1.08148193359375, 1.1305999755859375, 1.179718017578125, 1.2288360595703125, 1.2779541015625, 1.3270721435546875, 1.376190185546875, 1.4253082275390625, 1.47442626953125, 1.5235443115234375, 1.572662353515625, 1.6217803955078125, 1.6708984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 2.0, 8.0, 9.0, 10.0, 15.0, 20.0, 30.0, 45.0, 77.0, 113.0, 191.0, 324.0, 625.0, 1353.0, 3192.0, 10471.0, 52771.0, 675818.0, 265441.0, 26898.0, 6582.0, 2347.0, 1002.0, 482.0, 281.0, 161.0, 99.0, 55.0, 35.0, 23.0, 26.0, 11.0, 10.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.7578125, -2.6848907470703125, -2.611968994140625, -2.5390472412109375, -2.46612548828125, -2.3932037353515625, -2.320281982421875, -2.2473602294921875, -2.1744384765625, -2.1015167236328125, -2.028594970703125, -1.9556732177734375, -1.88275146484375, -1.8098297119140625, -1.736907958984375, -1.6639862060546875, -1.591064453125, -1.5181427001953125, -1.445220947265625, -1.3722991943359375, -1.29937744140625, -1.2264556884765625, -1.153533935546875, -1.0806121826171875, -1.0076904296875, -0.9347686767578125, -0.861846923828125, -0.7889251708984375, -0.71600341796875, -0.6430816650390625, -0.570159912109375, -0.4972381591796875, -0.42431640625, -0.3513946533203125, -0.278472900390625, -0.2055511474609375, -0.13262939453125, -0.0597076416015625, 0.013214111328125, 0.0861358642578125, 0.1590576171875, 0.2319793701171875, 0.304901123046875, 0.3778228759765625, 0.45074462890625, 0.5236663818359375, 0.596588134765625, 0.6695098876953125, 0.742431640625, 0.8153533935546875, 0.888275146484375, 0.9611968994140625, 1.03411865234375, 1.1070404052734375, 1.179962158203125, 1.2528839111328125, 1.3258056640625, 1.3987274169921875, 1.471649169921875, 1.5445709228515625, 1.61749267578125, 1.6904144287109375, 1.763336181640625, 1.8362579345703125, 1.9091796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 9.0, 11.0, 9.0, 15.0, 11.0, 15.0, 34.0, 30.0, 73.0, 90.0, 130.0, 159.0, 119.0, 85.0, 55.0, 45.0, 32.0, 20.0, 14.0, 8.0, 11.0, 9.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031256675720214844, -0.00030482932925224304, -0.00029709190130233765, -0.00028935447335243225, -0.00028161704540252686, -0.00027387961745262146, -0.00026614218950271606, -0.00025840476155281067, -0.0002506673336029053, -0.00024292990565299988, -0.00023519247770309448, -0.0002274550497531891, -0.0002197176218032837, -0.0002119801938533783, -0.0002042427659034729, -0.0001965053379535675, -0.0001887679100036621, -0.00018103048205375671, -0.00017329305410385132, -0.00016555562615394592, -0.00015781819820404053, -0.00015008077025413513, -0.00014234334230422974, -0.00013460591435432434, -0.00012686848640441895, -0.00011913105845451355, -0.00011139363050460815, -0.00010365620255470276, -9.591877460479736e-05, -8.818134665489197e-05, -8.044391870498657e-05, -7.270649075508118e-05, -6.496906280517578e-05, -5.7231634855270386e-05, -4.949420690536499e-05, -4.1756778955459595e-05, -3.40193510055542e-05, -2.6281923055648804e-05, -1.8544495105743408e-05, -1.0807067155838013e-05, -3.069639205932617e-06, 4.667788743972778e-06, 1.2405216693878174e-05, 2.014264464378357e-05, 2.7880072593688965e-05, 3.561750054359436e-05, 4.3354928493499756e-05, 5.109235644340515e-05, 5.882978439331055e-05, 6.656721234321594e-05, 7.430464029312134e-05, 8.204206824302673e-05, 8.977949619293213e-05, 9.751692414283752e-05, 0.00010525435209274292, 0.00011299178004264832, 0.00012072920799255371, 0.0001284666359424591, 0.0001362040638923645, 0.0001439414918422699, 0.0001516789197921753, 0.0001594163477420807, 0.00016715377569198608, 0.00017489120364189148, 0.00018262863159179688]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 12.0, 20.0, 19.0, 29.0, 51.0, 81.0, 147.0, 374.0, 1214.0, 6868.0, 127887.0, 881388.0, 26416.0, 2810.0, 688.0, 227.0, 117.0, 67.0, 34.0, 30.0, 15.0, 13.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4453125, -4.30755615234375, -4.1697998046875, -4.03204345703125, -3.894287109375, -3.75653076171875, -3.6187744140625, -3.48101806640625, -3.34326171875, -3.20550537109375, -3.0677490234375, -2.92999267578125, -2.792236328125, -2.65447998046875, -2.5167236328125, -2.37896728515625, -2.2412109375, -2.10345458984375, -1.9656982421875, -1.82794189453125, -1.690185546875, -1.55242919921875, -1.4146728515625, -1.27691650390625, -1.13916015625, -1.00140380859375, -0.8636474609375, -0.72589111328125, -0.588134765625, -0.45037841796875, -0.3126220703125, -0.17486572265625, -0.037109375, 0.10064697265625, 0.2384033203125, 0.37615966796875, 0.513916015625, 0.65167236328125, 0.7894287109375, 0.92718505859375, 1.06494140625, 1.20269775390625, 1.3404541015625, 1.47821044921875, 1.615966796875, 1.75372314453125, 1.8914794921875, 2.02923583984375, 2.1669921875, 2.30474853515625, 2.4425048828125, 2.58026123046875, 2.718017578125, 2.85577392578125, 2.9935302734375, 3.13128662109375, 3.26904296875, 3.40679931640625, 3.5445556640625, 3.68231201171875, 3.820068359375, 3.95782470703125, 4.0955810546875, 4.23333740234375, 4.37109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 10.0, 11.0, 6.0, 11.0, 14.0, 23.0, 37.0, 51.0, 83.0, 113.0, 178.0, 142.0, 85.0, 65.0, 46.0, 32.0, 25.0, 12.0, 9.0, 8.0, 6.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.303924560546875, -1.25335693359375, -1.202789306640625, -1.1522216796875, -1.101654052734375, -1.05108642578125, -1.000518798828125, -0.949951171875, -0.899383544921875, -0.84881591796875, -0.798248291015625, -0.7476806640625, -0.697113037109375, -0.64654541015625, -0.595977783203125, -0.54541015625, -0.494842529296875, -0.44427490234375, -0.393707275390625, -0.3431396484375, -0.292572021484375, -0.24200439453125, -0.191436767578125, -0.140869140625, -0.090301513671875, -0.03973388671875, 0.010833740234375, 0.0614013671875, 0.111968994140625, 0.16253662109375, 0.213104248046875, 0.263671875, 0.314239501953125, 0.36480712890625, 0.415374755859375, 0.4659423828125, 0.516510009765625, 0.56707763671875, 0.617645263671875, 0.668212890625, 0.718780517578125, 0.76934814453125, 0.819915771484375, 0.8704833984375, 0.921051025390625, 0.97161865234375, 1.022186279296875, 1.07275390625, 1.123321533203125, 1.17388916015625, 1.224456787109375, 1.2750244140625, 1.325592041015625, 1.37615966796875, 1.426727294921875, 1.477294921875, 1.527862548828125, 1.57843017578125, 1.628997802734375, 1.6795654296875, 1.730133056640625, 1.78070068359375, 1.831268310546875, 1.8818359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 82.0, 670.0, 223.0, 15.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.108497619628906, -32.86878967285156, -30.62908172607422, -28.389375686645508, -26.149667739868164, -23.90995979309082, -21.67025375366211, -19.430545806884766, -17.190837860107422, -14.951129913330078, -12.71142292022705, -10.471715927124023, -8.23200798034668, -5.992300033569336, -3.7525930404663086, -1.5128860473632812, 0.7268218994140625, 2.966529369354248, 5.206236839294434, 7.445944309234619, 9.685651779174805, 11.925359725952148, 14.165066719055176, 16.404773712158203, 18.644481658935547, 20.88418960571289, 23.123897552490234, 25.363603591918945, 27.60331153869629, 29.843019485473633, 32.082725524902344, 34.32243347167969, 36.5621337890625, 38.801841735839844, 41.04154968261719, 43.28125762939453, 45.520965576171875, 47.76067352294922, 50.0003776550293, 52.24008560180664, 54.479793548583984, 56.71950149536133, 58.95920944213867, 61.198917388916016, 63.438621520996094, 65.67832946777344, 67.91803741455078, 70.15774536132812, 72.39745330810547, 74.63716125488281, 76.87686920166016, 79.1165771484375, 81.35628509521484, 83.59599304199219, 85.83570098876953, 88.07540893554688, 90.31510925292969, 92.55481719970703, 94.79452514648438, 97.03423309326172, 99.27394104003906, 101.5136489868164, 103.75335693359375, 105.99305725097656, 108.23277282714844]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 9.0, 9.0, 14.0, 16.0, 27.0, 36.0, 37.0, 50.0, 52.0, 62.0, 82.0, 77.0, 60.0, 90.0, 56.0, 64.0, 54.0, 50.0, 32.0, 38.0, 30.0, 11.0, 14.0, 13.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03494644165039, -11.450518608093262, -10.866090774536133, -10.28166389465332, -9.697236061096191, -9.112808227539062, -8.528380393981934, -7.943953037261963, -7.359525203704834, -6.775097370147705, -6.190670013427734, -5.6062421798706055, -5.021814346313477, -4.437386989593506, -3.852959156036377, -3.2685317993164062, -2.6841039657592773, -2.0996763706207275, -1.5152486562728882, -0.9308209419250488, -0.346393346786499, 0.23803424835205078, 0.8224620819091797, 1.4068894386291504, 1.9913172721862793, 2.575744867324829, 3.160172462463379, 3.744600296020508, 4.329028129577637, 4.913455486297607, 5.497883319854736, 6.082310676574707, 6.666738510131836, 7.251166343688965, 7.8355937004089355, 8.420021057128906, 9.004448890686035, 9.588876724243164, 10.173304557800293, 10.757732391357422, 11.342159271240234, 11.926587104797363, 12.511014938354492, 13.095441818237305, 13.679869651794434, 14.264297485351562, 14.848725318908691, 15.43315315246582, 16.017581939697266, 16.602008819580078, 17.186437606811523, 17.770864486694336, 18.35529327392578, 18.939720153808594, 19.524147033691406, 20.10857582092285, 20.693002700805664, 21.277429580688477, 21.861858367919922, 22.446285247802734, 23.03071403503418, 23.615140914916992, 24.199569702148438, 24.78399658203125, 25.368423461914062]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 10.0, 11.0, 38.0, 62.0, 120.0, 429.0, 3266.0, 4135134.0, 52832.0, 1662.0, 364.0, 159.0, 64.0, 50.0, 30.0, 15.0, 7.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.25, -14.55078125, -13.8515625, -13.15234375, -12.453125, -11.75390625, -11.0546875, -10.35546875, -9.65625, -8.95703125, -8.2578125, -7.55859375, -6.859375, -6.16015625, -5.4609375, -4.76171875, -4.0625, -3.36328125, -2.6640625, -1.96484375, -1.265625, -0.56640625, 0.1328125, 0.83203125, 1.53125, 2.23046875, 2.9296875, 3.62890625, 4.328125, 5.02734375, 5.7265625, 6.42578125, 7.125, 7.82421875, 8.5234375, 9.22265625, 9.921875, 10.62109375, 11.3203125, 12.01953125, 12.71875, 13.41796875, 14.1171875, 14.81640625, 15.515625, 16.21484375, 16.9140625, 17.61328125, 18.3125, 19.01171875, 19.7109375, 20.41015625, 21.109375, 21.80859375, 22.5078125, 23.20703125, 23.90625, 24.60546875, 25.3046875, 26.00390625, 26.703125, 27.40234375, 28.1015625, 28.80078125, 29.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 9.0, 9.0, 16.0, 34.0, 47.0, 78.0, 125.0, 127.0, 155.0, 143.0, 88.0, 66.0, 40.0, 12.0, 18.0, 6.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44189453125, -0.42120361328125, -0.4005126953125, -0.37982177734375, -0.359130859375, -0.33843994140625, -0.3177490234375, -0.29705810546875, -0.2763671875, -0.25567626953125, -0.2349853515625, -0.21429443359375, -0.193603515625, -0.17291259765625, -0.1522216796875, -0.13153076171875, -0.11083984375, -0.09014892578125, -0.0694580078125, -0.04876708984375, -0.028076171875, -0.00738525390625, 0.0133056640625, 0.03399658203125, 0.0546875, 0.07537841796875, 0.0960693359375, 0.11676025390625, 0.137451171875, 0.15814208984375, 0.1788330078125, 0.19952392578125, 0.22021484375, 0.24090576171875, 0.2615966796875, 0.28228759765625, 0.302978515625, 0.32366943359375, 0.3443603515625, 0.36505126953125, 0.3857421875, 0.40643310546875, 0.4271240234375, 0.44781494140625, 0.468505859375, 0.48919677734375, 0.5098876953125, 0.53057861328125, 0.55126953125, 0.57196044921875, 0.5926513671875, 0.61334228515625, 0.634033203125, 0.65472412109375, 0.6754150390625, 0.69610595703125, 0.716796875, 0.73748779296875, 0.7581787109375, 0.77886962890625, 0.799560546875, 0.82025146484375, 0.8409423828125, 0.86163330078125, 0.88232421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 1.0, 15.0, 3.0, 11.0, 16.0, 21.0, 33.0, 32.0, 62.0, 70.0, 109.0, 158.0, 192.0, 397.0, 884.0, 2690.0, 13107.0, 164334.0, 3876859.0, 120070.0, 10841.0, 2406.0, 885.0, 401.0, 230.0, 145.0, 83.0, 72.0, 38.0, 30.0, 20.0, 27.0, 11.0, 9.0, 5.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04296875, -3.928924560546875, -3.81488037109375, -3.700836181640625, -3.5867919921875, -3.472747802734375, -3.35870361328125, -3.244659423828125, -3.130615234375, -3.016571044921875, -2.90252685546875, -2.788482666015625, -2.6744384765625, -2.560394287109375, -2.44635009765625, -2.332305908203125, -2.21826171875, -2.104217529296875, -1.99017333984375, -1.876129150390625, -1.7620849609375, -1.648040771484375, -1.53399658203125, -1.419952392578125, -1.305908203125, -1.191864013671875, -1.07781982421875, -0.963775634765625, -0.8497314453125, -0.735687255859375, -0.62164306640625, -0.507598876953125, -0.3935546875, -0.279510498046875, -0.16546630859375, -0.051422119140625, 0.0626220703125, 0.176666259765625, 0.29071044921875, 0.404754638671875, 0.518798828125, 0.632843017578125, 0.74688720703125, 0.860931396484375, 0.9749755859375, 1.089019775390625, 1.20306396484375, 1.317108154296875, 1.43115234375, 1.545196533203125, 1.65924072265625, 1.773284912109375, 1.8873291015625, 2.001373291015625, 2.11541748046875, 2.229461669921875, 2.343505859375, 2.457550048828125, 2.57159423828125, 2.685638427734375, 2.7996826171875, 2.913726806640625, 3.02777099609375, 3.141815185546875, 3.255859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 2.0, 6.0, 4.0, 8.0, 23.0, 31.0, 58.0, 98.0, 222.0, 566.0, 1820.0, 688.0, 255.0, 129.0, 56.0, 23.0, 26.0, 17.0, 13.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.6544647216796875, -0.630706787109375, -0.6069488525390625, -0.58319091796875, -0.5594329833984375, -0.535675048828125, -0.5119171142578125, -0.4881591796875, -0.4644012451171875, -0.440643310546875, -0.4168853759765625, -0.39312744140625, -0.3693695068359375, -0.345611572265625, -0.3218536376953125, -0.298095703125, -0.2743377685546875, -0.250579833984375, -0.2268218994140625, -0.20306396484375, -0.1793060302734375, -0.155548095703125, -0.1317901611328125, -0.1080322265625, -0.0842742919921875, -0.060516357421875, -0.0367584228515625, -0.01300048828125, 0.0107574462890625, 0.034515380859375, 0.0582733154296875, 0.08203125, 0.1057891845703125, 0.129547119140625, 0.1533050537109375, 0.17706298828125, 0.2008209228515625, 0.224578857421875, 0.2483367919921875, 0.2720947265625, 0.2958526611328125, 0.319610595703125, 0.3433685302734375, 0.36712646484375, 0.3908843994140625, 0.414642333984375, 0.4384002685546875, 0.462158203125, 0.4859161376953125, 0.509674072265625, 0.5334320068359375, 0.55718994140625, 0.5809478759765625, 0.604705810546875, 0.6284637451171875, 0.6522216796875, 0.6759796142578125, 0.699737548828125, 0.7234954833984375, 0.74725341796875, 0.7710113525390625, 0.794769287109375, 0.8185272216796875, 0.84228515625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 12.0, 41.0, 80.0, 208.0, 283.0, 214.0, 93.0, 36.0, 16.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.427711486816406, -5.26033353805542, -5.092955589294434, -4.9255781173706055, -4.758200168609619, -4.590822219848633, -4.423444747924805, -4.256066799163818, -4.088688850402832, -3.9213109016418457, -3.7539331912994385, -3.5865554809570312, -3.419177532196045, -3.2517995834350586, -3.0844218730926514, -2.917044162750244, -2.749666213989258, -2.5822882652282715, -2.4149105548858643, -2.247532844543457, -2.0801548957824707, -1.912777066230774, -1.7453992366790771, -1.5780214071273804, -1.4106435775756836, -1.2432657480239868, -1.07588791847229, -0.9085100889205933, -0.7411322593688965, -0.5737544298171997, -0.40637660026550293, -0.23899877071380615, -0.07162094116210938, 0.0957568883895874, 0.2631347179412842, 0.43051254749298096, 0.5978903770446777, 0.7652682065963745, 0.9326460361480713, 1.100023865699768, 1.2674016952514648, 1.4347795248031616, 1.6021573543548584, 1.7695351839065552, 1.936913013458252, 2.1042909622192383, 2.2716686725616455, 2.4390463829040527, 2.606424331665039, 2.7738022804260254, 2.9411799907684326, 3.10855770111084, 3.275935649871826, 3.4433135986328125, 3.6106913089752197, 3.778069019317627, 3.9454469680786133, 4.1128249168396, 4.280202865600586, 4.447580337524414, 4.6149582862854, 4.782336235046387, 4.949713706970215, 5.117091655731201, 5.2844696044921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 17.0, 18.0, 22.0, 27.0, 41.0, 29.0, 45.0, 41.0, 50.0, 53.0, 46.0, 51.0, 51.0, 59.0, 45.0, 57.0, 46.0, 57.0, 39.0, 37.0, 27.0, 34.0, 29.0, 15.0, 5.0, 12.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01511812210083, -1.9434629678726196, -1.8718078136444092, -1.8001526594161987, -1.7284975051879883, -1.6568423509597778, -1.5851871967315674, -1.5135321617126465, -1.4418768882751465, -1.370221734046936, -1.2985665798187256, -1.2269114255905151, -1.1552562713623047, -1.0836011171340942, -1.0119459629058838, -0.9402908682823181, -0.8686357736587524, -0.796980619430542, -0.7253254652023315, -0.6536703109741211, -0.5820151567459106, -0.5103600025177002, -0.4387049078941345, -0.3670497536659241, -0.2953945994377136, -0.22373944520950317, -0.15208430588245392, -0.08042916655540466, -0.008774012327194214, 0.06288114190101624, 0.1345362663269043, 0.20619142055511475, 0.2778465747833252, 0.34950172901153564, 0.4211568832397461, 0.49281200766563416, 0.564467191696167, 0.6361223459243774, 0.7077774405479431, 0.7794325947761536, 0.851087749004364, 0.9227429032325745, 0.9943980574607849, 1.0660531520843506, 1.137708306312561, 1.2093634605407715, 1.281018614768982, 1.3526737689971924, 1.4243289232254028, 1.4959840774536133, 1.5676392316818237, 1.6392943859100342, 1.7109495401382446, 1.782604694366455, 1.854259729385376, 1.925915002822876, 1.9975700378417969, 2.0692250728607178, 2.1408803462982178, 2.2125353813171387, 2.2841906547546387, 2.3558456897735596, 2.4275009632110596, 2.4991559982299805, 2.5708112716674805]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 9.0, 5.0, 21.0, 25.0, 29.0, 85.0, 128.0, 248.0, 516.0, 1327.0, 4113.0, 22978.0, 604099.0, 393347.0, 15971.0, 3496.0, 1168.0, 457.0, 216.0, 128.0, 74.0, 33.0, 18.0, 12.0, 12.0, 10.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.81640625, -4.66064453125, -4.5048828125, -4.34912109375, -4.193359375, -4.03759765625, -3.8818359375, -3.72607421875, -3.5703125, -3.41455078125, -3.2587890625, -3.10302734375, -2.947265625, -2.79150390625, -2.6357421875, -2.47998046875, -2.32421875, -2.16845703125, -2.0126953125, -1.85693359375, -1.701171875, -1.54541015625, -1.3896484375, -1.23388671875, -1.078125, -0.92236328125, -0.7666015625, -0.61083984375, -0.455078125, -0.29931640625, -0.1435546875, 0.01220703125, 0.16796875, 0.32373046875, 0.4794921875, 0.63525390625, 0.791015625, 0.94677734375, 1.1025390625, 1.25830078125, 1.4140625, 1.56982421875, 1.7255859375, 1.88134765625, 2.037109375, 2.19287109375, 2.3486328125, 2.50439453125, 2.66015625, 2.81591796875, 2.9716796875, 3.12744140625, 3.283203125, 3.43896484375, 3.5947265625, 3.75048828125, 3.90625, 4.06201171875, 4.2177734375, 4.37353515625, 4.529296875, 4.68505859375, 4.8408203125, 4.99658203125, 5.15234375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 11.0, 12.0, 24.0, 35.0, 70.0, 86.0, 123.0, 160.0, 159.0, 129.0, 68.0, 53.0, 25.0, 14.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444091796875, -0.4237861633300781, -0.40348052978515625, -0.3831748962402344, -0.3628692626953125, -0.3425636291503906, -0.32225799560546875, -0.3019523620605469, -0.281646728515625, -0.2613410949707031, -0.24103546142578125, -0.22072982788085938, -0.2004241943359375, -0.18011856079101562, -0.15981292724609375, -0.13950729370117188, -0.11920166015625, -0.09889602661132812, -0.07859039306640625, -0.058284759521484375, -0.0379791259765625, -0.017673492431640625, 0.00263214111328125, 0.022937774658203125, 0.043243408203125, 0.06354904174804688, 0.08385467529296875, 0.10416030883789062, 0.1244659423828125, 0.14477157592773438, 0.16507720947265625, 0.18538284301757812, 0.2056884765625, 0.22599411010742188, 0.24629974365234375, 0.2666053771972656, 0.2869110107421875, 0.3072166442871094, 0.32752227783203125, 0.3478279113769531, 0.368133544921875, 0.3884391784667969, 0.40874481201171875, 0.4290504455566406, 0.4493560791015625, 0.4696617126464844, 0.48996734619140625, 0.5102729797363281, 0.53057861328125, 0.5508842468261719, 0.5711898803710938, 0.5914955139160156, 0.6118011474609375, 0.6321067810058594, 0.6524124145507812, 0.6727180480957031, 0.693023681640625, 0.7133293151855469, 0.7336349487304688, 0.7539405822753906, 0.7742462158203125, 0.7945518493652344, 0.8148574829101562, 0.8351631164550781, 0.85546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 6.0, 10.0, 11.0, 24.0, 22.0, 41.0, 52.0, 56.0, 92.0, 122.0, 195.0, 348.0, 576.0, 990.0, 2079.0, 4527.0, 12887.0, 46764.0, 197997.0, 449671.0, 245089.0, 59973.0, 16076.0, 5699.0, 2282.0, 1103.0, 601.0, 388.0, 267.0, 183.0, 122.0, 86.0, 53.0, 42.0, 26.0, 29.0, 13.0, 12.0, 7.0, 8.0, 7.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.972259521484375, -1.91522216796875, -1.858184814453125, -1.8011474609375, -1.744110107421875, -1.68707275390625, -1.630035400390625, -1.572998046875, -1.515960693359375, -1.45892333984375, -1.401885986328125, -1.3448486328125, -1.287811279296875, -1.23077392578125, -1.173736572265625, -1.11669921875, -1.059661865234375, -1.00262451171875, -0.945587158203125, -0.8885498046875, -0.831512451171875, -0.77447509765625, -0.717437744140625, -0.660400390625, -0.603363037109375, -0.54632568359375, -0.489288330078125, -0.4322509765625, -0.375213623046875, -0.31817626953125, -0.261138916015625, -0.2041015625, -0.147064208984375, -0.09002685546875, -0.032989501953125, 0.0240478515625, 0.081085205078125, 0.13812255859375, 0.195159912109375, 0.252197265625, 0.309234619140625, 0.36627197265625, 0.423309326171875, 0.4803466796875, 0.537384033203125, 0.59442138671875, 0.651458740234375, 0.70849609375, 0.765533447265625, 0.82257080078125, 0.879608154296875, 0.9366455078125, 0.993682861328125, 1.05072021484375, 1.107757568359375, 1.164794921875, 1.221832275390625, 1.27886962890625, 1.335906982421875, 1.3929443359375, 1.449981689453125, 1.50701904296875, 1.564056396484375, 1.62109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 4.0, 5.0, 8.0, 10.0, 10.0, 14.0, 21.0, 24.0, 28.0, 38.0, 31.0, 33.0, 39.0, 45.0, 39.0, 52.0, 64.0, 66.0, 51.0, 50.0, 34.0, 42.0, 48.0, 32.0, 30.0, 41.0, 23.0, 13.0, 19.0, 13.0, 9.0, 12.0, 12.0, 9.0, 5.0, 7.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.068359375, -2.01068115234375, -1.9530029296875, -1.89532470703125, -1.837646484375, -1.77996826171875, -1.7222900390625, -1.66461181640625, -1.60693359375, -1.54925537109375, -1.4915771484375, -1.43389892578125, -1.376220703125, -1.31854248046875, -1.2608642578125, -1.20318603515625, -1.1455078125, -1.08782958984375, -1.0301513671875, -0.97247314453125, -0.914794921875, -0.85711669921875, -0.7994384765625, -0.74176025390625, -0.68408203125, -0.62640380859375, -0.5687255859375, -0.51104736328125, -0.453369140625, -0.39569091796875, -0.3380126953125, -0.28033447265625, -0.22265625, -0.16497802734375, -0.1072998046875, -0.04962158203125, 0.008056640625, 0.06573486328125, 0.1234130859375, 0.18109130859375, 0.23876953125, 0.29644775390625, 0.3541259765625, 0.41180419921875, 0.469482421875, 0.52716064453125, 0.5848388671875, 0.64251708984375, 0.7001953125, 0.75787353515625, 0.8155517578125, 0.87322998046875, 0.930908203125, 0.98858642578125, 1.0462646484375, 1.10394287109375, 1.16162109375, 1.21929931640625, 1.2769775390625, 1.33465576171875, 1.392333984375, 1.45001220703125, 1.5076904296875, 1.56536865234375, 1.623046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 9.0, 9.0, 10.0, 37.0, 56.0, 92.0, 222.0, 612.0, 2241.0, 12738.0, 156106.0, 784765.0, 80871.0, 8242.0, 1660.0, 494.0, 170.0, 100.0, 44.0, 26.0, 14.0, 13.0, 6.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.439453125, -1.38275146484375, -1.3260498046875, -1.26934814453125, -1.212646484375, -1.15594482421875, -1.0992431640625, -1.04254150390625, -0.98583984375, -0.92913818359375, -0.8724365234375, -0.81573486328125, -0.759033203125, -0.70233154296875, -0.6456298828125, -0.58892822265625, -0.5322265625, -0.47552490234375, -0.4188232421875, -0.36212158203125, -0.305419921875, -0.24871826171875, -0.1920166015625, -0.13531494140625, -0.07861328125, -0.02191162109375, 0.0347900390625, 0.09149169921875, 0.148193359375, 0.20489501953125, 0.2615966796875, 0.31829833984375, 0.375, 0.43170166015625, 0.4884033203125, 0.54510498046875, 0.601806640625, 0.65850830078125, 0.7152099609375, 0.77191162109375, 0.82861328125, 0.88531494140625, 0.9420166015625, 0.99871826171875, 1.055419921875, 1.11212158203125, 1.1688232421875, 1.22552490234375, 1.2822265625, 1.33892822265625, 1.3956298828125, 1.45233154296875, 1.509033203125, 1.56573486328125, 1.6224365234375, 1.67913818359375, 1.73583984375, 1.79254150390625, 1.8492431640625, 1.90594482421875, 1.962646484375, 2.01934814453125, 2.0760498046875, 2.13275146484375, 2.189453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 5.0, 9.0, 10.0, 5.0, 8.0, 11.0, 11.0, 14.0, 6.0, 15.0, 18.0, 18.0, 19.0, 27.0, 29.0, 42.0, 59.0, 64.0, 87.0, 83.0, 62.0, 70.0, 63.0, 28.0, 26.0, 29.0, 21.0, 17.0, 18.0, 18.0, 9.0, 20.0, 12.0, 19.0, 9.0, 3.0, 8.0, 6.0, 2.0, 3.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010466575622558594, -0.00010123848915100098, -9.781122207641602e-05, -9.438395500183105e-05, -9.09566879272461e-05, -8.752942085266113e-05, -8.410215377807617e-05, -8.067488670349121e-05, -7.724761962890625e-05, -7.382035255432129e-05, -7.039308547973633e-05, -6.696581840515137e-05, -6.35385513305664e-05, -6.0111284255981445e-05, -5.6684017181396484e-05, -5.3256750106811523e-05, -4.982948303222656e-05, -4.64022159576416e-05, -4.297494888305664e-05, -3.954768180847168e-05, -3.612041473388672e-05, -3.269314765930176e-05, -2.9265880584716797e-05, -2.5838613510131836e-05, -2.2411346435546875e-05, -1.8984079360961914e-05, -1.5556812286376953e-05, -1.2129545211791992e-05, -8.702278137207031e-06, -5.27501106262207e-06, -1.8477439880371094e-06, 1.5795230865478516e-06, 5.0067901611328125e-06, 8.434057235717773e-06, 1.1861324310302734e-05, 1.5288591384887695e-05, 1.8715858459472656e-05, 2.2143125534057617e-05, 2.5570392608642578e-05, 2.899765968322754e-05, 3.24249267578125e-05, 3.585219383239746e-05, 3.927946090698242e-05, 4.270672798156738e-05, 4.6133995056152344e-05, 4.9561262130737305e-05, 5.2988529205322266e-05, 5.6415796279907227e-05, 5.984306335449219e-05, 6.327033042907715e-05, 6.669759750366211e-05, 7.012486457824707e-05, 7.355213165283203e-05, 7.697939872741699e-05, 8.040666580200195e-05, 8.383393287658691e-05, 8.726119995117188e-05, 9.068846702575684e-05, 9.41157341003418e-05, 9.754300117492676e-05, 0.00010097026824951172, 0.00010439753532409668, 0.00010782480239868164, 0.0001112520694732666, 0.00011467933654785156]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 13.0, 13.0, 27.0, 45.0, 76.0, 137.0, 317.0, 823.0, 2956.0, 21170.0, 353704.0, 628590.0, 34616.0, 4306.0, 1004.0, 357.0, 175.0, 80.0, 39.0, 40.0, 19.0, 15.0, 4.0, 5.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.096649169921875, -2.02923583984375, -1.961822509765625, -1.8944091796875, -1.826995849609375, -1.75958251953125, -1.692169189453125, -1.624755859375, -1.557342529296875, -1.48992919921875, -1.422515869140625, -1.3551025390625, -1.287689208984375, -1.22027587890625, -1.152862548828125, -1.08544921875, -1.018035888671875, -0.95062255859375, -0.883209228515625, -0.8157958984375, -0.748382568359375, -0.68096923828125, -0.613555908203125, -0.546142578125, -0.478729248046875, -0.41131591796875, -0.343902587890625, -0.2764892578125, -0.209075927734375, -0.14166259765625, -0.074249267578125, -0.0068359375, 0.060577392578125, 0.12799072265625, 0.195404052734375, 0.2628173828125, 0.330230712890625, 0.39764404296875, 0.465057373046875, 0.532470703125, 0.599884033203125, 0.66729736328125, 0.734710693359375, 0.8021240234375, 0.869537353515625, 0.93695068359375, 1.004364013671875, 1.07177734375, 1.139190673828125, 1.20660400390625, 1.274017333984375, 1.3414306640625, 1.408843994140625, 1.47625732421875, 1.543670654296875, 1.611083984375, 1.678497314453125, 1.74591064453125, 1.813323974609375, 1.8807373046875, 1.948150634765625, 2.01556396484375, 2.082977294921875, 2.150390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 10.0, 11.0, 10.0, 20.0, 22.0, 30.0, 29.0, 28.0, 67.0, 68.0, 75.0, 71.0, 102.0, 84.0, 70.0, 67.0, 52.0, 40.0, 32.0, 26.0, 16.0, 16.0, 12.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8802871704101562, -0.8538360595703125, -0.8273849487304688, -0.800933837890625, -0.7744827270507812, -0.7480316162109375, -0.7215805053710938, -0.69512939453125, -0.6686782836914062, -0.6422271728515625, -0.6157760620117188, -0.589324951171875, -0.5628738403320312, -0.5364227294921875, -0.5099716186523438, -0.4835205078125, -0.45706939697265625, -0.4306182861328125, -0.40416717529296875, -0.377716064453125, -0.35126495361328125, -0.3248138427734375, -0.29836273193359375, -0.27191162109375, -0.24546051025390625, -0.2190093994140625, -0.19255828857421875, -0.166107177734375, -0.13965606689453125, -0.1132049560546875, -0.08675384521484375, -0.060302734375, -0.03385162353515625, -0.0074005126953125, 0.01905059814453125, 0.045501708984375, 0.07195281982421875, 0.0984039306640625, 0.12485504150390625, 0.15130615234375, 0.17775726318359375, 0.2042083740234375, 0.23065948486328125, 0.257110595703125, 0.28356170654296875, 0.3100128173828125, 0.33646392822265625, 0.3629150390625, 0.38936614990234375, 0.4158172607421875, 0.44226837158203125, 0.468719482421875, 0.49517059326171875, 0.5216217041015625, 0.5480728149414062, 0.57452392578125, 0.6009750366210938, 0.6274261474609375, 0.6538772583007812, 0.680328369140625, 0.7067794799804688, 0.7332305908203125, 0.7596817016601562, 0.7861328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 24.0, 97.0, 442.0, 355.0, 69.0, 15.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.884952545166016, -26.552288055419922, -25.21962547302246, -23.886960983276367, -22.554296493530273, -21.221633911132812, -19.88896942138672, -18.556304931640625, -17.22364044189453, -15.890976905822754, -14.55831241607666, -13.225648880004883, -11.892984390258789, -10.560320854187012, -9.227657318115234, -7.894992828369141, -6.56233024597168, -5.229666233062744, -3.8970024585723877, -2.5643386840820312, -1.2316746711730957, 0.10098934173583984, 1.4336528778076172, 2.766317367553711, 4.098980903625488, 5.431644916534424, 6.764308929443359, 8.096972465515137, 9.429636001586914, 10.762300491333008, 12.094964027404785, 13.427628517150879, 14.760292053222656, 16.09295654296875, 17.42561912536621, 18.758283615112305, 20.0909481048584, 21.42361068725586, 22.756275177001953, 24.088939666748047, 25.42160415649414, 26.754268646240234, 28.086931228637695, 29.41959571838379, 30.752260208129883, 32.084922790527344, 33.41758728027344, 34.75025177001953, 36.082916259765625, 37.41558074951172, 38.74824523925781, 40.080909729003906, 41.413570404052734, 42.74623489379883, 44.07889938354492, 45.411563873291016, 46.744224548339844, 48.07688903808594, 49.40955352783203, 50.742218017578125, 52.07487869262695, 53.40754318237305, 54.74020767211914, 56.072872161865234, 57.40553665161133]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 10.0, 9.0, 11.0, 12.0, 24.0, 19.0, 27.0, 28.0, 48.0, 44.0, 55.0, 50.0, 65.0, 64.0, 60.0, 59.0, 68.0, 48.0, 52.0, 50.0, 30.0, 29.0, 29.0, 24.0, 15.0, 23.0, 13.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.13050651550293, -15.670450210571289, -15.210392951965332, -14.750336647033691, -14.290279388427734, -13.830223083496094, -13.370166778564453, -12.910109519958496, -12.450052261352539, -11.989995956420898, -11.529938697814941, -11.0698823928833, -10.609825134277344, -10.149768829345703, -9.689712524414062, -9.229655265808105, -8.769598960876465, -8.309542655944824, -7.849485397338867, -7.389429092407227, -6.9293718338012695, -6.469315528869629, -6.00925874710083, -5.549201965332031, -5.089145183563232, -4.629088401794434, -4.169031620025635, -3.708975076675415, -3.248918294906616, -2.7888615131378174, -2.3288049697875977, -1.8687481880187988, -1.40869140625, -0.948634684085846, -0.4885779619216919, -0.028521299362182617, 0.4315354824066162, 0.891592264175415, 1.3516488075256348, 1.8117055892944336, 2.2717623710632324, 2.7318191528320312, 3.19187593460083, 3.65193247795105, 4.1119890213012695, 4.572046279907227, 5.032102584838867, 5.492159366607666, 5.952216148376465, 6.412272930145264, 6.8723297119140625, 7.332386016845703, 7.79244327545166, 8.2524995803833, 8.712556838989258, 9.172613143920898, 9.632669448852539, 10.09272575378418, 10.552783012390137, 11.012839317321777, 11.472896575927734, 11.932952880859375, 12.393009185791016, 12.853066444396973, 13.31312370300293]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 9.0, 5.0, 12.0, 13.0, 30.0, 54.0, 103.0, 231.0, 490.0, 1467.0, 8193.0, 366030.0, 3798555.0, 15172.0, 2479.0, 729.0, 335.0, 170.0, 62.0, 51.0, 26.0, 24.0, 14.0, 9.0, 4.0, 1.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.1009521484375, -5.916748046875, -5.7325439453125, -5.54833984375, -5.3641357421875, -5.179931640625, -4.9957275390625, -4.8115234375, -4.6273193359375, -4.443115234375, -4.2589111328125, -4.07470703125, -3.8905029296875, -3.706298828125, -3.5220947265625, -3.337890625, -3.1536865234375, -2.969482421875, -2.7852783203125, -2.60107421875, -2.4168701171875, -2.232666015625, -2.0484619140625, -1.8642578125, -1.6800537109375, -1.495849609375, -1.3116455078125, -1.12744140625, -0.9432373046875, -0.759033203125, -0.5748291015625, -0.390625, -0.2064208984375, -0.022216796875, 0.1619873046875, 0.34619140625, 0.5303955078125, 0.714599609375, 0.8988037109375, 1.0830078125, 1.2672119140625, 1.451416015625, 1.6356201171875, 1.81982421875, 2.0040283203125, 2.188232421875, 2.3724365234375, 2.556640625, 2.7408447265625, 2.925048828125, 3.1092529296875, 3.29345703125, 3.4776611328125, 3.661865234375, 3.8460693359375, 4.0302734375, 4.2144775390625, 4.398681640625, 4.5828857421875, 4.76708984375, 4.9512939453125, 5.135498046875, 5.3197021484375, 5.50390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 11.0, 18.0, 23.0, 55.0, 58.0, 77.0, 124.0, 120.0, 151.0, 110.0, 83.0, 53.0, 43.0, 32.0, 13.0, 10.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56689453125, -0.5433502197265625, -0.519805908203125, -0.4962615966796875, -0.47271728515625, -0.4491729736328125, -0.425628662109375, -0.4020843505859375, -0.3785400390625, -0.3549957275390625, -0.331451416015625, -0.3079071044921875, -0.28436279296875, -0.2608184814453125, -0.237274169921875, -0.2137298583984375, -0.190185546875, -0.1666412353515625, -0.143096923828125, -0.1195526123046875, -0.09600830078125, -0.0724639892578125, -0.048919677734375, -0.0253753662109375, -0.0018310546875, 0.0217132568359375, 0.045257568359375, 0.0688018798828125, 0.09234619140625, 0.1158905029296875, 0.139434814453125, 0.1629791259765625, 0.1865234375, 0.2100677490234375, 0.233612060546875, 0.2571563720703125, 0.28070068359375, 0.3042449951171875, 0.327789306640625, 0.3513336181640625, 0.3748779296875, 0.3984222412109375, 0.421966552734375, 0.4455108642578125, 0.46905517578125, 0.4925994873046875, 0.516143798828125, 0.5396881103515625, 0.563232421875, 0.5867767333984375, 0.610321044921875, 0.6338653564453125, 0.65740966796875, 0.6809539794921875, 0.704498291015625, 0.7280426025390625, 0.7515869140625, 0.7751312255859375, 0.798675537109375, 0.8222198486328125, 0.84576416015625, 0.8693084716796875, 0.892852783203125, 0.9163970947265625, 0.93994140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 5.0, 4.0, 11.0, 10.0, 19.0, 19.0, 51.0, 122.0, 245.0, 676.0, 2085.0, 10316.0, 119170.0, 3890136.0, 154656.0, 12515.0, 2711.0, 847.0, 340.0, 160.0, 71.0, 49.0, 26.0, 13.0, 7.0, 10.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.931640625, -1.841949462890625, -1.75225830078125, -1.662567138671875, -1.5728759765625, -1.483184814453125, -1.39349365234375, -1.303802490234375, -1.214111328125, -1.124420166015625, -1.03472900390625, -0.945037841796875, -0.8553466796875, -0.765655517578125, -0.67596435546875, -0.586273193359375, -0.49658203125, -0.406890869140625, -0.31719970703125, -0.227508544921875, -0.1378173828125, -0.048126220703125, 0.04156494140625, 0.131256103515625, 0.220947265625, 0.310638427734375, 0.40032958984375, 0.490020751953125, 0.5797119140625, 0.669403076171875, 0.75909423828125, 0.848785400390625, 0.9384765625, 1.028167724609375, 1.11785888671875, 1.207550048828125, 1.2972412109375, 1.386932373046875, 1.47662353515625, 1.566314697265625, 1.656005859375, 1.745697021484375, 1.83538818359375, 1.925079345703125, 2.0147705078125, 2.104461669921875, 2.19415283203125, 2.283843994140625, 2.37353515625, 2.463226318359375, 2.55291748046875, 2.642608642578125, 2.7322998046875, 2.821990966796875, 2.91168212890625, 3.001373291015625, 3.091064453125, 3.180755615234375, 3.27044677734375, 3.360137939453125, 3.4498291015625, 3.539520263671875, 3.62921142578125, 3.718902587890625, 3.80859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 16.0, 16.0, 25.0, 36.0, 41.0, 66.0, 113.0, 235.0, 705.0, 1603.0, 616.0, 234.0, 128.0, 79.0, 42.0, 33.0, 19.0, 11.0, 15.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4042930603027344, -0.38549041748046875, -0.3666877746582031, -0.3478851318359375, -0.3290824890136719, -0.31027984619140625, -0.2914772033691406, -0.272674560546875, -0.2538719177246094, -0.23506927490234375, -0.21626663208007812, -0.1974639892578125, -0.17866134643554688, -0.15985870361328125, -0.14105606079101562, -0.12225341796875, -0.10345077514648438, -0.08464813232421875, -0.06584548950195312, -0.0470428466796875, -0.028240203857421875, -0.00943756103515625, 0.009365081787109375, 0.028167724609375, 0.046970367431640625, 0.06577301025390625, 0.08457565307617188, 0.1033782958984375, 0.12218093872070312, 0.14098358154296875, 0.15978622436523438, 0.1785888671875, 0.19739151000976562, 0.21619415283203125, 0.23499679565429688, 0.2537994384765625, 0.2726020812988281, 0.29140472412109375, 0.3102073669433594, 0.329010009765625, 0.3478126525878906, 0.36661529541015625, 0.3854179382324219, 0.4042205810546875, 0.4230232238769531, 0.44182586669921875, 0.4606285095214844, 0.47943115234375, 0.4982337951660156, 0.5170364379882812, 0.5358390808105469, 0.5546417236328125, 0.5734443664550781, 0.5922470092773438, 0.6110496520996094, 0.629852294921875, 0.6486549377441406, 0.6674575805664062, 0.6862602233886719, 0.7050628662109375, 0.7238655090332031, 0.7426681518554688, 0.7614707946777344, 0.7802734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 12.0, 25.0, 90.0, 205.0, 317.0, 219.0, 98.0, 24.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8646183013916016, -2.7009494304656982, -2.537280797958374, -2.3736119270324707, -2.2099432945251465, -2.046274423599243, -1.8826055526733398, -1.718936800956726, -1.5552680492401123, -1.3915992975234985, -1.2279305458068848, -1.0642616748809814, -0.9005929231643677, -0.7369241714477539, -0.5732553601264954, -0.4095865488052368, -0.24591779708862305, -0.08224901556968689, 0.08141976594924927, 0.24508854746818542, 0.4087573289871216, 0.5724260807037354, 0.7360948920249939, 0.8997637033462524, 1.0634324550628662, 1.22710120677948, 1.3907699584960938, 1.554438829421997, 1.7181075811386108, 1.8817763328552246, 2.045445203781128, 2.2091140747070312, 2.3727822303771973, 2.5364511013031006, 2.700119733810425, 2.863788604736328, 3.0274572372436523, 3.1911261081695557, 3.354794979095459, 3.518463611602783, 3.6821324825286865, 3.84580135345459, 4.009469985961914, 4.173138618469238, 4.336807727813721, 4.500476360321045, 4.664144992828369, 4.827814102172852, 4.991482734680176, 5.1551513671875, 5.318820476531982, 5.482489109039307, 5.646157741546631, 5.809826850891113, 5.9734954833984375, 6.137164115905762, 6.300832748413086, 6.46450138092041, 6.628170490264893, 6.791839122772217, 6.955507755279541, 7.119176864624023, 7.282845497131348, 7.446514129638672, 7.610183238983154]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 10.0, 2.0, 4.0, 8.0, 4.0, 7.0, 12.0, 18.0, 12.0, 13.0, 23.0, 22.0, 16.0, 32.0, 25.0, 38.0, 34.0, 33.0, 33.0, 34.0, 37.0, 43.0, 42.0, 44.0, 37.0, 40.0, 42.0, 52.0, 33.0, 29.0, 44.0, 20.0, 19.0, 20.0, 20.0, 22.0, 22.0, 9.0, 17.0, 15.0, 5.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5099492073059082, -1.4612531661987305, -1.4125571250915527, -1.363861083984375, -1.3151651620864868, -1.266469120979309, -1.2177730798721313, -1.1690770387649536, -1.1203811168670654, -1.0716850757598877, -1.02298903465271, -0.974293053150177, -0.925597071647644, -0.8769010305404663, -0.8282049894332886, -0.7795089483261108, -0.7308129072189331, -0.6821168661117554, -0.6334208846092224, -0.5847248435020447, -0.5360288619995117, -0.487332820892334, -0.43863677978515625, -0.3899407684803009, -0.34124475717544556, -0.2925487458705902, -0.24385271966457367, -0.19515669345855713, -0.14646068215370178, -0.09776467084884644, -0.0490686297416687, -0.0003726184368133545, 0.04832339286804199, 0.09701941162347794, 0.14571543037891388, 0.19441145658493042, 0.24310746788978577, 0.2918034791946411, 0.34049952030181885, 0.3891955316066742, 0.43789154291152954, 0.4865875542163849, 0.5352835655212402, 0.583979606628418, 0.6326756477355957, 0.6813716292381287, 0.7300676703453064, 0.7787636518478394, 0.8274596929550171, 0.8761557340621948, 0.9248517155647278, 0.9735477566719055, 1.0222437381744385, 1.0709397792816162, 1.119635820388794, 1.1683318614959717, 1.2170279026031494, 1.2657239437103271, 1.3144199848175049, 1.3631160259246826, 1.4118119478225708, 1.4605079889297485, 1.5092040300369263, 1.557900071144104, 1.6065959930419922]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 13.0, 7.0, 21.0, 13.0, 22.0, 36.0, 38.0, 42.0, 75.0, 102.0, 120.0, 183.0, 272.0, 411.0, 674.0, 1161.0, 2192.0, 4997.0, 14658.0, 56491.0, 247739.0, 469261.0, 187575.0, 41857.0, 11535.0, 4250.0, 1887.0, 1051.0, 616.0, 409.0, 248.0, 186.0, 117.0, 77.0, 57.0, 44.0, 32.0, 20.0, 13.0, 14.0, 10.0, 8.0, 7.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.561187744140625, -1.51300048828125, -1.464813232421875, -1.4166259765625, -1.368438720703125, -1.32025146484375, -1.272064208984375, -1.223876953125, -1.175689697265625, -1.12750244140625, -1.079315185546875, -1.0311279296875, -0.982940673828125, -0.93475341796875, -0.886566162109375, -0.83837890625, -0.790191650390625, -0.74200439453125, -0.693817138671875, -0.6456298828125, -0.597442626953125, -0.54925537109375, -0.501068115234375, -0.452880859375, -0.404693603515625, -0.35650634765625, -0.308319091796875, -0.2601318359375, -0.211944580078125, -0.16375732421875, -0.115570068359375, -0.0673828125, -0.019195556640625, 0.02899169921875, 0.077178955078125, 0.1253662109375, 0.173553466796875, 0.22174072265625, 0.269927978515625, 0.318115234375, 0.366302490234375, 0.41448974609375, 0.462677001953125, 0.5108642578125, 0.559051513671875, 0.60723876953125, 0.655426025390625, 0.70361328125, 0.751800537109375, 0.79998779296875, 0.848175048828125, 0.8963623046875, 0.944549560546875, 0.99273681640625, 1.040924072265625, 1.089111328125, 1.137298583984375, 1.18548583984375, 1.233673095703125, 1.2818603515625, 1.330047607421875, 1.37823486328125, 1.426422119140625, 1.474609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 14.0, 24.0, 37.0, 57.0, 78.0, 110.0, 141.0, 136.0, 116.0, 98.0, 62.0, 36.0, 32.0, 23.0, 11.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57080078125, -0.54736328125, -0.52392578125, -0.50048828125, -0.47705078125, -0.45361328125, -0.43017578125, -0.40673828125, -0.38330078125, -0.35986328125, -0.33642578125, -0.31298828125, -0.28955078125, -0.26611328125, -0.24267578125, -0.21923828125, -0.19580078125, -0.17236328125, -0.14892578125, -0.12548828125, -0.10205078125, -0.07861328125, -0.05517578125, -0.03173828125, -0.00830078125, 0.01513671875, 0.03857421875, 0.06201171875, 0.08544921875, 0.10888671875, 0.13232421875, 0.15576171875, 0.17919921875, 0.20263671875, 0.22607421875, 0.24951171875, 0.27294921875, 0.29638671875, 0.31982421875, 0.34326171875, 0.36669921875, 0.39013671875, 0.41357421875, 0.43701171875, 0.46044921875, 0.48388671875, 0.50732421875, 0.53076171875, 0.55419921875, 0.57763671875, 0.60107421875, 0.62451171875, 0.64794921875, 0.67138671875, 0.69482421875, 0.71826171875, 0.74169921875, 0.76513671875, 0.78857421875, 0.81201171875, 0.83544921875, 0.85888671875, 0.88232421875, 0.90576171875, 0.92919921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 14.0, 14.0, 13.0, 17.0, 25.0, 41.0, 35.0, 43.0, 74.0, 105.0, 168.0, 226.0, 419.0, 643.0, 1291.0, 2747.0, 6617.0, 19071.0, 63150.0, 210017.0, 393746.0, 239491.0, 74350.0, 22210.0, 7610.0, 3075.0, 1372.0, 722.0, 378.0, 270.0, 174.0, 115.0, 90.0, 59.0, 46.0, 28.0, 22.0, 19.0, 16.0, 7.0, 8.0, 2.0, 3.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.517578125, -1.47607421875, -1.4345703125, -1.39306640625, -1.3515625, -1.31005859375, -1.2685546875, -1.22705078125, -1.185546875, -1.14404296875, -1.1025390625, -1.06103515625, -1.01953125, -0.97802734375, -0.9365234375, -0.89501953125, -0.853515625, -0.81201171875, -0.7705078125, -0.72900390625, -0.6875, -0.64599609375, -0.6044921875, -0.56298828125, -0.521484375, -0.47998046875, -0.4384765625, -0.39697265625, -0.35546875, -0.31396484375, -0.2724609375, -0.23095703125, -0.189453125, -0.14794921875, -0.1064453125, -0.06494140625, -0.0234375, 0.01806640625, 0.0595703125, 0.10107421875, 0.142578125, 0.18408203125, 0.2255859375, 0.26708984375, 0.30859375, 0.35009765625, 0.3916015625, 0.43310546875, 0.474609375, 0.51611328125, 0.5576171875, 0.59912109375, 0.640625, 0.68212890625, 0.7236328125, 0.76513671875, 0.806640625, 0.84814453125, 0.8896484375, 0.93115234375, 0.97265625, 1.01416015625, 1.0556640625, 1.09716796875, 1.138671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 11.0, 8.0, 10.0, 8.0, 19.0, 13.0, 11.0, 31.0, 27.0, 19.0, 29.0, 32.0, 35.0, 41.0, 35.0, 44.0, 44.0, 45.0, 38.0, 39.0, 43.0, 44.0, 40.0, 35.0, 29.0, 30.0, 23.0, 20.0, 28.0, 24.0, 20.0, 26.0, 13.0, 9.0, 11.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0], "bins": [-1.7626953125, -1.711944580078125, -1.66119384765625, -1.610443115234375, -1.5596923828125, -1.508941650390625, -1.45819091796875, -1.407440185546875, -1.356689453125, -1.305938720703125, -1.25518798828125, -1.204437255859375, -1.1536865234375, -1.102935791015625, -1.05218505859375, -1.001434326171875, -0.95068359375, -0.899932861328125, -0.84918212890625, -0.798431396484375, -0.7476806640625, -0.696929931640625, -0.64617919921875, -0.595428466796875, -0.544677734375, -0.493927001953125, -0.44317626953125, -0.392425537109375, -0.3416748046875, -0.290924072265625, -0.24017333984375, -0.189422607421875, -0.138671875, -0.087921142578125, -0.03717041015625, 0.013580322265625, 0.0643310546875, 0.115081787109375, 0.16583251953125, 0.216583251953125, 0.267333984375, 0.318084716796875, 0.36883544921875, 0.419586181640625, 0.4703369140625, 0.521087646484375, 0.57183837890625, 0.622589111328125, 0.67333984375, 0.724090576171875, 0.77484130859375, 0.825592041015625, 0.8763427734375, 0.927093505859375, 0.97784423828125, 1.028594970703125, 1.079345703125, 1.130096435546875, 1.18084716796875, 1.231597900390625, 1.2823486328125, 1.333099365234375, 1.38385009765625, 1.434600830078125, 1.4853515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 7.0, 9.0, 11.0, 13.0, 38.0, 49.0, 75.0, 126.0, 234.0, 476.0, 1027.0, 2545.0, 8916.0, 38265.0, 211283.0, 564767.0, 176900.0, 32048.0, 7394.0, 2407.0, 946.0, 452.0, 203.0, 137.0, 81.0, 51.0, 33.0, 24.0, 15.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43603515625, -0.41954803466796875, -0.4030609130859375, -0.38657379150390625, -0.370086669921875, -0.35359954833984375, -0.3371124267578125, -0.32062530517578125, -0.30413818359375, -0.28765106201171875, -0.2711639404296875, -0.25467681884765625, -0.238189697265625, -0.22170257568359375, -0.2052154541015625, -0.18872833251953125, -0.1722412109375, -0.15575408935546875, -0.1392669677734375, -0.12277984619140625, -0.106292724609375, -0.08980560302734375, -0.0733184814453125, -0.05683135986328125, -0.04034423828125, -0.02385711669921875, -0.0073699951171875, 0.00911712646484375, 0.025604248046875, 0.04209136962890625, 0.0585784912109375, 0.07506561279296875, 0.091552734375, 0.10803985595703125, 0.1245269775390625, 0.14101409912109375, 0.157501220703125, 0.17398834228515625, 0.1904754638671875, 0.20696258544921875, 0.22344970703125, 0.23993682861328125, 0.2564239501953125, 0.27291107177734375, 0.289398193359375, 0.30588531494140625, 0.3223724365234375, 0.33885955810546875, 0.3553466796875, 0.37183380126953125, 0.3883209228515625, 0.40480804443359375, 0.421295166015625, 0.43778228759765625, 0.4542694091796875, 0.47075653076171875, 0.48724365234375, 0.5037307739257812, 0.5202178955078125, 0.5367050170898438, 0.553192138671875, 0.5696792602539062, 0.5861663818359375, 0.6026535034179688, 0.619140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 12.0, 7.0, 7.0, 10.0, 18.0, 21.0, 24.0, 30.0, 36.0, 24.0, 32.0, 45.0, 61.0, 80.0, 91.0, 77.0, 80.0, 51.0, 48.0, 44.0, 39.0, 20.0, 28.0, 21.0, 18.0, 4.0, 18.0, 10.0, 9.0, 5.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.715557098388672e-05, -9.412877261638641e-05, -9.110197424888611e-05, -8.80751758813858e-05, -8.50483775138855e-05, -8.202157914638519e-05, -7.899478077888489e-05, -7.596798241138458e-05, -7.294118404388428e-05, -6.991438567638397e-05, -6.688758730888367e-05, -6.386078894138336e-05, -6.083399057388306e-05, -5.780719220638275e-05, -5.4780393838882446e-05, -5.175359547138214e-05, -4.8726797103881836e-05, -4.569999873638153e-05, -4.2673200368881226e-05, -3.964640200138092e-05, -3.6619603633880615e-05, -3.359280526638031e-05, -3.0566006898880005e-05, -2.75392085313797e-05, -2.4512410163879395e-05, -2.148561179637909e-05, -1.8458813428878784e-05, -1.543201506137848e-05, -1.2405216693878174e-05, -9.378418326377869e-06, -6.3516199588775635e-06, -3.3248215913772583e-06, -2.980232238769531e-07, 2.728775143623352e-06, 5.755573511123657e-06, 8.782371878623962e-06, 1.1809170246124268e-05, 1.4835968613624573e-05, 1.7862766981124878e-05, 2.0889565348625183e-05, 2.3916363716125488e-05, 2.6943162083625793e-05, 2.99699604511261e-05, 3.2996758818626404e-05, 3.602355718612671e-05, 3.9050355553627014e-05, 4.207715392112732e-05, 4.5103952288627625e-05, 4.813075065612793e-05, 5.1157549023628235e-05, 5.418434739112854e-05, 5.7211145758628845e-05, 6.023794412612915e-05, 6.326474249362946e-05, 6.629154086112976e-05, 6.931833922863007e-05, 7.234513759613037e-05, 7.537193596363068e-05, 7.839873433113098e-05, 8.142553269863129e-05, 8.445233106613159e-05, 8.74791294336319e-05, 9.05059278011322e-05, 9.353272616863251e-05, 9.655952453613281e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 12.0, 16.0, 25.0, 44.0, 72.0, 89.0, 191.0, 311.0, 632.0, 1558.0, 4331.0, 16095.0, 78856.0, 452036.0, 404478.0, 68707.0, 14364.0, 3924.0, 1432.0, 657.0, 319.0, 148.0, 92.0, 54.0, 37.0, 16.0, 15.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.677734375, -0.6583480834960938, -0.6389617919921875, -0.6195755004882812, -0.600189208984375, -0.5808029174804688, -0.5614166259765625, -0.5420303344726562, -0.52264404296875, -0.5032577514648438, -0.4838714599609375, -0.46448516845703125, -0.445098876953125, -0.42571258544921875, -0.4063262939453125, -0.38694000244140625, -0.3675537109375, -0.34816741943359375, -0.3287811279296875, -0.30939483642578125, -0.290008544921875, -0.27062225341796875, -0.2512359619140625, -0.23184967041015625, -0.21246337890625, -0.19307708740234375, -0.1736907958984375, -0.15430450439453125, -0.134918212890625, -0.11553192138671875, -0.0961456298828125, -0.07675933837890625, -0.057373046875, -0.03798675537109375, -0.0186004638671875, 0.00078582763671875, 0.020172119140625, 0.03955841064453125, 0.0589447021484375, 0.07833099365234375, 0.09771728515625, 0.11710357666015625, 0.1364898681640625, 0.15587615966796875, 0.175262451171875, 0.19464874267578125, 0.2140350341796875, 0.23342132568359375, 0.2528076171875, 0.27219390869140625, 0.2915802001953125, 0.31096649169921875, 0.330352783203125, 0.34973907470703125, 0.3691253662109375, 0.38851165771484375, 0.40789794921875, 0.42728424072265625, 0.4466705322265625, 0.46605682373046875, 0.485443115234375, 0.5048294067382812, 0.5242156982421875, 0.5436019897460938, 0.56298828125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 6.0, 7.0, 4.0, 9.0, 15.0, 15.0, 27.0, 29.0, 28.0, 39.0, 70.0, 57.0, 67.0, 68.0, 70.0, 80.0, 81.0, 58.0, 51.0, 42.0, 42.0, 24.0, 25.0, 24.0, 11.0, 10.0, 12.0, 9.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4400596618652344, -0.42528533935546875, -0.4105110168457031, -0.3957366943359375, -0.3809623718261719, -0.36618804931640625, -0.3514137268066406, -0.336639404296875, -0.3218650817871094, -0.30709075927734375, -0.2923164367675781, -0.2775421142578125, -0.2627677917480469, -0.24799346923828125, -0.23321914672851562, -0.21844482421875, -0.20367050170898438, -0.18889617919921875, -0.17412185668945312, -0.1593475341796875, -0.14457321166992188, -0.12979888916015625, -0.11502456665039062, -0.100250244140625, -0.08547592163085938, -0.07070159912109375, -0.055927276611328125, -0.0411529541015625, -0.026378631591796875, -0.01160430908203125, 0.003170013427734375, 0.0179443359375, 0.032718658447265625, 0.04749298095703125, 0.062267303466796875, 0.0770416259765625, 0.09181594848632812, 0.10659027099609375, 0.12136459350585938, 0.136138916015625, 0.15091323852539062, 0.16568756103515625, 0.18046188354492188, 0.1952362060546875, 0.21001052856445312, 0.22478485107421875, 0.23955917358398438, 0.25433349609375, 0.2691078186035156, 0.28388214111328125, 0.2986564636230469, 0.3134307861328125, 0.3282051086425781, 0.34297943115234375, 0.3577537536621094, 0.372528076171875, 0.3873023986816406, 0.40207672119140625, 0.4168510437011719, 0.4316253662109375, 0.4463996887207031, 0.46117401123046875, 0.4759483337402344, 0.49072265625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 12.0, 17.0, 47.0, 148.0, 316.0, 281.0, 122.0, 46.0, 13.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.087081432342529, -5.400757789611816, -4.714433670043945, -4.028110027313232, -3.3417863845825195, -2.6554627418518066, -1.9691386222839355, -1.2828149795532227, -0.5964913368225098, 0.08983242511749268, 0.7761561870574951, 1.462480068206787, 2.1488037109375, 2.835127353668213, 3.521451473236084, 4.207775115966797, 4.89409875869751, 5.580422401428223, 6.266746520996094, 6.953070163726807, 7.6393938064575195, 8.32571792602539, 9.012041091918945, 9.698365211486816, 10.384689331054688, 11.071013450622559, 11.757336616516113, 12.443660736083984, 13.129983901977539, 13.81630802154541, 14.502632141113281, 15.188955307006836, 15.87527847290039, 16.561601638793945, 17.247926712036133, 17.934249877929688, 18.620573043823242, 19.306896209716797, 19.993221282958984, 20.67954444885254, 21.365867614746094, 22.05219078063965, 22.738515853881836, 23.42483901977539, 24.111162185668945, 24.7974853515625, 25.483810424804688, 26.170133590698242, 26.85645866394043, 27.542781829833984, 28.229106903076172, 28.915430068969727, 29.60175323486328, 30.28807830810547, 30.974401473999023, 31.660724639892578, 32.347049713134766, 33.03337478637695, 33.719696044921875, 34.40602111816406, 35.09234619140625, 35.77866744995117, 36.46499252319336, 37.15131759643555, 37.83763885498047]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 7.0, 3.0, 3.0, 7.0, 8.0, 13.0, 10.0, 20.0, 24.0, 31.0, 33.0, 48.0, 54.0, 54.0, 55.0, 50.0, 58.0, 57.0, 60.0, 56.0, 48.0, 43.0, 45.0, 32.0, 34.0, 39.0, 22.0, 24.0, 17.0, 14.0, 12.0, 5.0, 3.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.844799041748047, -11.413665771484375, -10.982531547546387, -10.551398277282715, -10.120264053344727, -9.689130783081055, -9.257997512817383, -8.826864242553711, -8.395730018615723, -7.964596271514893, -7.5334625244140625, -7.102329254150391, -6.6711955070495605, -6.2400617599487305, -5.808928489685059, -5.3777947425842285, -4.946660995483398, -4.515527248382568, -4.084393501281738, -3.6532602310180664, -3.2221264839172363, -2.7909927368164062, -2.3598592281341553, -1.9287257194519043, -1.4975919723510742, -1.0664583444595337, -0.6353247165679932, -0.20419108867645264, 0.2269425392150879, 0.658076286315918, 1.089209794998169, 1.52034330368042, 1.95147705078125, 2.38261079788208, 2.813744306564331, 3.244877815246582, 3.676011562347412, 4.107145309448242, 4.538278579711914, 4.969412326812744, 5.400546073913574, 5.831679821014404, 6.262813568115234, 6.693946838378906, 7.125080585479736, 7.556214332580566, 7.987347602844238, 8.418481826782227, 8.849615097045898, 9.28074836730957, 9.711882591247559, 10.14301586151123, 10.574150085449219, 11.00528335571289, 11.436416625976562, 11.867549896240234, 12.298684120178223, 12.729817390441895, 13.160951614379883, 13.592084884643555, 14.023218154907227, 14.454352378845215, 14.885485649108887, 15.316619873046875, 15.747753143310547]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 9.0, 20.0, 25.0, 23.0, 74.0, 112.0, 234.0, 601.0, 1918.0, 10458.0, 252827.0, 3896565.0, 25771.0, 3734.0, 1038.0, 416.0, 166.0, 102.0, 66.0, 39.0, 27.0, 12.0, 9.0, 4.0, 8.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.502227783203125, -2.40289306640625, -2.303558349609375, -2.2042236328125, -2.104888916015625, -2.00555419921875, -1.906219482421875, -1.806884765625, -1.707550048828125, -1.60821533203125, -1.508880615234375, -1.4095458984375, -1.310211181640625, -1.21087646484375, -1.111541748046875, -1.01220703125, -0.912872314453125, -0.81353759765625, -0.714202880859375, -0.6148681640625, -0.515533447265625, -0.41619873046875, -0.316864013671875, -0.217529296875, -0.118194580078125, -0.01885986328125, 0.080474853515625, 0.1798095703125, 0.279144287109375, 0.37847900390625, 0.477813720703125, 0.5771484375, 0.676483154296875, 0.77581787109375, 0.875152587890625, 0.9744873046875, 1.073822021484375, 1.17315673828125, 1.272491455078125, 1.371826171875, 1.471160888671875, 1.57049560546875, 1.669830322265625, 1.7691650390625, 1.868499755859375, 1.96783447265625, 2.067169189453125, 2.16650390625, 2.265838623046875, 2.36517333984375, 2.464508056640625, 2.5638427734375, 2.663177490234375, 2.76251220703125, 2.861846923828125, 2.961181640625, 3.060516357421875, 3.15985107421875, 3.259185791015625, 3.3585205078125, 3.457855224609375, 3.55718994140625, 3.656524658203125, 3.755859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 12.0, 12.0, 21.0, 26.0, 35.0, 63.0, 110.0, 120.0, 122.0, 131.0, 104.0, 76.0, 47.0, 43.0, 22.0, 26.0, 11.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.623046875, -0.5980758666992188, -0.5731048583984375, -0.5481338500976562, -0.523162841796875, -0.49819183349609375, -0.4732208251953125, -0.44824981689453125, -0.42327880859375, -0.39830780029296875, -0.3733367919921875, -0.34836578369140625, -0.323394775390625, -0.29842376708984375, -0.2734527587890625, -0.24848175048828125, -0.2235107421875, -0.19853973388671875, -0.1735687255859375, -0.14859771728515625, -0.123626708984375, -0.09865570068359375, -0.0736846923828125, -0.04871368408203125, -0.02374267578125, 0.00122833251953125, 0.0261993408203125, 0.05117034912109375, 0.076141357421875, 0.10111236572265625, 0.1260833740234375, 0.15105438232421875, 0.176025390625, 0.20099639892578125, 0.2259674072265625, 0.25093841552734375, 0.275909423828125, 0.30088043212890625, 0.3258514404296875, 0.35082244873046875, 0.37579345703125, 0.40076446533203125, 0.4257354736328125, 0.45070648193359375, 0.475677490234375, 0.5006484985351562, 0.5256195068359375, 0.5505905151367188, 0.5755615234375, 0.6005325317382812, 0.6255035400390625, 0.6504745483398438, 0.675445556640625, 0.7004165649414062, 0.7253875732421875, 0.7503585815429688, 0.77532958984375, 0.8003005981445312, 0.8252716064453125, 0.8502426147460938, 0.875213623046875, 0.9001846313476562, 0.9251556396484375, 0.9501266479492188, 0.97509765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 19.0, 9.0, 14.0, 32.0, 41.0, 45.0, 62.0, 103.0, 140.0, 303.0, 681.0, 2631.0, 15893.0, 356305.0, 3759709.0, 50309.0, 5851.0, 1314.0, 391.0, 155.0, 96.0, 62.0, 33.0, 26.0, 19.0, 19.0, 7.0, 6.0, 5.0, 3.0, 3.0], "bins": [-3.322265625, -3.251922607421875, -3.18157958984375, -3.111236572265625, -3.0408935546875, -2.970550537109375, -2.90020751953125, -2.829864501953125, -2.759521484375, -2.689178466796875, -2.61883544921875, -2.548492431640625, -2.4781494140625, -2.407806396484375, -2.33746337890625, -2.267120361328125, -2.19677734375, -2.126434326171875, -2.05609130859375, -1.985748291015625, -1.9154052734375, -1.845062255859375, -1.77471923828125, -1.704376220703125, -1.634033203125, -1.563690185546875, -1.49334716796875, -1.423004150390625, -1.3526611328125, -1.282318115234375, -1.21197509765625, -1.141632080078125, -1.0712890625, -1.000946044921875, -0.93060302734375, -0.860260009765625, -0.7899169921875, -0.719573974609375, -0.64923095703125, -0.578887939453125, -0.508544921875, -0.438201904296875, -0.36785888671875, -0.297515869140625, -0.2271728515625, -0.156829833984375, -0.08648681640625, -0.016143798828125, 0.05419921875, 0.124542236328125, 0.19488525390625, 0.265228271484375, 0.3355712890625, 0.405914306640625, 0.47625732421875, 0.546600341796875, 0.616943359375, 0.687286376953125, 0.75762939453125, 0.827972412109375, 0.8983154296875, 0.968658447265625, 1.03900146484375, 1.109344482421875, 1.1796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 17.0, 8.0, 30.0, 38.0, 80.0, 174.0, 535.0, 1974.0, 757.0, 212.0, 88.0, 48.0, 28.0, 20.0, 20.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.85693359375, -0.8381500244140625, -0.819366455078125, -0.8005828857421875, -0.78179931640625, -0.7630157470703125, -0.744232177734375, -0.7254486083984375, -0.7066650390625, -0.6878814697265625, -0.669097900390625, -0.6503143310546875, -0.63153076171875, -0.6127471923828125, -0.593963623046875, -0.5751800537109375, -0.556396484375, -0.5376129150390625, -0.518829345703125, -0.5000457763671875, -0.48126220703125, -0.4624786376953125, -0.443695068359375, -0.4249114990234375, -0.4061279296875, -0.3873443603515625, -0.368560791015625, -0.3497772216796875, -0.33099365234375, -0.3122100830078125, -0.293426513671875, -0.2746429443359375, -0.255859375, -0.2370758056640625, -0.218292236328125, -0.1995086669921875, -0.18072509765625, -0.1619415283203125, -0.143157958984375, -0.1243743896484375, -0.1055908203125, -0.0868072509765625, -0.068023681640625, -0.0492401123046875, -0.03045654296875, -0.0116729736328125, 0.007110595703125, 0.0258941650390625, 0.044677734375, 0.0634613037109375, 0.082244873046875, 0.1010284423828125, 0.11981201171875, 0.1385955810546875, 0.157379150390625, 0.1761627197265625, 0.1949462890625, 0.2137298583984375, 0.232513427734375, 0.2512969970703125, 0.27008056640625, 0.2888641357421875, 0.307647705078125, 0.3264312744140625, 0.34521484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 14.0, 58.0, 168.0, 255.0, 271.0, 160.0, 51.0, 16.0, 9.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.223796844482422, -4.0991315841674805, -3.974466562271118, -3.849801540374756, -3.7251362800598145, -3.600471258163452, -3.47580623626709, -3.3511409759521484, -3.226475715637207, -3.1018106937408447, -2.9771454334259033, -2.852480411529541, -2.7278151512145996, -2.6031501293182373, -2.478485107421875, -2.3538198471069336, -2.2291548252105713, -2.104489803314209, -1.9798245429992676, -1.8551595211029053, -1.7304942607879639, -1.6058292388916016, -1.4811640977859497, -1.3564989566802979, -1.231833815574646, -1.1071686744689941, -0.9825035333633423, -0.8578384518623352, -0.7331733107566833, -0.6085081696510315, -0.4838430881500244, -0.35917794704437256, -0.2345130443572998, -0.10984791815280914, 0.014817208051681519, 0.139482319355011, 0.26414746046066284, 0.3888126015663147, 0.5134776830673218, 0.6381428241729736, 0.7628079652786255, 0.8874731063842773, 1.0121382474899292, 1.136803388595581, 1.2614684104919434, 1.3861336708068848, 1.510798692703247, 1.635463833808899, 1.7601289749145508, 1.8847941160202026, 2.0094592571258545, 2.134124279022217, 2.258789539337158, 2.3834545612335205, 2.508119583129883, 2.632784843444824, 2.7574501037597656, 2.882115125656128, 3.0067803859710693, 3.1314454078674316, 3.256110668182373, 3.3807756900787354, 3.5054407119750977, 3.630105972290039, 3.7547709941864014]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 12.0, 11.0, 18.0, 26.0, 19.0, 23.0, 41.0, 42.0, 34.0, 55.0, 50.0, 65.0, 67.0, 64.0, 45.0, 60.0, 56.0, 33.0, 38.0, 33.0, 42.0, 25.0, 25.0, 23.0, 21.0, 14.0, 10.0, 13.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5798777341842651, -1.5281381607055664, -1.4763985872268677, -1.424659013748169, -1.3729193210601807, -1.3211798667907715, -1.2694401741027832, -1.2177006006240845, -1.1659610271453857, -1.114221453666687, -1.0624818801879883, -1.0107423067092896, -0.959002673625946, -0.9072631001472473, -0.8555234670639038, -0.8037838935852051, -0.7520443201065063, -0.7003047466278076, -0.6485651731491089, -0.5968255400657654, -0.5450859665870667, -0.4933463931083679, -0.4416067898273468, -0.3898671865463257, -0.33812761306762695, -0.2863880395889282, -0.2346484363079071, -0.18290884792804718, -0.13116925954818726, -0.07942968606948853, -0.027690082788467407, 0.02404952049255371, 0.07578909397125244, 0.12752868235111237, 0.1792682707309723, 0.23100785911083221, 0.28274744749069214, 0.33448702096939087, 0.386226624250412, 0.4379662275314331, 0.48970580101013184, 0.5414453744888306, 0.5931849479675293, 0.6449245810508728, 0.6966641545295715, 0.7484037280082703, 0.8001433610916138, 0.8518829345703125, 0.9036225080490112, 0.95536208152771, 1.0071016550064087, 1.0588412284851074, 1.1105809211730957, 1.1623203754425049, 1.2140600681304932, 1.265799641609192, 1.3175392150878906, 1.3692787885665894, 1.421018362045288, 1.4727579355239868, 1.5244975090026855, 1.5762372016906738, 1.6279767751693726, 1.6797163486480713, 1.73145592212677]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 12.0, 19.0, 24.0, 39.0, 63.0, 101.0, 187.0, 335.0, 729.0, 1493.0, 3966.0, 13604.0, 80158.0, 470417.0, 399254.0, 61236.0, 10870.0, 3260.0, 1337.0, 634.0, 335.0, 175.0, 108.0, 59.0, 40.0, 26.0, 18.0, 12.0, 8.0, 6.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.043426513671875, -1.97943115234375, -1.915435791015625, -1.8514404296875, -1.787445068359375, -1.72344970703125, -1.659454345703125, -1.595458984375, -1.531463623046875, -1.46746826171875, -1.403472900390625, -1.3394775390625, -1.275482177734375, -1.21148681640625, -1.147491455078125, -1.08349609375, -1.019500732421875, -0.95550537109375, -0.891510009765625, -0.8275146484375, -0.763519287109375, -0.69952392578125, -0.635528564453125, -0.571533203125, -0.507537841796875, -0.44354248046875, -0.379547119140625, -0.3155517578125, -0.251556396484375, -0.18756103515625, -0.123565673828125, -0.0595703125, 0.004425048828125, 0.06842041015625, 0.132415771484375, 0.1964111328125, 0.260406494140625, 0.32440185546875, 0.388397216796875, 0.452392578125, 0.516387939453125, 0.58038330078125, 0.644378662109375, 0.7083740234375, 0.772369384765625, 0.83636474609375, 0.900360107421875, 0.96435546875, 1.028350830078125, 1.09234619140625, 1.156341552734375, 1.2203369140625, 1.284332275390625, 1.34832763671875, 1.412322998046875, 1.476318359375, 1.540313720703125, 1.60430908203125, 1.668304443359375, 1.7322998046875, 1.796295166015625, 1.86029052734375, 1.924285888671875, 1.98828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 15.0, 15.0, 27.0, 27.0, 63.0, 113.0, 94.0, 127.0, 137.0, 109.0, 87.0, 48.0, 45.0, 31.0, 20.0, 14.0, 10.0, 8.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62841796875, -0.6034774780273438, -0.5785369873046875, -0.5535964965820312, -0.528656005859375, -0.5037155151367188, -0.4787750244140625, -0.45383453369140625, -0.42889404296875, -0.40395355224609375, -0.3790130615234375, -0.35407257080078125, -0.329132080078125, -0.30419158935546875, -0.2792510986328125, -0.25431060791015625, -0.2293701171875, -0.20442962646484375, -0.1794891357421875, -0.15454864501953125, -0.129608154296875, -0.10466766357421875, -0.0797271728515625, -0.05478668212890625, -0.02984619140625, -0.00490570068359375, 0.0200347900390625, 0.04497528076171875, 0.069915771484375, 0.09485626220703125, 0.1197967529296875, 0.14473724365234375, 0.169677734375, 0.19461822509765625, 0.2195587158203125, 0.24449920654296875, 0.269439697265625, 0.29438018798828125, 0.3193206787109375, 0.34426116943359375, 0.36920166015625, 0.39414215087890625, 0.4190826416015625, 0.44402313232421875, 0.468963623046875, 0.49390411376953125, 0.5188446044921875, 0.5437850952148438, 0.5687255859375, 0.5936660766601562, 0.6186065673828125, 0.6435470581054688, 0.668487548828125, 0.6934280395507812, 0.7183685302734375, 0.7433090209960938, 0.76824951171875, 0.7931900024414062, 0.8181304931640625, 0.8430709838867188, 0.868011474609375, 0.8929519653320312, 0.9178924560546875, 0.9428329467773438, 0.9677734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 1.0, 8.0, 14.0, 18.0, 23.0, 32.0, 47.0, 52.0, 114.0, 173.0, 286.0, 487.0, 993.0, 2408.0, 8338.0, 38996.0, 209694.0, 510200.0, 221415.0, 41741.0, 8641.0, 2516.0, 983.0, 496.0, 285.0, 190.0, 115.0, 83.0, 64.0, 48.0, 34.0, 21.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4539031982421875, -1.402923583984375, -1.3519439697265625, -1.30096435546875, -1.2499847412109375, -1.199005126953125, -1.1480255126953125, -1.0970458984375, -1.0460662841796875, -0.995086669921875, -0.9441070556640625, -0.89312744140625, -0.8421478271484375, -0.791168212890625, -0.7401885986328125, -0.689208984375, -0.6382293701171875, -0.587249755859375, -0.5362701416015625, -0.48529052734375, -0.4343109130859375, -0.383331298828125, -0.3323516845703125, -0.2813720703125, -0.2303924560546875, -0.179412841796875, -0.1284332275390625, -0.07745361328125, -0.0264739990234375, 0.024505615234375, 0.0754852294921875, 0.12646484375, 0.1774444580078125, 0.228424072265625, 0.2794036865234375, 0.33038330078125, 0.3813629150390625, 0.432342529296875, 0.4833221435546875, 0.5343017578125, 0.5852813720703125, 0.636260986328125, 0.6872406005859375, 0.73822021484375, 0.7891998291015625, 0.840179443359375, 0.8911590576171875, 0.942138671875, 0.9931182861328125, 1.044097900390625, 1.0950775146484375, 1.14605712890625, 1.1970367431640625, 1.248016357421875, 1.2989959716796875, 1.3499755859375, 1.4009552001953125, 1.451934814453125, 1.5029144287109375, 1.55389404296875, 1.6048736572265625, 1.655853271484375, 1.7068328857421875, 1.7578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 5.0, 13.0, 9.0, 18.0, 11.0, 17.0, 19.0, 23.0, 19.0, 22.0, 20.0, 40.0, 52.0, 29.0, 42.0, 32.0, 38.0, 55.0, 41.0, 34.0, 40.0, 43.0, 37.0, 33.0, 26.0, 38.0, 34.0, 27.0, 17.0, 27.0, 21.0, 9.0, 12.0, 15.0, 11.0, 10.0, 7.0, 4.0, 6.0, 7.0, 5.0, 7.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.45623779296875, -1.4085693359375, -1.36090087890625, -1.313232421875, -1.26556396484375, -1.2178955078125, -1.17022705078125, -1.12255859375, -1.07489013671875, -1.0272216796875, -0.97955322265625, -0.931884765625, -0.88421630859375, -0.8365478515625, -0.78887939453125, -0.7412109375, -0.69354248046875, -0.6458740234375, -0.59820556640625, -0.550537109375, -0.50286865234375, -0.4552001953125, -0.40753173828125, -0.35986328125, -0.31219482421875, -0.2645263671875, -0.21685791015625, -0.169189453125, -0.12152099609375, -0.0738525390625, -0.02618408203125, 0.021484375, 0.06915283203125, 0.1168212890625, 0.16448974609375, 0.212158203125, 0.25982666015625, 0.3074951171875, 0.35516357421875, 0.40283203125, 0.45050048828125, 0.4981689453125, 0.54583740234375, 0.593505859375, 0.64117431640625, 0.6888427734375, 0.73651123046875, 0.7841796875, 0.83184814453125, 0.8795166015625, 0.92718505859375, 0.974853515625, 1.02252197265625, 1.0701904296875, 1.11785888671875, 1.16552734375, 1.21319580078125, 1.2608642578125, 1.30853271484375, 1.356201171875, 1.40386962890625, 1.4515380859375, 1.49920654296875, 1.546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 3.0, 4.0, 12.0, 4.0, 13.0, 10.0, 20.0, 24.0, 41.0, 56.0, 97.0, 216.0, 441.0, 1038.0, 3003.0, 11864.0, 73963.0, 485313.0, 402422.0, 56110.0, 9603.0, 2534.0, 893.0, 380.0, 189.0, 111.0, 48.0, 39.0, 25.0, 11.0, 13.0, 9.0, 10.0, 9.0, 3.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.544921875, -0.5288619995117188, -0.5128021240234375, -0.49674224853515625, -0.480682373046875, -0.46462249755859375, -0.4485626220703125, -0.43250274658203125, -0.41644287109375, -0.40038299560546875, -0.3843231201171875, -0.36826324462890625, -0.352203369140625, -0.33614349365234375, -0.3200836181640625, -0.30402374267578125, -0.2879638671875, -0.27190399169921875, -0.2558441162109375, -0.23978424072265625, -0.223724365234375, -0.20766448974609375, -0.1916046142578125, -0.17554473876953125, -0.15948486328125, -0.14342498779296875, -0.1273651123046875, -0.11130523681640625, -0.095245361328125, -0.07918548583984375, -0.0631256103515625, -0.04706573486328125, -0.031005859375, -0.01494598388671875, 0.0011138916015625, 0.01717376708984375, 0.033233642578125, 0.04929351806640625, 0.0653533935546875, 0.08141326904296875, 0.09747314453125, 0.11353302001953125, 0.1295928955078125, 0.14565277099609375, 0.161712646484375, 0.17777252197265625, 0.1938323974609375, 0.20989227294921875, 0.2259521484375, 0.24201202392578125, 0.2580718994140625, 0.27413177490234375, 0.290191650390625, 0.30625152587890625, 0.3223114013671875, 0.33837127685546875, 0.35443115234375, 0.37049102783203125, 0.3865509033203125, 0.40261077880859375, 0.418670654296875, 0.43473052978515625, 0.4507904052734375, 0.46685028076171875, 0.48291015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 6.0, 8.0, 10.0, 14.0, 16.0, 18.0, 22.0, 23.0, 30.0, 45.0, 56.0, 72.0, 81.0, 86.0, 90.0, 92.0, 71.0, 53.0, 35.0, 34.0, 23.0, 15.0, 14.0, 12.0, 11.0, 16.0, 6.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.088350296020508e-05, -7.79908150434494e-05, -7.509812712669373e-05, -7.220543920993805e-05, -6.931275129318237e-05, -6.64200633764267e-05, -6.352737545967102e-05, -6.0634687542915344e-05, -5.774199962615967e-05, -5.484931170940399e-05, -5.1956623792648315e-05, -4.906393587589264e-05, -4.617124795913696e-05, -4.327856004238129e-05, -4.038587212562561e-05, -3.7493184208869934e-05, -3.460049629211426e-05, -3.170780837535858e-05, -2.8815120458602905e-05, -2.592243254184723e-05, -2.3029744625091553e-05, -2.0137056708335876e-05, -1.72443687915802e-05, -1.4351680874824524e-05, -1.1458992958068848e-05, -8.566305041313171e-06, -5.673617124557495e-06, -2.780929207801819e-06, 1.1175870895385742e-07, 3.0044466257095337e-06, 5.89713454246521e-06, 8.789822459220886e-06, 1.1682510375976562e-05, 1.4575198292732239e-05, 1.7467886209487915e-05, 2.036057412624359e-05, 2.3253262042999268e-05, 2.6145949959754944e-05, 2.903863787651062e-05, 3.1931325793266296e-05, 3.482401371002197e-05, 3.771670162677765e-05, 4.0609389543533325e-05, 4.3502077460289e-05, 4.639476537704468e-05, 4.9287453293800354e-05, 5.218014121055603e-05, 5.5072829127311707e-05, 5.796551704406738e-05, 6.085820496082306e-05, 6.375089287757874e-05, 6.664358079433441e-05, 6.953626871109009e-05, 7.242895662784576e-05, 7.532164454460144e-05, 7.821433246135712e-05, 8.110702037811279e-05, 8.399970829486847e-05, 8.689239621162415e-05, 8.978508412837982e-05, 9.26777720451355e-05, 9.557045996189117e-05, 9.846314787864685e-05, 0.00010135583579540253, 0.0001042485237121582]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 9.0, 6.0, 12.0, 16.0, 22.0, 48.0, 77.0, 92.0, 167.0, 345.0, 694.0, 1585.0, 4336.0, 14479.0, 73404.0, 451359.0, 415560.0, 65795.0, 13475.0, 4076.0, 1519.0, 676.0, 357.0, 175.0, 93.0, 53.0, 43.0, 28.0, 14.0, 13.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.51025390625, -0.494293212890625, -0.47833251953125, -0.462371826171875, -0.4464111328125, -0.430450439453125, -0.41448974609375, -0.398529052734375, -0.382568359375, -0.366607666015625, -0.35064697265625, -0.334686279296875, -0.3187255859375, -0.302764892578125, -0.28680419921875, -0.270843505859375, -0.2548828125, -0.238922119140625, -0.22296142578125, -0.207000732421875, -0.1910400390625, -0.175079345703125, -0.15911865234375, -0.143157958984375, -0.127197265625, -0.111236572265625, -0.09527587890625, -0.079315185546875, -0.0633544921875, -0.047393798828125, -0.03143310546875, -0.015472412109375, 0.00048828125, 0.016448974609375, 0.03240966796875, 0.048370361328125, 0.0643310546875, 0.080291748046875, 0.09625244140625, 0.112213134765625, 0.128173828125, 0.144134521484375, 0.16009521484375, 0.176055908203125, 0.1920166015625, 0.207977294921875, 0.22393798828125, 0.239898681640625, 0.255859375, 0.271820068359375, 0.28778076171875, 0.303741455078125, 0.3197021484375, 0.335662841796875, 0.35162353515625, 0.367584228515625, 0.383544921875, 0.399505615234375, 0.41546630859375, 0.431427001953125, 0.4473876953125, 0.463348388671875, 0.47930908203125, 0.495269775390625, 0.51123046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 4.0, 4.0, 5.0, 12.0, 10.0, 11.0, 24.0, 21.0, 17.0, 29.0, 44.0, 39.0, 61.0, 72.0, 68.0, 67.0, 79.0, 72.0, 60.0, 44.0, 37.0, 42.0, 41.0, 27.0, 19.0, 18.0, 20.0, 7.0, 11.0, 8.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.396484375, -0.38440704345703125, -0.3723297119140625, -0.36025238037109375, -0.348175048828125, -0.33609771728515625, -0.3240203857421875, -0.31194305419921875, -0.29986572265625, -0.28778839111328125, -0.2757110595703125, -0.26363372802734375, -0.251556396484375, -0.23947906494140625, -0.2274017333984375, -0.21532440185546875, -0.2032470703125, -0.19116973876953125, -0.1790924072265625, -0.16701507568359375, -0.154937744140625, -0.14286041259765625, -0.1307830810546875, -0.11870574951171875, -0.10662841796875, -0.09455108642578125, -0.0824737548828125, -0.07039642333984375, -0.058319091796875, -0.04624176025390625, -0.0341644287109375, -0.02208709716796875, -0.010009765625, 0.00206756591796875, 0.0141448974609375, 0.02622222900390625, 0.038299560546875, 0.05037689208984375, 0.0624542236328125, 0.07453155517578125, 0.08660888671875, 0.09868621826171875, 0.1107635498046875, 0.12284088134765625, 0.134918212890625, 0.14699554443359375, 0.1590728759765625, 0.17115020751953125, 0.1832275390625, 0.19530487060546875, 0.2073822021484375, 0.21945953369140625, 0.231536865234375, 0.24361419677734375, 0.2556915283203125, 0.26776885986328125, 0.27984619140625, 0.29192352294921875, 0.3040008544921875, 0.31607818603515625, 0.328155517578125, 0.34023284912109375, 0.3523101806640625, 0.36438751220703125, 0.37646484375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 15.0, 30.0, 62.0, 161.0, 217.0, 257.0, 140.0, 59.0, 35.0, 11.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0767645835876465, -5.570794105529785, -5.064823150634766, -4.558852672576904, -4.052882194519043, -3.5469117164611816, -3.040940999984741, -2.534970283508301, -2.0289998054504395, -1.5230292081832886, -1.0170586109161377, -0.5110880136489868, -0.0051174163818359375, 0.5008530616760254, 1.0068237781524658, 1.5127944946289062, 2.0187649726867676, 2.524735450744629, 3.0307061672210693, 3.5366768836975098, 4.042647361755371, 4.548617839813232, 5.054588317871094, 5.560559272766113, 6.066529750823975, 6.572500228881836, 7.0784711837768555, 7.584441661834717, 8.090412139892578, 8.596382141113281, 9.1023530960083, 9.60832405090332, 10.114295959472656, 10.620266914367676, 11.126236915588379, 11.632207870483398, 12.138177871704102, 12.644148826599121, 13.15011978149414, 13.656089782714844, 14.162060737609863, 14.668031692504883, 15.174001693725586, 15.679972648620605, 16.185943603515625, 16.691913604736328, 17.19788360595703, 17.703855514526367, 18.20982551574707, 18.715795516967773, 19.22176742553711, 19.727737426757812, 20.233707427978516, 20.73967742919922, 21.245649337768555, 21.751619338989258, 22.257591247558594, 22.763561248779297, 23.269533157348633, 23.775503158569336, 24.28147315979004, 24.787445068359375, 25.293415069580078, 25.79938507080078, 26.305355072021484]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 6.0, 9.0, 10.0, 15.0, 18.0, 28.0, 22.0, 33.0, 30.0, 46.0, 53.0, 55.0, 65.0, 44.0, 54.0, 58.0, 54.0, 48.0, 50.0, 37.0, 44.0, 35.0, 29.0, 27.0, 31.0, 22.0, 13.0, 16.0, 5.0, 11.0, 6.0, 7.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.890177726745605, -11.531302452087402, -11.1724271774292, -10.81355094909668, -10.454675674438477, -10.095800399780273, -9.73692512512207, -9.378049850463867, -9.019173622131348, -8.660298347473145, -8.301423072814941, -7.94254732131958, -7.583671569824219, -7.224796295166016, -6.8659210205078125, -6.507045269012451, -6.148169994354248, -5.789294719696045, -5.430418968200684, -5.0715436935424805, -4.712667942047119, -4.353792667388916, -3.994917154312134, -3.6360416412353516, -3.2771661281585693, -2.918290615081787, -2.559415102005005, -2.2005395889282227, -1.84166419506073, -1.4827886819839478, -1.123913288116455, -0.7650377750396729, -0.4061622619628906, -0.047286778688430786, 0.31158870458602905, 0.6704641580581665, 1.0293396711349487, 1.388215184211731, 1.7470905780792236, 2.105966091156006, 2.464841604232788, 2.8237171173095703, 3.1825926303863525, 3.5414681434631348, 3.900343418121338, 4.259219169616699, 4.618094444274902, 4.9769697189331055, 5.335845470428467, 5.69472074508667, 6.053596496582031, 6.412471771240234, 6.771347522735596, 7.130222797393799, 7.48909854888916, 7.847973823547363, 8.206849098205566, 8.56572437286377, 8.924599647521973, 9.283475875854492, 9.642351150512695, 10.001226425170898, 10.360101699829102, 10.718976974487305, 11.077853202819824]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 11.0, 11.0, 18.0, 28.0, 31.0, 49.0, 79.0, 143.0, 271.0, 576.0, 1369.0, 3919.0, 21833.0, 758883.0, 3363800.0, 33866.0, 5817.0, 1820.0, 803.0, 399.0, 224.0, 103.0, 75.0, 42.0, 31.0, 25.0, 17.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.521484375, -2.431732177734375, -2.34197998046875, -2.252227783203125, -2.1624755859375, -2.072723388671875, -1.98297119140625, -1.893218994140625, -1.803466796875, -1.713714599609375, -1.62396240234375, -1.534210205078125, -1.4444580078125, -1.354705810546875, -1.26495361328125, -1.175201416015625, -1.08544921875, -0.995697021484375, -0.90594482421875, -0.816192626953125, -0.7264404296875, -0.636688232421875, -0.54693603515625, -0.457183837890625, -0.367431640625, -0.277679443359375, -0.18792724609375, -0.098175048828125, -0.0084228515625, 0.081329345703125, 0.17108154296875, 0.260833740234375, 0.3505859375, 0.440338134765625, 0.53009033203125, 0.619842529296875, 0.7095947265625, 0.799346923828125, 0.88909912109375, 0.978851318359375, 1.068603515625, 1.158355712890625, 1.24810791015625, 1.337860107421875, 1.4276123046875, 1.517364501953125, 1.60711669921875, 1.696868896484375, 1.78662109375, 1.876373291015625, 1.96612548828125, 2.055877685546875, 2.1456298828125, 2.235382080078125, 2.32513427734375, 2.414886474609375, 2.504638671875, 2.594390869140625, 2.68414306640625, 2.773895263671875, 2.8636474609375, 2.953399658203125, 3.04315185546875, 3.132904052734375, 3.22265625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 3.0, 4.0, 8.0, 18.0, 17.0, 26.0, 56.0, 65.0, 83.0, 107.0, 142.0, 109.0, 111.0, 69.0, 63.0, 41.0, 26.0, 27.0, 9.0, 9.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6154556274414062, -0.5897979736328125, -0.5641403198242188, -0.538482666015625, -0.5128250122070312, -0.4871673583984375, -0.46150970458984375, -0.43585205078125, -0.41019439697265625, -0.3845367431640625, -0.35887908935546875, -0.333221435546875, -0.30756378173828125, -0.2819061279296875, -0.25624847412109375, -0.2305908203125, -0.20493316650390625, -0.1792755126953125, -0.15361785888671875, -0.127960205078125, -0.10230255126953125, -0.0766448974609375, -0.05098724365234375, -0.02532958984375, 0.00032806396484375, 0.0259857177734375, 0.05164337158203125, 0.077301025390625, 0.10295867919921875, 0.1286163330078125, 0.15427398681640625, 0.179931640625, 0.20558929443359375, 0.2312469482421875, 0.25690460205078125, 0.282562255859375, 0.30821990966796875, 0.3338775634765625, 0.35953521728515625, 0.38519287109375, 0.41085052490234375, 0.4365081787109375, 0.46216583251953125, 0.487823486328125, 0.5134811401367188, 0.5391387939453125, 0.5647964477539062, 0.5904541015625, 0.6161117553710938, 0.6417694091796875, 0.6674270629882812, 0.693084716796875, 0.7187423706054688, 0.7444000244140625, 0.7700576782226562, 0.79571533203125, 0.8213729858398438, 0.8470306396484375, 0.8726882934570312, 0.898345947265625, 0.9240036010742188, 0.9496612548828125, 0.9753189086914062, 1.0009765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 15.0, 30.0, 30.0, 54.0, 107.0, 253.0, 487.0, 1128.0, 3176.0, 13889.0, 597683.0, 3547570.0, 23573.0, 3945.0, 1265.0, 522.0, 261.0, 128.0, 61.0, 42.0, 22.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357421875, -3.259033203125, -3.16064453125, -3.062255859375, -2.9638671875, -2.865478515625, -2.76708984375, -2.668701171875, -2.5703125, -2.471923828125, -2.37353515625, -2.275146484375, -2.1767578125, -2.078369140625, -1.97998046875, -1.881591796875, -1.783203125, -1.684814453125, -1.58642578125, -1.488037109375, -1.3896484375, -1.291259765625, -1.19287109375, -1.094482421875, -0.99609375, -0.897705078125, -0.79931640625, -0.700927734375, -0.6025390625, -0.504150390625, -0.40576171875, -0.307373046875, -0.208984375, -0.110595703125, -0.01220703125, 0.086181640625, 0.1845703125, 0.282958984375, 0.38134765625, 0.479736328125, 0.578125, 0.676513671875, 0.77490234375, 0.873291015625, 0.9716796875, 1.070068359375, 1.16845703125, 1.266845703125, 1.365234375, 1.463623046875, 1.56201171875, 1.660400390625, 1.7587890625, 1.857177734375, 1.95556640625, 2.053955078125, 2.15234375, 2.250732421875, 2.34912109375, 2.447509765625, 2.5458984375, 2.644287109375, 2.74267578125, 2.841064453125, 2.939453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 7.0, 10.0, 7.0, 10.0, 25.0, 38.0, 99.0, 276.0, 1398.0, 1672.0, 332.0, 98.0, 51.0, 18.0, 13.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4208984375, -1.3778839111328125, -1.334869384765625, -1.2918548583984375, -1.24884033203125, -1.2058258056640625, -1.162811279296875, -1.1197967529296875, -1.0767822265625, -1.0337677001953125, -0.990753173828125, -0.9477386474609375, -0.90472412109375, -0.8617095947265625, -0.818695068359375, -0.7756805419921875, -0.732666015625, -0.6896514892578125, -0.646636962890625, -0.6036224365234375, -0.56060791015625, -0.5175933837890625, -0.474578857421875, -0.4315643310546875, -0.3885498046875, -0.3455352783203125, -0.302520751953125, -0.2595062255859375, -0.21649169921875, -0.1734771728515625, -0.130462646484375, -0.0874481201171875, -0.04443359375, -0.0014190673828125, 0.041595458984375, 0.0846099853515625, 0.12762451171875, 0.1706390380859375, 0.213653564453125, 0.2566680908203125, 0.2996826171875, 0.3426971435546875, 0.385711669921875, 0.4287261962890625, 0.47174072265625, 0.5147552490234375, 0.557769775390625, 0.6007843017578125, 0.643798828125, 0.6868133544921875, 0.729827880859375, 0.7728424072265625, 0.81585693359375, 0.8588714599609375, 0.901885986328125, 0.9449005126953125, 0.9879150390625, 1.0309295654296875, 1.073944091796875, 1.1169586181640625, 1.15997314453125, 1.2029876708984375, 1.246002197265625, 1.2890167236328125, 1.33203125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 12.0, 53.0, 157.0, 326.0, 267.0, 108.0, 39.0, 10.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.99445915222168, -9.755186080932617, -9.515913963317871, -9.276640892028809, -9.037368774414062, -8.798095703125, -8.558823585510254, -8.319550514221191, -8.080278396606445, -7.841005802154541, -7.601733207702637, -7.362460613250732, -7.123188018798828, -6.883915424346924, -6.6446428298950195, -6.405370235443115, -6.166097640991211, -5.926825046539307, -5.687552452087402, -5.448279857635498, -5.209007263183594, -4.9697346687316895, -4.730462074279785, -4.491189479827881, -4.251916408538818, -4.012643814086914, -3.7733712196350098, -3.5340986251831055, -3.294826030731201, -3.055553436279297, -2.8162808418273926, -2.5770082473754883, -2.337735652923584, -2.0984630584716797, -1.8591904640197754, -1.619917869567871, -1.3806452751159668, -1.141372561454773, -0.9020999670028687, -0.6628273725509644, -0.42355477809906006, -0.18428216874599457, 0.05499044060707092, 0.2942630648612976, 0.5335356593132019, 0.772808313369751, 1.0120809078216553, 1.2513535022735596, 1.4906260967254639, 1.7298986911773682, 1.9691712856292725, 2.2084438800811768, 2.447716474533081, 2.6869893074035645, 2.9262619018554688, 3.165534496307373, 3.4048070907592773, 3.6440796852111816, 3.883352279663086, 4.12262487411499, 4.3618974685668945, 4.601170063018799, 4.840442657470703, 5.079715251922607, 5.318987846374512]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 8.0, 4.0, 16.0, 9.0, 20.0, 23.0, 37.0, 36.0, 51.0, 52.0, 69.0, 88.0, 59.0, 68.0, 70.0, 60.0, 67.0, 57.0, 62.0, 31.0, 26.0, 20.0, 19.0, 9.0, 10.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.001364707946777, -3.878387928009033, -3.755411148071289, -3.632434368133545, -3.50945782661438, -3.3864810466766357, -3.2635042667388916, -3.1405274868011475, -3.0175509452819824, -2.8945741653442383, -2.771597385406494, -2.64862060546875, -2.525644063949585, -2.402667284011841, -2.2796905040740967, -2.1567137241363525, -2.0337369441986084, -1.9107601642608643, -1.7877835035324097, -1.6648067235946655, -1.541830062866211, -1.4188532829284668, -1.2958765029907227, -1.1728997230529785, -1.049923062324524, -0.9269463419914246, -0.8039696216583252, -0.680992841720581, -0.5580161213874817, -0.4350394010543823, -0.3120626211166382, -0.18908590078353882, -0.06610918045043945, 0.056867554783821106, 0.17984429001808167, 0.3028210401535034, 0.4257977604866028, 0.5487744808197021, 0.6717512607574463, 0.7947279810905457, 0.917704701423645, 1.0406814813613892, 1.1636581420898438, 1.286634922027588, 1.409611701965332, 1.5325883626937866, 1.6555651426315308, 1.7785418033599854, 1.9015185832977295, 2.0244953632354736, 2.1474721431732178, 2.270448684692383, 2.393425464630127, 2.516402244567871, 2.6393790245056152, 2.7623558044433594, 2.8853325843811035, 3.0083093643188477, 3.131286144256592, 3.254262924194336, 3.377239465713501, 3.500216245651245, 3.6231930255889893, 3.7461698055267334, 3.8691463470458984]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 1.0, 10.0, 13.0, 19.0, 25.0, 35.0, 68.0, 108.0, 170.0, 341.0, 576.0, 1387.0, 2984.0, 8159.0, 36574.0, 256944.0, 577487.0, 133128.0, 20445.0, 5510.0, 2323.0, 1009.0, 527.0, 276.0, 173.0, 85.0, 55.0, 42.0, 25.0, 19.0, 15.0, 8.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.96875, -1.899261474609375, -1.82977294921875, -1.760284423828125, -1.6907958984375, -1.621307373046875, -1.55181884765625, -1.482330322265625, -1.412841796875, -1.343353271484375, -1.27386474609375, -1.204376220703125, -1.1348876953125, -1.065399169921875, -0.99591064453125, -0.926422119140625, -0.85693359375, -0.787445068359375, -0.71795654296875, -0.648468017578125, -0.5789794921875, -0.509490966796875, -0.44000244140625, -0.370513916015625, -0.301025390625, -0.231536865234375, -0.16204833984375, -0.092559814453125, -0.0230712890625, 0.046417236328125, 0.11590576171875, 0.185394287109375, 0.2548828125, 0.324371337890625, 0.39385986328125, 0.463348388671875, 0.5328369140625, 0.602325439453125, 0.67181396484375, 0.741302490234375, 0.810791015625, 0.880279541015625, 0.94976806640625, 1.019256591796875, 1.0887451171875, 1.158233642578125, 1.22772216796875, 1.297210693359375, 1.36669921875, 1.436187744140625, 1.50567626953125, 1.575164794921875, 1.6446533203125, 1.714141845703125, 1.78363037109375, 1.853118896484375, 1.922607421875, 1.992095947265625, 2.06158447265625, 2.131072998046875, 2.2005615234375, 2.270050048828125, 2.33953857421875, 2.409027099609375, 2.478515625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 5.0, 2.0, 13.0, 17.0, 19.0, 52.0, 57.0, 88.0, 112.0, 99.0, 138.0, 101.0, 97.0, 55.0, 55.0, 26.0, 28.0, 13.0, 5.0, 5.0, 2.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65869140625, -0.6336669921875, -0.608642578125, -0.5836181640625, -0.55859375, -0.5335693359375, -0.508544921875, -0.4835205078125, -0.45849609375, -0.4334716796875, -0.408447265625, -0.3834228515625, -0.3583984375, -0.3333740234375, -0.308349609375, -0.2833251953125, -0.25830078125, -0.2332763671875, -0.208251953125, -0.1832275390625, -0.158203125, -0.1331787109375, -0.108154296875, -0.0831298828125, -0.05810546875, -0.0330810546875, -0.008056640625, 0.0169677734375, 0.0419921875, 0.0670166015625, 0.092041015625, 0.1170654296875, 0.14208984375, 0.1671142578125, 0.192138671875, 0.2171630859375, 0.2421875, 0.2672119140625, 0.292236328125, 0.3172607421875, 0.34228515625, 0.3673095703125, 0.392333984375, 0.4173583984375, 0.4423828125, 0.4674072265625, 0.492431640625, 0.5174560546875, 0.54248046875, 0.5675048828125, 0.592529296875, 0.6175537109375, 0.642578125, 0.6676025390625, 0.692626953125, 0.7176513671875, 0.74267578125, 0.7677001953125, 0.792724609375, 0.8177490234375, 0.8427734375, 0.8677978515625, 0.892822265625, 0.9178466796875, 0.94287109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 9.0, 10.0, 19.0, 21.0, 22.0, 35.0, 36.0, 51.0, 80.0, 136.0, 235.0, 352.0, 654.0, 1483.0, 3427.0, 9901.0, 35116.0, 138596.0, 375679.0, 334000.0, 107867.0, 27368.0, 7912.0, 2827.0, 1164.0, 591.0, 315.0, 188.0, 119.0, 95.0, 54.0, 40.0, 41.0, 26.0, 23.0, 13.0, 11.0, 9.0, 3.0, 12.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.0860137939453125, -1.044097900390625, -1.0021820068359375, -0.96026611328125, -0.9183502197265625, -0.876434326171875, -0.8345184326171875, -0.7926025390625, -0.7506866455078125, -0.708770751953125, -0.6668548583984375, -0.62493896484375, -0.5830230712890625, -0.541107177734375, -0.4991912841796875, -0.457275390625, -0.4153594970703125, -0.373443603515625, -0.3315277099609375, -0.28961181640625, -0.2476959228515625, -0.205780029296875, -0.1638641357421875, -0.1219482421875, -0.0800323486328125, -0.038116455078125, 0.0037994384765625, 0.04571533203125, 0.0876312255859375, 0.129547119140625, 0.1714630126953125, 0.21337890625, 0.2552947998046875, 0.297210693359375, 0.3391265869140625, 0.38104248046875, 0.4229583740234375, 0.464874267578125, 0.5067901611328125, 0.5487060546875, 0.5906219482421875, 0.632537841796875, 0.6744537353515625, 0.71636962890625, 0.7582855224609375, 0.800201416015625, 0.8421173095703125, 0.884033203125, 0.9259490966796875, 0.967864990234375, 1.0097808837890625, 1.05169677734375, 1.0936126708984375, 1.135528564453125, 1.1774444580078125, 1.2193603515625, 1.2612762451171875, 1.303192138671875, 1.3451080322265625, 1.38702392578125, 1.4289398193359375, 1.470855712890625, 1.5127716064453125, 1.5546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 8.0, 5.0, 6.0, 7.0, 8.0, 15.0, 8.0, 14.0, 13.0, 29.0, 18.0, 24.0, 29.0, 22.0, 34.0, 42.0, 37.0, 45.0, 39.0, 46.0, 57.0, 51.0, 50.0, 34.0, 37.0, 50.0, 46.0, 30.0, 29.0, 23.0, 26.0, 24.0, 13.0, 20.0, 8.0, 9.0, 9.0, 7.0, 8.0, 3.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.626953125, -1.5720977783203125, -1.517242431640625, -1.4623870849609375, -1.40753173828125, -1.3526763916015625, -1.297821044921875, -1.2429656982421875, -1.1881103515625, -1.1332550048828125, -1.078399658203125, -1.0235443115234375, -0.96868896484375, -0.9138336181640625, -0.858978271484375, -0.8041229248046875, -0.749267578125, -0.6944122314453125, -0.639556884765625, -0.5847015380859375, -0.52984619140625, -0.4749908447265625, -0.420135498046875, -0.3652801513671875, -0.3104248046875, -0.2555694580078125, -0.200714111328125, -0.1458587646484375, -0.09100341796875, -0.0361480712890625, 0.018707275390625, 0.0735626220703125, 0.12841796875, 0.1832733154296875, 0.238128662109375, 0.2929840087890625, 0.34783935546875, 0.4026947021484375, 0.457550048828125, 0.5124053955078125, 0.5672607421875, 0.6221160888671875, 0.676971435546875, 0.7318267822265625, 0.78668212890625, 0.8415374755859375, 0.896392822265625, 0.9512481689453125, 1.006103515625, 1.0609588623046875, 1.115814208984375, 1.1706695556640625, 1.22552490234375, 1.2803802490234375, 1.335235595703125, 1.3900909423828125, 1.4449462890625, 1.4998016357421875, 1.554656982421875, 1.6095123291015625, 1.66436767578125, 1.7192230224609375, 1.774078369140625, 1.8289337158203125, 1.8837890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 8.0, 11.0, 6.0, 11.0, 32.0, 73.0, 124.0, 287.0, 712.0, 2505.0, 20684.0, 737172.0, 274378.0, 9904.0, 1638.0, 540.0, 213.0, 105.0, 54.0, 25.0, 19.0, 9.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.4755859375, -1.4376068115234375, -1.399627685546875, -1.3616485595703125, -1.32366943359375, -1.2856903076171875, -1.247711181640625, -1.2097320556640625, -1.1717529296875, -1.1337738037109375, -1.095794677734375, -1.0578155517578125, -1.01983642578125, -0.9818572998046875, -0.943878173828125, -0.9058990478515625, -0.867919921875, -0.8299407958984375, -0.791961669921875, -0.7539825439453125, -0.71600341796875, -0.6780242919921875, -0.640045166015625, -0.6020660400390625, -0.5640869140625, -0.5261077880859375, -0.488128662109375, -0.4501495361328125, -0.41217041015625, -0.3741912841796875, -0.336212158203125, -0.2982330322265625, -0.26025390625, -0.2222747802734375, -0.184295654296875, -0.1463165283203125, -0.10833740234375, -0.0703582763671875, -0.032379150390625, 0.0055999755859375, 0.0435791015625, 0.0815582275390625, 0.119537353515625, 0.1575164794921875, 0.19549560546875, 0.2334747314453125, 0.271453857421875, 0.3094329833984375, 0.347412109375, 0.3853912353515625, 0.423370361328125, 0.4613494873046875, 0.49932861328125, 0.5373077392578125, 0.575286865234375, 0.6132659912109375, 0.6512451171875, 0.6892242431640625, 0.727203369140625, 0.7651824951171875, 0.80316162109375, 0.8411407470703125, 0.879119873046875, 0.9170989990234375, 0.955078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 9.0, 11.0, 14.0, 19.0, 28.0, 24.0, 45.0, 74.0, 116.0, 169.0, 147.0, 107.0, 66.0, 44.0, 22.0, 17.0, 24.0, 16.0, 11.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015997886657714844, -0.00015585683286190033, -0.00015173479914665222, -0.00014761276543140411, -0.000143490731716156, -0.0001393686980009079, -0.0001352466642856598, -0.00013112463057041168, -0.00012700259685516357, -0.00012288056313991547, -0.00011875852942466736, -0.00011463649570941925, -0.00011051446199417114, -0.00010639242827892303, -0.00010227039456367493, -9.814836084842682e-05, -9.402632713317871e-05, -8.99042934179306e-05, -8.57822597026825e-05, -8.166022598743439e-05, -7.753819227218628e-05, -7.341615855693817e-05, -6.929412484169006e-05, -6.517209112644196e-05, -6.105005741119385e-05, -5.692802369594574e-05, -5.280598998069763e-05, -4.8683956265449524e-05, -4.4561922550201416e-05, -4.043988883495331e-05, -3.63178551197052e-05, -3.219582140445709e-05, -2.8073787689208984e-05, -2.3951753973960876e-05, -1.982972025871277e-05, -1.570768654346466e-05, -1.1585652828216553e-05, -7.463619112968445e-06, -3.341585397720337e-06, 7.80448317527771e-07, 4.902482032775879e-06, 9.024515748023987e-06, 1.3146549463272095e-05, 1.7268583178520203e-05, 2.139061689376831e-05, 2.551265060901642e-05, 2.9634684324264526e-05, 3.3756718039512634e-05, 3.787875175476074e-05, 4.200078547000885e-05, 4.612281918525696e-05, 5.0244852900505066e-05, 5.4366886615753174e-05, 5.848892033100128e-05, 6.261095404624939e-05, 6.67329877614975e-05, 7.08550214767456e-05, 7.497705519199371e-05, 7.909908890724182e-05, 8.322112262248993e-05, 8.734315633773804e-05, 9.146519005298615e-05, 9.558722376823425e-05, 9.970925748348236e-05, 0.00010383129119873047]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 0.0, 5.0, 8.0, 10.0, 16.0, 25.0, 29.0, 81.0, 202.0, 424.0, 1470.0, 8681.0, 321921.0, 699030.0, 13836.0, 1930.0, 499.0, 195.0, 95.0, 36.0, 20.0, 14.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.28399658203125, -1.2398681640625, -1.19573974609375, -1.151611328125, -1.10748291015625, -1.0633544921875, -1.01922607421875, -0.97509765625, -0.93096923828125, -0.8868408203125, -0.84271240234375, -0.798583984375, -0.75445556640625, -0.7103271484375, -0.66619873046875, -0.6220703125, -0.57794189453125, -0.5338134765625, -0.48968505859375, -0.445556640625, -0.40142822265625, -0.3572998046875, -0.31317138671875, -0.26904296875, -0.22491455078125, -0.1807861328125, -0.13665771484375, -0.092529296875, -0.04840087890625, -0.0042724609375, 0.03985595703125, 0.083984375, 0.12811279296875, 0.1722412109375, 0.21636962890625, 0.260498046875, 0.30462646484375, 0.3487548828125, 0.39288330078125, 0.43701171875, 0.48114013671875, 0.5252685546875, 0.56939697265625, 0.613525390625, 0.65765380859375, 0.7017822265625, 0.74591064453125, 0.7900390625, 0.83416748046875, 0.8782958984375, 0.92242431640625, 0.966552734375, 1.01068115234375, 1.0548095703125, 1.09893798828125, 1.14306640625, 1.18719482421875, 1.2313232421875, 1.27545166015625, 1.319580078125, 1.36370849609375, 1.4078369140625, 1.45196533203125, 1.49609375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 9.0, 7.0, 14.0, 26.0, 62.0, 94.0, 167.0, 211.0, 171.0, 101.0, 51.0, 22.0, 18.0, 5.0, 5.0, 10.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.001953125, -0.96673583984375, -0.9315185546875, -0.89630126953125, -0.861083984375, -0.82586669921875, -0.7906494140625, -0.75543212890625, -0.72021484375, -0.68499755859375, -0.6497802734375, -0.61456298828125, -0.579345703125, -0.54412841796875, -0.5089111328125, -0.47369384765625, -0.4384765625, -0.40325927734375, -0.3680419921875, -0.33282470703125, -0.297607421875, -0.26239013671875, -0.2271728515625, -0.19195556640625, -0.15673828125, -0.12152099609375, -0.0863037109375, -0.05108642578125, -0.015869140625, 0.01934814453125, 0.0545654296875, 0.08978271484375, 0.125, 0.16021728515625, 0.1954345703125, 0.23065185546875, 0.265869140625, 0.30108642578125, 0.3363037109375, 0.37152099609375, 0.40673828125, 0.44195556640625, 0.4771728515625, 0.51239013671875, 0.547607421875, 0.58282470703125, 0.6180419921875, 0.65325927734375, 0.6884765625, 0.72369384765625, 0.7589111328125, 0.79412841796875, 0.829345703125, 0.86456298828125, 0.8997802734375, 0.93499755859375, 0.97021484375, 1.00543212890625, 1.0406494140625, 1.07586669921875, 1.111083984375, 1.14630126953125, 1.1815185546875, 1.21673583984375, 1.251953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 11.0, 17.0, 51.0, 82.0, 128.0, 178.0, 207.0, 123.0, 102.0, 46.0, 24.0, 18.0, 9.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.435640335083008, -13.028328895568848, -12.621017456054688, -12.213706016540527, -11.806394577026367, -11.399084091186523, -10.991772651672363, -10.584461212158203, -10.177149772644043, -9.769838333129883, -9.362526893615723, -8.955215454101562, -8.547904968261719, -8.140592575073242, -7.733282089233398, -7.325970649719238, -6.918659210205078, -6.511347770690918, -6.104036331176758, -5.696725368499756, -5.289413928985596, -4.8821024894714355, -4.474791526794434, -4.067480087280273, -3.6601686477661133, -3.252857208251953, -2.845546007156372, -2.438234806060791, -2.030923366546631, -1.6236119270324707, -1.2163007259368896, -0.8089895248413086, -0.40167808532714844, 0.005633234977722168, 0.4129445552825928, 0.8202558755874634, 1.227567195892334, 1.6348786354064941, 2.042189836502075, 2.4495010375976562, 2.8568124771118164, 3.2641239166259766, 3.6714351177215576, 4.078746318817139, 4.486057758331299, 4.893369197845459, 5.300680160522461, 5.707991600036621, 6.115303039550781, 6.522614479064941, 6.929925918579102, 7.3372368812561035, 7.744548320770264, 8.151859283447266, 8.559170722961426, 8.966482162475586, 9.373793601989746, 9.781105041503906, 10.188416481018066, 10.595727920532227, 11.00303840637207, 11.410350799560547, 11.81766128540039, 12.22497272491455, 12.632284164428711]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 7.0, 13.0, 21.0, 20.0, 28.0, 32.0, 44.0, 46.0, 42.0, 44.0, 47.0, 51.0, 58.0, 72.0, 79.0, 52.0, 61.0, 52.0, 36.0, 46.0, 27.0, 26.0, 25.0, 12.0, 11.0, 14.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.41448974609375, -16.992488861083984, -16.57048797607422, -16.148487091064453, -15.726485252380371, -15.304483413696289, -14.882482528686523, -14.460481643676758, -14.038479804992676, -13.61647891998291, -13.194477081298828, -12.772476196289062, -12.350475311279297, -11.928473472595215, -11.50647258758545, -11.084470748901367, -10.662469863891602, -10.240468978881836, -9.818467140197754, -9.396466255187988, -8.974465370178223, -8.55246353149414, -8.130462646484375, -7.708461284637451, -7.286460876464844, -6.86445951461792, -6.442458629608154, -6.0204572677612305, -5.598455905914307, -5.176454544067383, -4.754453659057617, -4.332452297210693, -3.9104509353637695, -3.488449811935425, -3.066448450088501, -2.6444473266601562, -2.2224459648132324, -1.8004448413848877, -1.378443717956543, -0.9564423561096191, -0.5344412326812744, -0.11244001984596252, 0.30956119298934937, 0.7315623760223389, 1.1535636186599731, 1.5755648612976074, 1.9975659847259521, 2.419567346572876, 2.8415684700012207, 3.2635695934295654, 3.6855709552764893, 4.107572078704834, 4.529573440551758, 4.951574325561523, 5.373575687408447, 5.795577049255371, 6.217577934265137, 6.6395792961120605, 7.061580181121826, 7.48358154296875, 7.905582904815674, 8.327584266662598, 8.749585151672363, 9.171586990356445, 9.593587875366211]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 5.0, 9.0, 15.0, 24.0, 34.0, 59.0, 111.0, 212.0, 400.0, 1022.0, 3171.0, 16288.0, 400227.0, 3733500.0, 30679.0, 5382.0, 1650.0, 676.0, 332.0, 179.0, 115.0, 50.0, 35.0, 26.0, 22.0, 15.0, 11.0, 11.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.15960693359375, -2.0828857421875, -2.00616455078125, -1.929443359375, -1.85272216796875, -1.7760009765625, -1.69927978515625, -1.62255859375, -1.54583740234375, -1.4691162109375, -1.39239501953125, -1.315673828125, -1.23895263671875, -1.1622314453125, -1.08551025390625, -1.0087890625, -0.93206787109375, -0.8553466796875, -0.77862548828125, -0.701904296875, -0.62518310546875, -0.5484619140625, -0.47174072265625, -0.39501953125, -0.31829833984375, -0.2415771484375, -0.16485595703125, -0.088134765625, -0.01141357421875, 0.0653076171875, 0.14202880859375, 0.21875, 0.29547119140625, 0.3721923828125, 0.44891357421875, 0.525634765625, 0.60235595703125, 0.6790771484375, 0.75579833984375, 0.83251953125, 0.90924072265625, 0.9859619140625, 1.06268310546875, 1.139404296875, 1.21612548828125, 1.2928466796875, 1.36956787109375, 1.4462890625, 1.52301025390625, 1.5997314453125, 1.67645263671875, 1.753173828125, 1.82989501953125, 1.9066162109375, 1.98333740234375, 2.06005859375, 2.13677978515625, 2.2135009765625, 2.29022216796875, 2.366943359375, 2.44366455078125, 2.5203857421875, 2.59710693359375, 2.673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 14.0, 21.0, 44.0, 50.0, 75.0, 95.0, 102.0, 108.0, 117.0, 83.0, 85.0, 59.0, 46.0, 32.0, 17.0, 13.0, 8.0, 1.0, 4.0, 12.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7245941162109375, -0.697723388671875, -0.6708526611328125, -0.64398193359375, -0.6171112060546875, -0.590240478515625, -0.5633697509765625, -0.5364990234375, -0.5096282958984375, -0.482757568359375, -0.4558868408203125, -0.42901611328125, -0.4021453857421875, -0.375274658203125, -0.3484039306640625, -0.321533203125, -0.2946624755859375, -0.267791748046875, -0.2409210205078125, -0.21405029296875, -0.1871795654296875, -0.160308837890625, -0.1334381103515625, -0.1065673828125, -0.0796966552734375, -0.052825927734375, -0.0259552001953125, 0.00091552734375, 0.0277862548828125, 0.054656982421875, 0.0815277099609375, 0.1083984375, 0.1352691650390625, 0.162139892578125, 0.1890106201171875, 0.21588134765625, 0.2427520751953125, 0.269622802734375, 0.2964935302734375, 0.3233642578125, 0.3502349853515625, 0.377105712890625, 0.4039764404296875, 0.43084716796875, 0.4577178955078125, 0.484588623046875, 0.5114593505859375, 0.538330078125, 0.5652008056640625, 0.592071533203125, 0.6189422607421875, 0.64581298828125, 0.6726837158203125, 0.699554443359375, 0.7264251708984375, 0.7532958984375, 0.7801666259765625, 0.807037353515625, 0.8339080810546875, 0.86077880859375, 0.8876495361328125, 0.914520263671875, 0.9413909912109375, 0.96826171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 19.0, 21.0, 48.0, 80.0, 148.0, 318.0, 827.0, 2698.0, 11248.0, 82194.0, 3579180.0, 482229.0, 27572.0, 5324.0, 1481.0, 471.0, 195.0, 82.0, 54.0, 26.0, 10.0, 18.0, 3.0, 5.0, 4.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6494598388671875, -1.604583740234375, -1.5597076416015625, -1.51483154296875, -1.4699554443359375, -1.425079345703125, -1.3802032470703125, -1.3353271484375, -1.2904510498046875, -1.245574951171875, -1.2006988525390625, -1.15582275390625, -1.1109466552734375, -1.066070556640625, -1.0211944580078125, -0.976318359375, -0.9314422607421875, -0.886566162109375, -0.8416900634765625, -0.79681396484375, -0.7519378662109375, -0.707061767578125, -0.6621856689453125, -0.6173095703125, -0.5724334716796875, -0.527557373046875, -0.4826812744140625, -0.43780517578125, -0.3929290771484375, -0.348052978515625, -0.3031768798828125, -0.25830078125, -0.2134246826171875, -0.168548583984375, -0.1236724853515625, -0.07879638671875, -0.0339202880859375, 0.010955810546875, 0.0558319091796875, 0.1007080078125, 0.1455841064453125, 0.190460205078125, 0.2353363037109375, 0.28021240234375, 0.3250885009765625, 0.369964599609375, 0.4148406982421875, 0.459716796875, 0.5045928955078125, 0.549468994140625, 0.5943450927734375, 0.63922119140625, 0.6840972900390625, 0.728973388671875, 0.7738494873046875, 0.8187255859375, 0.8636016845703125, 0.908477783203125, 0.9533538818359375, 0.99822998046875, 1.0431060791015625, 1.087982177734375, 1.1328582763671875, 1.177734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 6.0, 5.0, 3.0, 7.0, 6.0, 17.0, 25.0, 24.0, 49.0, 78.0, 153.0, 264.0, 712.0, 1471.0, 599.0, 251.0, 155.0, 87.0, 47.0, 27.0, 18.0, 14.0, 7.0, 10.0, 7.0, 6.0, 2.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.52197265625, -0.5087318420410156, -0.49549102783203125, -0.4822502136230469, -0.4690093994140625, -0.4557685852050781, -0.44252777099609375, -0.4292869567871094, -0.416046142578125, -0.4028053283691406, -0.38956451416015625, -0.3763236999511719, -0.3630828857421875, -0.3498420715332031, -0.33660125732421875, -0.3233604431152344, -0.31011962890625, -0.2968788146972656, -0.28363800048828125, -0.2703971862792969, -0.2571563720703125, -0.24391555786132812, -0.23067474365234375, -0.21743392944335938, -0.204193115234375, -0.19095230102539062, -0.17771148681640625, -0.16447067260742188, -0.1512298583984375, -0.13798904418945312, -0.12474822998046875, -0.11150741577148438, -0.0982666015625, -0.08502578735351562, -0.07178497314453125, -0.058544158935546875, -0.0453033447265625, -0.032062530517578125, -0.01882171630859375, -0.005580902099609375, 0.007659912109375, 0.020900726318359375, 0.03414154052734375, 0.047382354736328125, 0.0606231689453125, 0.07386398315429688, 0.08710479736328125, 0.10034561157226562, 0.11358642578125, 0.12682723999023438, 0.14006805419921875, 0.15330886840820312, 0.1665496826171875, 0.17979049682617188, 0.19303131103515625, 0.20627212524414062, 0.219512939453125, 0.23275375366210938, 0.24599456787109375, 0.2592353820800781, 0.2724761962890625, 0.2857170104980469, 0.29895782470703125, 0.3121986389160156, 0.325439453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 7.0, 17.0, 33.0, 74.0, 122.0, 189.0, 195.0, 161.0, 98.0, 56.0, 28.0, 12.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9603676795959473, -3.8686041831970215, -3.7768406867980957, -3.68507719039917, -3.593313694000244, -3.5015501976013184, -3.4097867012023926, -3.318023204803467, -3.226259708404541, -3.1344962120056152, -3.0427327156066895, -2.9509692192077637, -2.859205722808838, -2.767442226409912, -2.6756787300109863, -2.5839152336120605, -2.4921514987945557, -2.40038800239563, -2.308624505996704, -2.2168610095977783, -2.1250975131988525, -2.0333340167999268, -1.9415704011917114, -1.8498069047927856, -1.7580434083938599, -1.666279911994934, -1.5745164155960083, -1.482752799987793, -1.3909893035888672, -1.2992258071899414, -1.2074623107910156, -1.1156988143920898, -1.0239351987838745, -0.9321717023849487, -0.840408205986023, -0.7486446499824524, -0.6568811535835266, -0.5651176571846008, -0.4733541011810303, -0.3815906047821045, -0.2898271083831787, -0.19806359708309174, -0.10630008578300476, -0.014536559581756592, 0.07722693681716919, 0.16899043321609497, 0.2607539892196655, 0.3525174856185913, 0.4442809820175171, 0.5360444784164429, 0.6278079748153687, 0.7195715308189392, 0.811335027217865, 0.9030985236167908, 0.9948620796203613, 1.086625576019287, 1.178389072418213, 1.2701525688171387, 1.3619160652160645, 1.4536795616149902, 1.545443058013916, 1.6372065544128418, 1.7289701700210571, 1.820733666419983, 1.9124971628189087]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 8.0, 13.0, 16.0, 19.0, 21.0, 19.0, 30.0, 37.0, 41.0, 28.0, 42.0, 36.0, 55.0, 40.0, 50.0, 65.0, 54.0, 62.0, 41.0, 45.0, 40.0, 28.0, 27.0, 29.0, 19.0, 19.0, 14.0, 22.0, 6.0, 15.0, 15.0, 7.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.764317512512207, -1.7188403606414795, -1.673363208770752, -1.6278860569000244, -1.5824089050292969, -1.5369316339492798, -1.4914544820785522, -1.4459773302078247, -1.4005001783370972, -1.3550230264663696, -1.309545874595642, -1.2640687227249146, -1.2185914516448975, -1.17311429977417, -1.1276371479034424, -1.0821599960327148, -1.0366828441619873, -0.9912056922912598, -0.9457285404205322, -0.9002513289451599, -0.8547741770744324, -0.8092970252037048, -0.7638198137283325, -0.718342661857605, -0.6728655099868774, -0.6273883581161499, -0.5819112062454224, -0.53643399477005, -0.4909568428993225, -0.44547969102859497, -0.40000250935554504, -0.3545253276824951, -0.3090481758117676, -0.26357102394104004, -0.2180938422679901, -0.17261667549610138, -0.12713950872421265, -0.08166234195232391, -0.03618517518043518, 0.009292006492614746, 0.054769158363342285, 0.10024632513523102, 0.14572349190711975, 0.19120065867900848, 0.23667782545089722, 0.28215497732162476, 0.3276321589946747, 0.3731093406677246, 0.41858649253845215, 0.4640636444091797, 0.5095407962799072, 0.5550180077552795, 0.6004951596260071, 0.6459723114967346, 0.6914495229721069, 0.7369266748428345, 0.782403826713562, 0.8278809785842896, 0.8733581304550171, 0.9188353419303894, 0.9643124938011169, 1.0097897052764893, 1.0552668571472168, 1.1007440090179443, 1.1462211608886719]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 9.0, 11.0, 18.0, 27.0, 22.0, 33.0, 43.0, 86.0, 118.0, 135.0, 225.0, 360.0, 560.0, 906.0, 1572.0, 2895.0, 6699.0, 17782.0, 58038.0, 203049.0, 411523.0, 238044.0, 70190.0, 20720.0, 7638.0, 3437.0, 1731.0, 921.0, 593.0, 368.0, 232.0, 173.0, 109.0, 90.0, 47.0, 45.0, 27.0, 23.0, 15.0, 6.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.443359375, -1.3990478515625, -1.354736328125, -1.3104248046875, -1.26611328125, -1.2218017578125, -1.177490234375, -1.1331787109375, -1.0888671875, -1.0445556640625, -1.000244140625, -0.9559326171875, -0.91162109375, -0.8673095703125, -0.822998046875, -0.7786865234375, -0.734375, -0.6900634765625, -0.645751953125, -0.6014404296875, -0.55712890625, -0.5128173828125, -0.468505859375, -0.4241943359375, -0.3798828125, -0.3355712890625, -0.291259765625, -0.2469482421875, -0.20263671875, -0.1583251953125, -0.114013671875, -0.0697021484375, -0.025390625, 0.0189208984375, 0.063232421875, 0.1075439453125, 0.15185546875, 0.1961669921875, 0.240478515625, 0.2847900390625, 0.3291015625, 0.3734130859375, 0.417724609375, 0.4620361328125, 0.50634765625, 0.5506591796875, 0.594970703125, 0.6392822265625, 0.68359375, 0.7279052734375, 0.772216796875, 0.8165283203125, 0.86083984375, 0.9051513671875, 0.949462890625, 0.9937744140625, 1.0380859375, 1.0823974609375, 1.126708984375, 1.1710205078125, 1.21533203125, 1.2596435546875, 1.303955078125, 1.3482666015625, 1.392578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 12.0, 27.0, 35.0, 67.0, 64.0, 97.0, 110.0, 107.0, 107.0, 92.0, 79.0, 64.0, 39.0, 32.0, 22.0, 9.0, 3.0, 5.0, 4.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.771484375, -0.7447509765625, -0.718017578125, -0.6912841796875, -0.66455078125, -0.6378173828125, -0.611083984375, -0.5843505859375, -0.5576171875, -0.5308837890625, -0.504150390625, -0.4774169921875, -0.45068359375, -0.4239501953125, -0.397216796875, -0.3704833984375, -0.34375, -0.3170166015625, -0.290283203125, -0.2635498046875, -0.23681640625, -0.2100830078125, -0.183349609375, -0.1566162109375, -0.1298828125, -0.1031494140625, -0.076416015625, -0.0496826171875, -0.02294921875, 0.0037841796875, 0.030517578125, 0.0572509765625, 0.083984375, 0.1107177734375, 0.137451171875, 0.1641845703125, 0.19091796875, 0.2176513671875, 0.244384765625, 0.2711181640625, 0.2978515625, 0.3245849609375, 0.351318359375, 0.3780517578125, 0.40478515625, 0.4315185546875, 0.458251953125, 0.4849853515625, 0.51171875, 0.5384521484375, 0.565185546875, 0.5919189453125, 0.61865234375, 0.6453857421875, 0.672119140625, 0.6988525390625, 0.7255859375, 0.7523193359375, 0.779052734375, 0.8057861328125, 0.83251953125, 0.8592529296875, 0.885986328125, 0.9127197265625, 0.939453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 13.0, 8.0, 13.0, 27.0, 41.0, 31.0, 82.0, 89.0, 94.0, 163.0, 273.0, 457.0, 752.0, 1463.0, 3266.0, 7699.0, 21741.0, 65664.0, 182079.0, 332890.0, 263676.0, 108882.0, 37030.0, 12566.0, 4794.0, 2053.0, 1067.0, 549.0, 362.0, 211.0, 143.0, 102.0, 72.0, 52.0, 38.0, 24.0, 32.0, 16.0, 15.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.0390625, -1.00732421875, -0.9755859375, -0.94384765625, -0.912109375, -0.88037109375, -0.8486328125, -0.81689453125, -0.78515625, -0.75341796875, -0.7216796875, -0.68994140625, -0.658203125, -0.62646484375, -0.5947265625, -0.56298828125, -0.53125, -0.49951171875, -0.4677734375, -0.43603515625, -0.404296875, -0.37255859375, -0.3408203125, -0.30908203125, -0.27734375, -0.24560546875, -0.2138671875, -0.18212890625, -0.150390625, -0.11865234375, -0.0869140625, -0.05517578125, -0.0234375, 0.00830078125, 0.0400390625, 0.07177734375, 0.103515625, 0.13525390625, 0.1669921875, 0.19873046875, 0.23046875, 0.26220703125, 0.2939453125, 0.32568359375, 0.357421875, 0.38916015625, 0.4208984375, 0.45263671875, 0.484375, 0.51611328125, 0.5478515625, 0.57958984375, 0.611328125, 0.64306640625, 0.6748046875, 0.70654296875, 0.73828125, 0.77001953125, 0.8017578125, 0.83349609375, 0.865234375, 0.89697265625, 0.9287109375, 0.96044921875, 0.9921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 8.0, 8.0, 5.0, 5.0, 7.0, 11.0, 16.0, 15.0, 17.0, 20.0, 25.0, 27.0, 30.0, 32.0, 40.0, 46.0, 44.0, 56.0, 32.0, 48.0, 48.0, 42.0, 47.0, 29.0, 40.0, 42.0, 43.0, 27.0, 34.0, 35.0, 22.0, 19.0, 22.0, 10.0, 8.0, 13.0, 12.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78515625, -1.727630615234375, -1.67010498046875, -1.612579345703125, -1.5550537109375, -1.497528076171875, -1.44000244140625, -1.382476806640625, -1.324951171875, -1.267425537109375, -1.20989990234375, -1.152374267578125, -1.0948486328125, -1.037322998046875, -0.97979736328125, -0.922271728515625, -0.86474609375, -0.807220458984375, -0.74969482421875, -0.692169189453125, -0.6346435546875, -0.577117919921875, -0.51959228515625, -0.462066650390625, -0.404541015625, -0.347015380859375, -0.28948974609375, -0.231964111328125, -0.1744384765625, -0.116912841796875, -0.05938720703125, -0.001861572265625, 0.0556640625, 0.113189697265625, 0.17071533203125, 0.228240966796875, 0.2857666015625, 0.343292236328125, 0.40081787109375, 0.458343505859375, 0.515869140625, 0.573394775390625, 0.63092041015625, 0.688446044921875, 0.7459716796875, 0.803497314453125, 0.86102294921875, 0.918548583984375, 0.97607421875, 1.033599853515625, 1.09112548828125, 1.148651123046875, 1.2061767578125, 1.263702392578125, 1.32122802734375, 1.378753662109375, 1.436279296875, 1.493804931640625, 1.55133056640625, 1.608856201171875, 1.6663818359375, 1.723907470703125, 1.78143310546875, 1.838958740234375, 1.896484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 5.0, 9.0, 10.0, 15.0, 31.0, 44.0, 74.0, 123.0, 262.0, 632.0, 1503.0, 4673.0, 19563.0, 147233.0, 667761.0, 175955.0, 22557.0, 5133.0, 1690.0, 630.0, 290.0, 136.0, 85.0, 53.0, 27.0, 18.0, 9.0, 10.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.74609375, -0.7262191772460938, -0.7063446044921875, -0.6864700317382812, -0.666595458984375, -0.6467208862304688, -0.6268463134765625, -0.6069717407226562, -0.58709716796875, -0.5672225952148438, -0.5473480224609375, -0.5274734497070312, -0.507598876953125, -0.48772430419921875, -0.4678497314453125, -0.44797515869140625, -0.4281005859375, -0.40822601318359375, -0.3883514404296875, -0.36847686767578125, -0.348602294921875, -0.32872772216796875, -0.3088531494140625, -0.28897857666015625, -0.26910400390625, -0.24922943115234375, -0.2293548583984375, -0.20948028564453125, -0.189605712890625, -0.16973114013671875, -0.1498565673828125, -0.12998199462890625, -0.110107421875, -0.09023284912109375, -0.0703582763671875, -0.05048370361328125, -0.030609130859375, -0.01073455810546875, 0.0091400146484375, 0.02901458740234375, 0.04888916015625, 0.06876373291015625, 0.0886383056640625, 0.10851287841796875, 0.128387451171875, 0.14826202392578125, 0.1681365966796875, 0.18801116943359375, 0.2078857421875, 0.22776031494140625, 0.2476348876953125, 0.26750946044921875, 0.287384033203125, 0.30725860595703125, 0.3271331787109375, 0.34700775146484375, 0.36688232421875, 0.38675689697265625, 0.4066314697265625, 0.42650604248046875, 0.446380615234375, 0.46625518798828125, 0.4861297607421875, 0.5060043334960938, 0.52587890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 9.0, 3.0, 7.0, 12.0, 8.0, 10.0, 13.0, 16.0, 16.0, 11.0, 24.0, 26.0, 41.0, 46.0, 77.0, 74.0, 70.0, 94.0, 93.0, 67.0, 56.0, 61.0, 19.0, 23.0, 25.0, 19.0, 15.0, 9.0, 11.0, 11.0, 12.0, 2.0, 3.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.340047836303711e-05, -9.060557931661606e-05, -8.781068027019501e-05, -8.501578122377396e-05, -8.22208821773529e-05, -7.942598313093185e-05, -7.66310840845108e-05, -7.383618503808975e-05, -7.10412859916687e-05, -6.824638694524765e-05, -6.54514878988266e-05, -6.265658885240555e-05, -5.98616898059845e-05, -5.7066790759563446e-05, -5.4271891713142395e-05, -5.1476992666721344e-05, -4.868209362030029e-05, -4.588719457387924e-05, -4.309229552745819e-05, -4.029739648103714e-05, -3.750249743461609e-05, -3.470759838819504e-05, -3.191269934177399e-05, -2.9117800295352936e-05, -2.6322901248931885e-05, -2.3528002202510834e-05, -2.0733103156089783e-05, -1.793820410966873e-05, -1.514330506324768e-05, -1.234840601682663e-05, -9.553506970405579e-06, -6.758607923984528e-06, -3.9637088775634766e-06, -1.1688098311424255e-06, 1.6260892152786255e-06, 4.4209882616996765e-06, 7.2158873081207275e-06, 1.0010786354541779e-05, 1.280568540096283e-05, 1.560058444738388e-05, 1.839548349380493e-05, 2.1190382540225983e-05, 2.3985281586647034e-05, 2.6780180633068085e-05, 2.9575079679489136e-05, 3.236997872591019e-05, 3.516487777233124e-05, 3.795977681875229e-05, 4.075467586517334e-05, 4.354957491159439e-05, 4.634447395801544e-05, 4.913937300443649e-05, 5.1934272050857544e-05, 5.4729171097278595e-05, 5.7524070143699646e-05, 6.03189691901207e-05, 6.311386823654175e-05, 6.59087672829628e-05, 6.870366632938385e-05, 7.14985653758049e-05, 7.429346442222595e-05, 7.7088363468647e-05, 7.988326251506805e-05, 8.26781615614891e-05, 8.547306060791016e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 6.0, 9.0, 12.0, 20.0, 30.0, 44.0, 77.0, 143.0, 232.0, 538.0, 1407.0, 4355.0, 16705.0, 92101.0, 582944.0, 294547.0, 42156.0, 8836.0, 2578.0, 898.0, 423.0, 175.0, 97.0, 82.0, 37.0, 20.0, 19.0, 15.0, 5.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.69287109375, -0.6735076904296875, -0.654144287109375, -0.6347808837890625, -0.61541748046875, -0.5960540771484375, -0.576690673828125, -0.5573272705078125, -0.5379638671875, -0.5186004638671875, -0.499237060546875, -0.4798736572265625, -0.46051025390625, -0.4411468505859375, -0.421783447265625, -0.4024200439453125, -0.383056640625, -0.3636932373046875, -0.344329833984375, -0.3249664306640625, -0.30560302734375, -0.2862396240234375, -0.266876220703125, -0.2475128173828125, -0.2281494140625, -0.2087860107421875, -0.189422607421875, -0.1700592041015625, -0.15069580078125, -0.1313323974609375, -0.111968994140625, -0.0926055908203125, -0.0732421875, -0.0538787841796875, -0.034515380859375, -0.0151519775390625, 0.00421142578125, 0.0235748291015625, 0.042938232421875, 0.0623016357421875, 0.0816650390625, 0.1010284423828125, 0.120391845703125, 0.1397552490234375, 0.15911865234375, 0.1784820556640625, 0.197845458984375, 0.2172088623046875, 0.236572265625, 0.2559356689453125, 0.275299072265625, 0.2946624755859375, 0.31402587890625, 0.3333892822265625, 0.352752685546875, 0.3721160888671875, 0.3914794921875, 0.4108428955078125, 0.430206298828125, 0.4495697021484375, 0.46893310546875, 0.4882965087890625, 0.507659912109375, 0.5270233154296875, 0.54638671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 13.0, 7.0, 16.0, 14.0, 36.0, 28.0, 52.0, 56.0, 63.0, 83.0, 96.0, 81.0, 88.0, 84.0, 57.0, 53.0, 24.0, 29.0, 23.0, 13.0, 17.0, 11.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.63623046875, -0.6190032958984375, -0.601776123046875, -0.5845489501953125, -0.56732177734375, -0.5500946044921875, -0.532867431640625, -0.5156402587890625, -0.4984130859375, -0.4811859130859375, -0.463958740234375, -0.4467315673828125, -0.42950439453125, -0.4122772216796875, -0.395050048828125, -0.3778228759765625, -0.360595703125, -0.3433685302734375, -0.326141357421875, -0.3089141845703125, -0.29168701171875, -0.2744598388671875, -0.257232666015625, -0.2400054931640625, -0.2227783203125, -0.2055511474609375, -0.188323974609375, -0.1710968017578125, -0.15386962890625, -0.1366424560546875, -0.119415283203125, -0.1021881103515625, -0.0849609375, -0.0677337646484375, -0.050506591796875, -0.0332794189453125, -0.01605224609375, 0.0011749267578125, 0.018402099609375, 0.0356292724609375, 0.0528564453125, 0.0700836181640625, 0.087310791015625, 0.1045379638671875, 0.12176513671875, 0.1389923095703125, 0.156219482421875, 0.1734466552734375, 0.190673828125, 0.2079010009765625, 0.225128173828125, 0.2423553466796875, 0.25958251953125, 0.2768096923828125, 0.294036865234375, 0.3112640380859375, 0.3284912109375, 0.3457183837890625, 0.362945556640625, 0.3801727294921875, 0.39739990234375, 0.4146270751953125, 0.431854248046875, 0.4490814208984375, 0.46630859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 7.0, 5.0, 17.0, 22.0, 32.0, 54.0, 90.0, 99.0, 147.0, 154.0, 120.0, 86.0, 75.0, 47.0, 21.0, 8.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.080207824707031, -12.77075481414795, -12.46130084991455, -12.151847839355469, -11.84239387512207, -11.532940864562988, -11.223487854003906, -10.914033889770508, -10.604580879211426, -10.295127868652344, -9.985673904418945, -9.676220893859863, -9.366767883300781, -9.057313919067383, -8.7478609085083, -8.438407897949219, -8.12895393371582, -7.81950044631958, -7.51004695892334, -7.200593948364258, -6.891140460968018, -6.581686973571777, -6.272233963012695, -5.962780475616455, -5.653326988220215, -5.343873500823975, -5.034420013427734, -4.724967002868652, -4.415513515472412, -4.106060028076172, -3.7966067790985107, -3.4871535301208496, -3.177699565887451, -2.868246078491211, -2.55879282951355, -2.2493395805358887, -1.9398860931396484, -1.6304327249526978, -1.320979356765747, -1.011526107788086, -0.7020726203918457, -0.392619252204895, -0.08316588401794434, 0.22628748416900635, 0.535740852355957, 0.8451942205429077, 1.1546475887298584, 1.4641008377075195, 1.7735543251037598, 2.0830078125, 2.392461061477661, 2.7019143104553223, 3.0113677978515625, 3.3208212852478027, 3.630274534225464, 3.939727783203125, 4.249181270599365, 4.5586347579956055, 4.8680877685546875, 5.177541255950928, 5.486994743347168, 5.796448230743408, 6.105901718139648, 6.4153547286987305, 6.724808216094971]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 1.0, 3.0, 8.0, 6.0, 9.0, 7.0, 9.0, 10.0, 19.0, 19.0, 12.0, 18.0, 19.0, 28.0, 39.0, 30.0, 23.0, 26.0, 40.0, 31.0, 36.0, 33.0, 42.0, 53.0, 38.0, 49.0, 32.0, 34.0, 40.0, 36.0, 36.0, 31.0, 29.0, 24.0, 22.0, 18.0, 14.0, 12.0, 9.0, 11.0, 8.0, 11.0, 5.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.01206111907959, -9.717901229858398, -9.42374038696289, -9.1295804977417, -8.835420608520508, -8.541259765625, -8.247099876403809, -7.952939987182617, -7.658779621124268, -7.364619255065918, -7.070459365844727, -6.776298999786377, -6.482138633728027, -6.187978744506836, -5.893818378448486, -5.599658012390137, -5.305498123168945, -5.011337757110596, -4.717177867889404, -4.423017501831055, -4.128857612609863, -3.8346972465515137, -3.540536880493164, -3.2463767528533936, -2.952216625213623, -2.6580564975738525, -2.363896369934082, -2.0697360038757324, -1.775575876235962, -1.4814157485961914, -1.1872555017471313, -0.8930952548980713, -0.5989341735839844, -0.3047739863395691, -0.010613799095153809, 0.2835463881492615, 0.5777065753936768, 0.8718667030334473, 1.1660269498825073, 1.4601871967315674, 1.754347324371338, 2.0485074520111084, 2.342667579650879, 2.6368279457092285, 2.930988073348999, 3.2251482009887695, 3.519308567047119, 3.8134686946868896, 4.10762882232666, 4.40178918838501, 4.695949077606201, 4.990109443664551, 5.284269332885742, 5.578429698944092, 5.872590065002441, 6.166749954223633, 6.460910320281982, 6.755070686340332, 7.049230575561523, 7.343390941619873, 7.637551307678223, 7.931711196899414, 8.225871086120605, 8.520031929016113, 8.814191818237305]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 12.0, 16.0, 15.0, 32.0, 52.0, 68.0, 120.0, 193.0, 335.0, 623.0, 1542.0, 4618.0, 20268.0, 287563.0, 3807681.0, 56602.0, 9423.0, 2683.0, 1108.0, 519.0, 270.0, 190.0, 108.0, 73.0, 47.0, 32.0, 23.0, 19.0, 9.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9697265625, -1.9046173095703125, -1.839508056640625, -1.7743988037109375, -1.70928955078125, -1.6441802978515625, -1.579071044921875, -1.5139617919921875, -1.4488525390625, -1.3837432861328125, -1.318634033203125, -1.2535247802734375, -1.18841552734375, -1.1233062744140625, -1.058197021484375, -0.9930877685546875, -0.927978515625, -0.8628692626953125, -0.797760009765625, -0.7326507568359375, -0.66754150390625, -0.6024322509765625, -0.537322998046875, -0.4722137451171875, -0.4071044921875, -0.3419952392578125, -0.276885986328125, -0.2117767333984375, -0.14666748046875, -0.0815582275390625, -0.016448974609375, 0.0486602783203125, 0.11376953125, 0.1788787841796875, 0.243988037109375, 0.3090972900390625, 0.37420654296875, 0.4393157958984375, 0.504425048828125, 0.5695343017578125, 0.6346435546875, 0.6997528076171875, 0.764862060546875, 0.8299713134765625, 0.89508056640625, 0.9601898193359375, 1.025299072265625, 1.0904083251953125, 1.155517578125, 1.2206268310546875, 1.285736083984375, 1.3508453369140625, 1.41595458984375, 1.4810638427734375, 1.546173095703125, 1.6112823486328125, 1.6763916015625, 1.7415008544921875, 1.806610107421875, 1.8717193603515625, 1.93682861328125, 2.0019378662109375, 2.067047119140625, 2.1321563720703125, 2.197265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 18.0, 27.0, 33.0, 52.0, 67.0, 85.0, 81.0, 116.0, 98.0, 82.0, 80.0, 70.0, 48.0, 44.0, 22.0, 14.0, 14.0, 10.0, 8.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78564453125, -0.7578125, -0.72998046875, -0.7021484375, -0.67431640625, -0.646484375, -0.61865234375, -0.5908203125, -0.56298828125, -0.53515625, -0.50732421875, -0.4794921875, -0.45166015625, -0.423828125, -0.39599609375, -0.3681640625, -0.34033203125, -0.3125, -0.28466796875, -0.2568359375, -0.22900390625, -0.201171875, -0.17333984375, -0.1455078125, -0.11767578125, -0.08984375, -0.06201171875, -0.0341796875, -0.00634765625, 0.021484375, 0.04931640625, 0.0771484375, 0.10498046875, 0.1328125, 0.16064453125, 0.1884765625, 0.21630859375, 0.244140625, 0.27197265625, 0.2998046875, 0.32763671875, 0.35546875, 0.38330078125, 0.4111328125, 0.43896484375, 0.466796875, 0.49462890625, 0.5224609375, 0.55029296875, 0.578125, 0.60595703125, 0.6337890625, 0.66162109375, 0.689453125, 0.71728515625, 0.7451171875, 0.77294921875, 0.80078125, 0.82861328125, 0.8564453125, 0.88427734375, 0.912109375, 0.93994140625, 0.9677734375, 0.99560546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 7.0, 26.0, 48.0, 90.0, 179.0, 371.0, 809.0, 1854.0, 5503.0, 24375.0, 468036.0, 3611859.0, 66175.0, 10038.0, 2947.0, 1067.0, 430.0, 221.0, 112.0, 61.0, 22.0, 11.0, 14.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9169921875, -1.8654937744140625, -1.813995361328125, -1.7624969482421875, -1.71099853515625, -1.6595001220703125, -1.608001708984375, -1.5565032958984375, -1.5050048828125, -1.4535064697265625, -1.402008056640625, -1.3505096435546875, -1.29901123046875, -1.2475128173828125, -1.196014404296875, -1.1445159912109375, -1.093017578125, -1.0415191650390625, -0.990020751953125, -0.9385223388671875, -0.88702392578125, -0.8355255126953125, -0.784027099609375, -0.7325286865234375, -0.6810302734375, -0.6295318603515625, -0.578033447265625, -0.5265350341796875, -0.47503662109375, -0.4235382080078125, -0.372039794921875, -0.3205413818359375, -0.26904296875, -0.2175445556640625, -0.166046142578125, -0.1145477294921875, -0.06304931640625, -0.0115509033203125, 0.039947509765625, 0.0914459228515625, 0.1429443359375, 0.1944427490234375, 0.245941162109375, 0.2974395751953125, 0.34893798828125, 0.4004364013671875, 0.451934814453125, 0.5034332275390625, 0.554931640625, 0.6064300537109375, 0.657928466796875, 0.7094268798828125, 0.76092529296875, 0.8124237060546875, 0.863922119140625, 0.9154205322265625, 0.9669189453125, 1.0184173583984375, 1.069915771484375, 1.1214141845703125, 1.17291259765625, 1.2244110107421875, 1.275909423828125, 1.3274078369140625, 1.37890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 6.0, 1.0, 4.0, 3.0, 4.0, 12.0, 13.0, 34.0, 44.0, 64.0, 160.0, 325.0, 1187.0, 1402.0, 440.0, 145.0, 69.0, 51.0, 35.0, 14.0, 14.0, 7.0, 7.0, 2.0, 9.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70751953125, -0.6867446899414062, -0.6659698486328125, -0.6451950073242188, -0.624420166015625, -0.6036453247070312, -0.5828704833984375, -0.5620956420898438, -0.54132080078125, -0.5205459594726562, -0.4997711181640625, -0.47899627685546875, -0.458221435546875, -0.43744659423828125, -0.4166717529296875, -0.39589691162109375, -0.3751220703125, -0.35434722900390625, -0.3335723876953125, -0.31279754638671875, -0.292022705078125, -0.27124786376953125, -0.2504730224609375, -0.22969818115234375, -0.20892333984375, -0.18814849853515625, -0.1673736572265625, -0.14659881591796875, -0.125823974609375, -0.10504913330078125, -0.0842742919921875, -0.06349945068359375, -0.042724609375, -0.02194976806640625, -0.0011749267578125, 0.01959991455078125, 0.040374755859375, 0.06114959716796875, 0.0819244384765625, 0.10269927978515625, 0.12347412109375, 0.14424896240234375, 0.1650238037109375, 0.18579864501953125, 0.206573486328125, 0.22734832763671875, 0.2481231689453125, 0.26889801025390625, 0.2896728515625, 0.31044769287109375, 0.3312225341796875, 0.35199737548828125, 0.372772216796875, 0.39354705810546875, 0.4143218994140625, 0.43509674072265625, 0.45587158203125, 0.47664642333984375, 0.4974212646484375, 0.5181961059570312, 0.538970947265625, 0.5597457885742188, 0.5805206298828125, 0.6012954711914062, 0.6220703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 7.0, 34.0, 105.0, 277.0, 320.0, 177.0, 60.0, 16.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.58192253112793, -9.38638973236084, -9.190855979919434, -8.995323181152344, -8.799789428710938, -8.604256629943848, -8.408723831176758, -8.213190078735352, -8.017657279968262, -7.822124004364014, -7.626590728759766, -7.431057929992676, -7.235524654388428, -7.03999137878418, -6.84445858001709, -6.648925304412842, -6.453392028808594, -6.257858753204346, -6.062325477600098, -5.866792678833008, -5.67125940322876, -5.475726127624512, -5.280193328857422, -5.084660053253174, -4.889126777648926, -4.693593502044678, -4.49806022644043, -4.30252742767334, -4.106994152069092, -3.9114608764648438, -3.715927839279175, -3.520394802093506, -3.324861526489258, -3.1293282508850098, -2.933795213699341, -2.738262176513672, -2.542728900909424, -2.347195625305176, -2.151662588119507, -1.9561294317245483, -1.7605962753295898, -1.5650631189346313, -1.3695299625396729, -1.1739968061447144, -0.9784636497497559, -0.7829304933547974, -0.5873973369598389, -0.39186418056488037, -0.19633102416992188, -0.0007978677749633789, 0.19473528861999512, 0.3902684450149536, 0.5858016014099121, 0.7813347578048706, 0.9768679141998291, 1.1724010705947876, 1.367934226989746, 1.5634673833847046, 1.759000539779663, 1.9545336961746216, 2.15006685256958, 2.345600128173828, 2.541133165359497, 2.736666202545166, 2.932199478149414]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 11.0, 8.0, 15.0, 28.0, 26.0, 63.0, 68.0, 73.0, 85.0, 97.0, 93.0, 106.0, 70.0, 68.0, 50.0, 49.0, 31.0, 27.0, 12.0, 10.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.362725734710693, -4.242800235748291, -4.122874736785889, -4.0029497146606445, -3.883024215698242, -3.76309871673584, -3.6431732177734375, -3.5232479572296143, -3.403322696685791, -3.2833971977233887, -3.1634719371795654, -3.043546438217163, -2.92362117767334, -2.8036956787109375, -2.683770179748535, -2.563844919204712, -2.4439194202423096, -2.3239939212799072, -2.204068660736084, -2.0841431617736816, -1.9642179012298584, -1.844292402267456, -1.7243670225143433, -1.6044416427612305, -1.4845162630081177, -1.3645908832550049, -1.244665503501892, -1.1247401237487793, -1.004814624786377, -0.8848893046379089, -0.7649638652801514, -0.6450384855270386, -0.5251133441925049, -0.4051879644393921, -0.2852625548839569, -0.16533714532852173, -0.045411765575408936, 0.07451361417770386, 0.19443905353546143, 0.3143644332885742, 0.434289813041687, 0.5542151927947998, 0.6741405725479126, 0.7940660119056702, 0.913991391658783, 1.033916711807251, 1.1538422107696533, 1.2737675905227661, 1.393692970275879, 1.5136183500289917, 1.6335437297821045, 1.7534692287445068, 1.87339448928833, 1.9933199882507324, 2.1132454872131348, 2.233170747756958, 2.3530960083007812, 2.4730215072631836, 2.592946767807007, 2.712872266769409, 2.8327975273132324, 2.9527230262756348, 3.072648525238037, 3.1925737857818604, 3.3124992847442627]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 14.0, 9.0, 23.0, 47.0, 51.0, 62.0, 109.0, 198.0, 321.0, 591.0, 1046.0, 2020.0, 4329.0, 10993.0, 36913.0, 158510.0, 472342.0, 269680.0, 62769.0, 16905.0, 6011.0, 2564.0, 1265.0, 695.0, 398.0, 221.0, 146.0, 98.0, 62.0, 47.0, 28.0, 18.0, 13.0, 7.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5537109375, -1.503082275390625, -1.45245361328125, -1.401824951171875, -1.3511962890625, -1.300567626953125, -1.24993896484375, -1.199310302734375, -1.148681640625, -1.098052978515625, -1.04742431640625, -0.996795654296875, -0.9461669921875, -0.895538330078125, -0.84490966796875, -0.794281005859375, -0.74365234375, -0.693023681640625, -0.64239501953125, -0.591766357421875, -0.5411376953125, -0.490509033203125, -0.43988037109375, -0.389251708984375, -0.338623046875, -0.287994384765625, -0.23736572265625, -0.186737060546875, -0.1361083984375, -0.085479736328125, -0.03485107421875, 0.015777587890625, 0.06640625, 0.117034912109375, 0.16766357421875, 0.218292236328125, 0.2689208984375, 0.319549560546875, 0.37017822265625, 0.420806884765625, 0.471435546875, 0.522064208984375, 0.57269287109375, 0.623321533203125, 0.6739501953125, 0.724578857421875, 0.77520751953125, 0.825836181640625, 0.87646484375, 0.927093505859375, 0.97772216796875, 1.028350830078125, 1.0789794921875, 1.129608154296875, 1.18023681640625, 1.230865478515625, 1.281494140625, 1.332122802734375, 1.38275146484375, 1.433380126953125, 1.4840087890625, 1.534637451171875, 1.58526611328125, 1.635894775390625, 1.6865234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 15.0, 24.0, 32.0, 46.0, 60.0, 65.0, 92.0, 107.0, 99.0, 87.0, 82.0, 75.0, 52.0, 51.0, 30.0, 16.0, 15.0, 13.0, 8.0, 6.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.762908935546875, -0.73626708984375, -0.709625244140625, -0.6829833984375, -0.656341552734375, -0.62969970703125, -0.603057861328125, -0.576416015625, -0.549774169921875, -0.52313232421875, -0.496490478515625, -0.4698486328125, -0.443206787109375, -0.41656494140625, -0.389923095703125, -0.36328125, -0.336639404296875, -0.30999755859375, -0.283355712890625, -0.2567138671875, -0.230072021484375, -0.20343017578125, -0.176788330078125, -0.150146484375, -0.123504638671875, -0.09686279296875, -0.070220947265625, -0.0435791015625, -0.016937255859375, 0.00970458984375, 0.036346435546875, 0.06298828125, 0.089630126953125, 0.11627197265625, 0.142913818359375, 0.1695556640625, 0.196197509765625, 0.22283935546875, 0.249481201171875, 0.276123046875, 0.302764892578125, 0.32940673828125, 0.356048583984375, 0.3826904296875, 0.409332275390625, 0.43597412109375, 0.462615966796875, 0.4892578125, 0.515899658203125, 0.54254150390625, 0.569183349609375, 0.5958251953125, 0.622467041015625, 0.64910888671875, 0.675750732421875, 0.702392578125, 0.729034423828125, 0.75567626953125, 0.782318115234375, 0.8089599609375, 0.835601806640625, 0.86224365234375, 0.888885498046875, 0.91552734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 12.0, 11.0, 18.0, 26.0, 51.0, 47.0, 71.0, 76.0, 123.0, 224.0, 353.0, 696.0, 1651.0, 5635.0, 28353.0, 180515.0, 556199.0, 227576.0, 36233.0, 6949.0, 1890.0, 746.0, 357.0, 211.0, 131.0, 101.0, 72.0, 46.0, 39.0, 31.0, 25.0, 18.0, 12.0, 4.0, 11.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.58978271484375, -1.5360107421875, -1.48223876953125, -1.428466796875, -1.37469482421875, -1.3209228515625, -1.26715087890625, -1.21337890625, -1.15960693359375, -1.1058349609375, -1.05206298828125, -0.998291015625, -0.94451904296875, -0.8907470703125, -0.83697509765625, -0.783203125, -0.72943115234375, -0.6756591796875, -0.62188720703125, -0.568115234375, -0.51434326171875, -0.4605712890625, -0.40679931640625, -0.35302734375, -0.29925537109375, -0.2454833984375, -0.19171142578125, -0.137939453125, -0.08416748046875, -0.0303955078125, 0.02337646484375, 0.0771484375, 0.13092041015625, 0.1846923828125, 0.23846435546875, 0.292236328125, 0.34600830078125, 0.3997802734375, 0.45355224609375, 0.50732421875, 0.56109619140625, 0.6148681640625, 0.66864013671875, 0.722412109375, 0.77618408203125, 0.8299560546875, 0.88372802734375, 0.9375, 0.99127197265625, 1.0450439453125, 1.09881591796875, 1.152587890625, 1.20635986328125, 1.2601318359375, 1.31390380859375, 1.36767578125, 1.42144775390625, 1.4752197265625, 1.52899169921875, 1.582763671875, 1.63653564453125, 1.6903076171875, 1.74407958984375, 1.7978515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 1.0, 5.0, 1.0, 6.0, 7.0, 10.0, 7.0, 8.0, 12.0, 21.0, 21.0, 27.0, 28.0, 29.0, 41.0, 39.0, 33.0, 27.0, 51.0, 45.0, 53.0, 38.0, 43.0, 49.0, 47.0, 50.0, 41.0, 43.0, 40.0, 31.0, 16.0, 26.0, 18.0, 10.0, 17.0, 10.0, 8.0, 6.0, 5.0, 6.0, 7.0, 6.0, 4.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8916015625, -1.8349151611328125, -1.778228759765625, -1.7215423583984375, -1.66485595703125, -1.6081695556640625, -1.551483154296875, -1.4947967529296875, -1.4381103515625, -1.3814239501953125, -1.324737548828125, -1.2680511474609375, -1.21136474609375, -1.1546783447265625, -1.097991943359375, -1.0413055419921875, -0.984619140625, -0.9279327392578125, -0.871246337890625, -0.8145599365234375, -0.75787353515625, -0.7011871337890625, -0.644500732421875, -0.5878143310546875, -0.5311279296875, -0.4744415283203125, -0.417755126953125, -0.3610687255859375, -0.30438232421875, -0.2476959228515625, -0.191009521484375, -0.1343231201171875, -0.07763671875, -0.0209503173828125, 0.035736083984375, 0.0924224853515625, 0.14910888671875, 0.2057952880859375, 0.262481689453125, 0.3191680908203125, 0.3758544921875, 0.4325408935546875, 0.489227294921875, 0.5459136962890625, 0.60260009765625, 0.6592864990234375, 0.715972900390625, 0.7726593017578125, 0.829345703125, 0.8860321044921875, 0.942718505859375, 0.9994049072265625, 1.05609130859375, 1.1127777099609375, 1.169464111328125, 1.2261505126953125, 1.2828369140625, 1.3395233154296875, 1.396209716796875, 1.4528961181640625, 1.50958251953125, 1.5662689208984375, 1.622955322265625, 1.6796417236328125, 1.736328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 14.0, 38.0, 71.0, 222.0, 851.0, 13236.0, 961997.0, 69558.0, 1996.0, 337.0, 143.0, 50.0, 13.0, 13.0, 10.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.2746124267578125, -1.225006103515625, -1.1753997802734375, -1.12579345703125, -1.0761871337890625, -1.026580810546875, -0.9769744873046875, -0.9273681640625, -0.8777618408203125, -0.828155517578125, -0.7785491943359375, -0.72894287109375, -0.6793365478515625, -0.629730224609375, -0.5801239013671875, -0.530517578125, -0.4809112548828125, -0.431304931640625, -0.3816986083984375, -0.33209228515625, -0.2824859619140625, -0.232879638671875, -0.1832733154296875, -0.1336669921875, -0.0840606689453125, -0.034454345703125, 0.0151519775390625, 0.06475830078125, 0.1143646240234375, 0.163970947265625, 0.2135772705078125, 0.26318359375, 0.3127899169921875, 0.362396240234375, 0.4120025634765625, 0.46160888671875, 0.5112152099609375, 0.560821533203125, 0.6104278564453125, 0.6600341796875, 0.7096405029296875, 0.759246826171875, 0.8088531494140625, 0.85845947265625, 0.9080657958984375, 0.957672119140625, 1.0072784423828125, 1.056884765625, 1.1064910888671875, 1.156097412109375, 1.2057037353515625, 1.25531005859375, 1.3049163818359375, 1.354522705078125, 1.4041290283203125, 1.4537353515625, 1.5033416748046875, 1.552947998046875, 1.6025543212890625, 1.65216064453125, 1.7017669677734375, 1.751373291015625, 1.8009796142578125, 1.8505859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 7.0, 6.0, 7.0, 6.0, 7.0, 10.0, 21.0, 26.0, 32.0, 48.0, 105.0, 130.0, 172.0, 140.0, 92.0, 55.0, 27.0, 18.0, 20.0, 15.0, 9.0, 10.0, 9.0, 11.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001100301742553711, -0.00010601244866847992, -0.00010199472308158875, -9.797699749469757e-05, -9.39592719078064e-05, -8.994154632091522e-05, -8.592382073402405e-05, -8.190609514713287e-05, -7.78883695602417e-05, -7.387064397335052e-05, -6.985291838645935e-05, -6.583519279956818e-05, -6.1817467212677e-05, -5.779974162578583e-05, -5.378201603889465e-05, -4.976429045200348e-05, -4.5746564865112305e-05, -4.172883927822113e-05, -3.7711113691329956e-05, -3.369338810443878e-05, -2.9675662517547607e-05, -2.5657936930656433e-05, -2.164021134376526e-05, -1.7622485756874084e-05, -1.360476016998291e-05, -9.587034583091736e-06, -5.5693089962005615e-06, -1.5515834093093872e-06, 2.466142177581787e-06, 6.4838677644729614e-06, 1.0501593351364136e-05, 1.451931893825531e-05, 1.8537044525146484e-05, 2.255477011203766e-05, 2.6572495698928833e-05, 3.059022128582001e-05, 3.460794687271118e-05, 3.8625672459602356e-05, 4.264339804649353e-05, 4.6661123633384705e-05, 5.067884922027588e-05, 5.469657480716705e-05, 5.871430039405823e-05, 6.27320259809494e-05, 6.674975156784058e-05, 7.076747715473175e-05, 7.478520274162292e-05, 7.88029283285141e-05, 8.282065391540527e-05, 8.683837950229645e-05, 9.085610508918762e-05, 9.48738306760788e-05, 9.889155626296997e-05, 0.00010290928184986115, 0.00010692700743675232, 0.0001109447330236435, 0.00011496245861053467, 0.00011898018419742584, 0.00012299790978431702, 0.0001270156353712082, 0.00013103336095809937, 0.00013505108654499054, 0.00013906881213188171, 0.0001430865377187729, 0.00014710426330566406]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 18.0, 26.0, 52.0, 102.0, 172.0, 333.0, 1047.0, 12908.0, 901441.0, 127965.0, 3363.0, 568.0, 246.0, 145.0, 78.0, 33.0, 27.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4169921875, -1.372406005859375, -1.32781982421875, -1.283233642578125, -1.2386474609375, -1.194061279296875, -1.14947509765625, -1.104888916015625, -1.060302734375, -1.015716552734375, -0.97113037109375, -0.926544189453125, -0.8819580078125, -0.837371826171875, -0.79278564453125, -0.748199462890625, -0.70361328125, -0.659027099609375, -0.61444091796875, -0.569854736328125, -0.5252685546875, -0.480682373046875, -0.43609619140625, -0.391510009765625, -0.346923828125, -0.302337646484375, -0.25775146484375, -0.213165283203125, -0.1685791015625, -0.123992919921875, -0.07940673828125, -0.034820556640625, 0.009765625, 0.054351806640625, 0.09893798828125, 0.143524169921875, 0.1881103515625, 0.232696533203125, 0.27728271484375, 0.321868896484375, 0.366455078125, 0.411041259765625, 0.45562744140625, 0.500213623046875, 0.5447998046875, 0.589385986328125, 0.63397216796875, 0.678558349609375, 0.72314453125, 0.767730712890625, 0.81231689453125, 0.856903076171875, 0.9014892578125, 0.946075439453125, 0.99066162109375, 1.035247802734375, 1.079833984375, 1.124420166015625, 1.16900634765625, 1.213592529296875, 1.2581787109375, 1.302764892578125, 1.34735107421875, 1.391937255859375, 1.4365234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 16.0, 18.0, 32.0, 64.0, 140.0, 269.0, 210.0, 106.0, 64.0, 31.0, 21.0, 8.0, 11.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7593231201171875, -0.727630615234375, -0.6959381103515625, -0.66424560546875, -0.6325531005859375, -0.600860595703125, -0.5691680908203125, -0.5374755859375, -0.5057830810546875, -0.474090576171875, -0.4423980712890625, -0.41070556640625, -0.3790130615234375, -0.347320556640625, -0.3156280517578125, -0.283935546875, -0.2522430419921875, -0.220550537109375, -0.1888580322265625, -0.15716552734375, -0.1254730224609375, -0.093780517578125, -0.0620880126953125, -0.0303955078125, 0.0012969970703125, 0.032989501953125, 0.0646820068359375, 0.09637451171875, 0.1280670166015625, 0.159759521484375, 0.1914520263671875, 0.22314453125, 0.2548370361328125, 0.286529541015625, 0.3182220458984375, 0.34991455078125, 0.3816070556640625, 0.413299560546875, 0.4449920654296875, 0.4766845703125, 0.5083770751953125, 0.540069580078125, 0.5717620849609375, 0.60345458984375, 0.6351470947265625, 0.666839599609375, 0.6985321044921875, 0.730224609375, 0.7619171142578125, 0.793609619140625, 0.8253021240234375, 0.85699462890625, 0.8886871337890625, 0.920379638671875, 0.9520721435546875, 0.9837646484375, 1.0154571533203125, 1.047149658203125, 1.0788421630859375, 1.11053466796875, 1.1422271728515625, 1.173919677734375, 1.2056121826171875, 1.2373046875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 15.0, 20.0, 36.0, 51.0, 82.0, 102.0, 168.0, 146.0, 116.0, 99.0, 72.0, 29.0, 19.0, 11.0, 11.0, 6.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.52981948852539, -12.206793785095215, -11.883768081665039, -11.560742378234863, -11.237716674804688, -10.914690971374512, -10.591665267944336, -10.26863956451416, -9.945613861083984, -9.622588157653809, -9.299562454223633, -8.976536750793457, -8.653511047363281, -8.330485343933105, -8.00745964050293, -7.684433937072754, -7.361408233642578, -7.038382530212402, -6.715356826782227, -6.392331123352051, -6.069305419921875, -5.746279716491699, -5.423254013061523, -5.100228309631348, -4.777202606201172, -4.454176902770996, -4.13115119934082, -3.8081254959106445, -3.4850997924804688, -3.162074089050293, -2.839048385620117, -2.5160226821899414, -2.1929969787597656, -1.8699712753295898, -1.546945571899414, -1.2239198684692383, -0.9008941650390625, -0.5778684616088867, -0.25484275817871094, 0.06818294525146484, 0.3912086486816406, 0.7142343521118164, 1.0372600555419922, 1.360285758972168, 1.6833114624023438, 2.0063371658325195, 2.3293628692626953, 2.652388572692871, 2.975414276123047, 3.2984399795532227, 3.6214656829833984, 3.944491386413574, 4.26751708984375, 4.590542793273926, 4.913568496704102, 5.236594200134277, 5.559619903564453, 5.882645606994629, 6.205671310424805, 6.5286970138549805, 6.851722717285156, 7.174748420715332, 7.497774124145508, 7.820799827575684, 8.14382553100586]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 4.0, 7.0, 8.0, 5.0, 17.0, 15.0, 19.0, 16.0, 18.0, 18.0, 18.0, 31.0, 35.0, 27.0, 46.0, 39.0, 42.0, 45.0, 41.0, 51.0, 40.0, 46.0, 35.0, 45.0, 32.0, 35.0, 34.0, 26.0, 27.0, 33.0, 20.0, 29.0, 19.0, 16.0, 15.0, 6.0, 6.0, 8.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.699926376342773, -9.414116859436035, -9.128307342529297, -8.842498779296875, -8.556689262390137, -8.270879745483398, -7.985070705413818, -7.699261665344238, -7.4134521484375, -7.127642631530762, -6.841833591461182, -6.556024551391602, -6.270215034484863, -5.984405517578125, -5.698596477508545, -5.412787437438965, -5.126977920532227, -4.841168403625488, -4.555359363555908, -4.269550323486328, -3.98374080657959, -3.6979315280914307, -3.4121222496032715, -3.1263129711151123, -2.840503692626953, -2.554694414138794, -2.2688851356506348, -1.9830758571624756, -1.6972665786743164, -1.4114573001861572, -1.125648021697998, -0.8398387432098389, -0.5540294647216797, -0.2682201862335205, 0.017589092254638672, 0.30339837074279785, 0.589207649230957, 0.8750169277191162, 1.1608262062072754, 1.4466354846954346, 1.7324447631835938, 2.018254041671753, 2.304063320159912, 2.5898725986480713, 2.8756818771362305, 3.1614911556243896, 3.447300434112549, 3.733109712600708, 4.018918991088867, 4.3047285079956055, 4.5905375480651855, 4.876346588134766, 5.162156105041504, 5.447965621948242, 5.733774662017822, 6.019583702087402, 6.305393218994141, 6.591202735900879, 6.877011775970459, 7.162820816040039, 7.448630332946777, 7.734439849853516, 8.020248413085938, 8.306057929992676, 8.591867446899414]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 11.0, 14.0, 25.0, 25.0, 26.0, 49.0, 115.0, 206.0, 413.0, 1086.0, 3197.0, 14453.0, 211746.0, 3913906.0, 39010.0, 6651.0, 1866.0, 740.0, 302.0, 180.0, 82.0, 55.0, 36.0, 23.0, 16.0, 12.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.4453125, -3.359710693359375, -3.27410888671875, -3.188507080078125, -3.1029052734375, -3.017303466796875, -2.93170166015625, -2.846099853515625, -2.760498046875, -2.674896240234375, -2.58929443359375, -2.503692626953125, -2.4180908203125, -2.332489013671875, -2.24688720703125, -2.161285400390625, -2.07568359375, -1.990081787109375, -1.90447998046875, -1.818878173828125, -1.7332763671875, -1.647674560546875, -1.56207275390625, -1.476470947265625, -1.390869140625, -1.305267333984375, -1.21966552734375, -1.134063720703125, -1.0484619140625, -0.962860107421875, -0.87725830078125, -0.791656494140625, -0.7060546875, -0.620452880859375, -0.53485107421875, -0.449249267578125, -0.3636474609375, -0.278045654296875, -0.19244384765625, -0.106842041015625, -0.021240234375, 0.064361572265625, 0.14996337890625, 0.235565185546875, 0.3211669921875, 0.406768798828125, 0.49237060546875, 0.577972412109375, 0.66357421875, 0.749176025390625, 0.83477783203125, 0.920379638671875, 1.0059814453125, 1.091583251953125, 1.17718505859375, 1.262786865234375, 1.348388671875, 1.433990478515625, 1.51959228515625, 1.605194091796875, 1.6907958984375, 1.776397705078125, 1.86199951171875, 1.947601318359375, 2.033203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 9.0, 15.0, 25.0, 30.0, 40.0, 64.0, 60.0, 81.0, 91.0, 90.0, 83.0, 88.0, 80.0, 42.0, 53.0, 32.0, 31.0, 31.0, 15.0, 4.0, 10.0, 9.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7905960083007812, -0.7633209228515625, -0.7360458374023438, -0.708770751953125, -0.6814956665039062, -0.6542205810546875, -0.6269454956054688, -0.59967041015625, -0.5723953247070312, -0.5451202392578125, -0.5178451538085938, -0.490570068359375, -0.46329498291015625, -0.4360198974609375, -0.40874481201171875, -0.3814697265625, -0.35419464111328125, -0.3269195556640625, -0.29964447021484375, -0.272369384765625, -0.24509429931640625, -0.2178192138671875, -0.19054412841796875, -0.16326904296875, -0.13599395751953125, -0.1087188720703125, -0.08144378662109375, -0.054168701171875, -0.02689361572265625, 0.0003814697265625, 0.02765655517578125, 0.054931640625, 0.08220672607421875, 0.1094818115234375, 0.13675689697265625, 0.164031982421875, 0.19130706787109375, 0.2185821533203125, 0.24585723876953125, 0.27313232421875, 0.30040740966796875, 0.3276824951171875, 0.35495758056640625, 0.382232666015625, 0.40950775146484375, 0.4367828369140625, 0.46405792236328125, 0.4913330078125, 0.5186080932617188, 0.5458831787109375, 0.5731582641601562, 0.600433349609375, 0.6277084350585938, 0.6549835205078125, 0.6822586059570312, 0.70953369140625, 0.7368087768554688, 0.7640838623046875, 0.7913589477539062, 0.818634033203125, 0.8459091186523438, 0.8731842041015625, 0.9004592895507812, 0.927734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 9.0, 8.0, 27.0, 29.0, 62.0, 104.0, 182.0, 293.0, 580.0, 1121.0, 2431.0, 6099.0, 20252.0, 116067.0, 3517426.0, 472117.0, 40743.0, 10029.0, 3510.0, 1543.0, 749.0, 413.0, 218.0, 105.0, 71.0, 34.0, 14.0, 12.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.390625, -1.3527679443359375, -1.314910888671875, -1.2770538330078125, -1.23919677734375, -1.2013397216796875, -1.163482666015625, -1.1256256103515625, -1.0877685546875, -1.0499114990234375, -1.012054443359375, -0.9741973876953125, -0.93634033203125, -0.8984832763671875, -0.860626220703125, -0.8227691650390625, -0.784912109375, -0.7470550537109375, -0.709197998046875, -0.6713409423828125, -0.63348388671875, -0.5956268310546875, -0.557769775390625, -0.5199127197265625, -0.4820556640625, -0.4441986083984375, -0.406341552734375, -0.3684844970703125, -0.33062744140625, -0.2927703857421875, -0.254913330078125, -0.2170562744140625, -0.17919921875, -0.1413421630859375, -0.103485107421875, -0.0656280517578125, -0.02777099609375, 0.0100860595703125, 0.047943115234375, 0.0858001708984375, 0.1236572265625, 0.1615142822265625, 0.199371337890625, 0.2372283935546875, 0.27508544921875, 0.3129425048828125, 0.350799560546875, 0.3886566162109375, 0.426513671875, 0.4643707275390625, 0.502227783203125, 0.5400848388671875, 0.57794189453125, 0.6157989501953125, 0.653656005859375, 0.6915130615234375, 0.7293701171875, 0.7672271728515625, 0.805084228515625, 0.8429412841796875, 0.88079833984375, 0.9186553955078125, 0.956512451171875, 0.9943695068359375, 1.0322265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 5.0, 5.0, 7.0, 6.0, 5.0, 19.0, 31.0, 36.0, 51.0, 101.0, 199.0, 657.0, 1963.0, 602.0, 188.0, 63.0, 49.0, 23.0, 19.0, 6.0, 16.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59912109375, -0.5800552368164062, -0.5609893798828125, -0.5419235229492188, -0.522857666015625, -0.5037918090820312, -0.4847259521484375, -0.46566009521484375, -0.44659423828125, -0.42752838134765625, -0.4084625244140625, -0.38939666748046875, -0.370330810546875, -0.35126495361328125, -0.3321990966796875, -0.31313323974609375, -0.2940673828125, -0.27500152587890625, -0.2559356689453125, -0.23686981201171875, -0.217803955078125, -0.19873809814453125, -0.1796722412109375, -0.16060638427734375, -0.14154052734375, -0.12247467041015625, -0.1034088134765625, -0.08434295654296875, -0.065277099609375, -0.04621124267578125, -0.0271453857421875, -0.00807952880859375, 0.010986328125, 0.03005218505859375, 0.0491180419921875, 0.06818389892578125, 0.087249755859375, 0.10631561279296875, 0.1253814697265625, 0.14444732666015625, 0.16351318359375, 0.18257904052734375, 0.2016448974609375, 0.22071075439453125, 0.239776611328125, 0.25884246826171875, 0.2779083251953125, 0.29697418212890625, 0.3160400390625, 0.33510589599609375, 0.3541717529296875, 0.37323760986328125, 0.392303466796875, 0.41136932373046875, 0.4304351806640625, 0.44950103759765625, 0.46856689453125, 0.48763275146484375, 0.5066986083984375, 0.5257644653320312, 0.544830322265625, 0.5638961791992188, 0.5829620361328125, 0.6020278930664062, 0.62109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 17.0, 41.0, 69.0, 168.0, 233.0, 197.0, 143.0, 68.0, 32.0, 20.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.956377029418945, -5.837344646453857, -5.7183122634887695, -5.599279880523682, -5.480247497558594, -5.361215114593506, -5.242182731628418, -5.12315034866333, -5.004117965698242, -4.885085582733154, -4.766053199768066, -4.6470208168029785, -4.527988433837891, -4.408956050872803, -4.289923667907715, -4.170891284942627, -4.051859378814697, -3.9328269958496094, -3.8137946128845215, -3.6947622299194336, -3.5757298469543457, -3.456697463989258, -3.33766508102417, -3.218632936477661, -3.099600315093994, -2.9805679321289062, -2.8615355491638184, -2.7425031661987305, -2.6234707832336426, -2.5044384002685547, -2.385406017303467, -2.266373872756958, -2.147341728210449, -2.0283093452453613, -1.9092769622802734, -1.7902445793151855, -1.6712123155593872, -1.5521799325942993, -1.4331475496292114, -1.314115285873413, -1.195082664489746, -1.0760502815246582, -0.9570179581642151, -0.8379855751991272, -0.7189532518386841, -0.5999208688735962, -0.4808884859085083, -0.3618561625480652, -0.24282383918762207, -0.12379147857427597, -0.004759117960929871, 0.11427325010299683, 0.23330560326576233, 0.35233795642852783, 0.4713703393936157, 0.5904026627540588, 0.7094350457191467, 0.8284674286842346, 0.9474997520446777, 1.0665321350097656, 1.1855645179748535, 1.3045969009399414, 1.4236292839050293, 1.5426615476608276, 1.6616939306259155]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 10.0, 2.0, 7.0, 12.0, 15.0, 16.0, 33.0, 17.0, 28.0, 48.0, 51.0, 48.0, 35.0, 63.0, 53.0, 57.0, 68.0, 57.0, 52.0, 53.0, 50.0, 40.0, 37.0, 43.0, 22.0, 11.0, 18.0, 15.0, 8.0, 12.0, 8.0, 11.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8646903038024902, -1.8038054704666138, -1.7429205179214478, -1.6820356845855713, -1.6211508512496948, -1.5602658987045288, -1.4993810653686523, -1.4384961128234863, -1.3776112794876099, -1.3167264461517334, -1.2558414936065674, -1.194956660270691, -1.1340718269348145, -1.0731868743896484, -1.012302041053772, -0.9514171481132507, -0.8905323147773743, -0.829647421836853, -0.7687625885009766, -0.7078776955604553, -0.6469928026199341, -0.5861079692840576, -0.5252230763435364, -0.46433818340301514, -0.4034533202648163, -0.34256845712661743, -0.2816835641860962, -0.22079870104789734, -0.1599138230085373, -0.09902894496917725, -0.038144081830978394, 0.022740811109542847, 0.0836256742477417, 0.14451055228710175, 0.2053954303264618, 0.26628029346466064, 0.3271651864051819, 0.38805004954338074, 0.4489349126815796, 0.5098198056221008, 0.5707046985626221, 0.6315895915031433, 0.6924744248390198, 0.753359317779541, 0.8142442107200623, 0.8751291036605835, 0.93601393699646, 0.9968988299369812, 1.057783603668213, 1.1186684370040894, 1.1795533895492554, 1.2404382228851318, 1.3013230562210083, 1.3622080087661743, 1.4230928421020508, 1.4839777946472168, 1.5448626279830933, 1.6057474613189697, 1.6666324138641357, 1.7275172472000122, 1.7884020805358887, 1.8492870330810547, 1.9101718664169312, 1.9710566997528076, 2.0319416522979736]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 11.0, 18.0, 25.0, 35.0, 58.0, 106.0, 229.0, 409.0, 777.0, 2107.0, 6448.0, 30488.0, 218792.0, 600782.0, 157078.0, 22828.0, 5174.0, 1607.0, 721.0, 365.0, 203.0, 117.0, 62.0, 42.0, 18.0, 14.0, 12.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.286590576171875, -2.21380615234375, -2.141021728515625, -2.0682373046875, -1.995452880859375, -1.92266845703125, -1.849884033203125, -1.777099609375, -1.704315185546875, -1.63153076171875, -1.558746337890625, -1.4859619140625, -1.413177490234375, -1.34039306640625, -1.267608642578125, -1.19482421875, -1.122039794921875, -1.04925537109375, -0.976470947265625, -0.9036865234375, -0.830902099609375, -0.75811767578125, -0.685333251953125, -0.612548828125, -0.539764404296875, -0.46697998046875, -0.394195556640625, -0.3214111328125, -0.248626708984375, -0.17584228515625, -0.103057861328125, -0.0302734375, 0.042510986328125, 0.11529541015625, 0.188079833984375, 0.2608642578125, 0.333648681640625, 0.40643310546875, 0.479217529296875, 0.552001953125, 0.624786376953125, 0.69757080078125, 0.770355224609375, 0.8431396484375, 0.915924072265625, 0.98870849609375, 1.061492919921875, 1.13427734375, 1.207061767578125, 1.27984619140625, 1.352630615234375, 1.4254150390625, 1.498199462890625, 1.57098388671875, 1.643768310546875, 1.716552734375, 1.789337158203125, 1.86212158203125, 1.934906005859375, 2.0076904296875, 2.080474853515625, 2.15325927734375, 2.226043701171875, 2.298828125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 7.0, 13.0, 18.0, 39.0, 40.0, 57.0, 65.0, 92.0, 78.0, 88.0, 77.0, 88.0, 81.0, 46.0, 48.0, 43.0, 27.0, 29.0, 18.0, 8.0, 5.0, 8.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7978515625, -0.7712860107421875, -0.744720458984375, -0.7181549072265625, -0.69158935546875, -0.6650238037109375, -0.638458251953125, -0.6118927001953125, -0.5853271484375, -0.5587615966796875, -0.532196044921875, -0.5056304931640625, -0.47906494140625, -0.4524993896484375, -0.425933837890625, -0.3993682861328125, -0.372802734375, -0.3462371826171875, -0.319671630859375, -0.2931060791015625, -0.26654052734375, -0.2399749755859375, -0.213409423828125, -0.1868438720703125, -0.1602783203125, -0.1337127685546875, -0.107147216796875, -0.0805816650390625, -0.05401611328125, -0.0274505615234375, -0.000885009765625, 0.0256805419921875, 0.05224609375, 0.0788116455078125, 0.105377197265625, 0.1319427490234375, 0.15850830078125, 0.1850738525390625, 0.211639404296875, 0.2382049560546875, 0.2647705078125, 0.2913360595703125, 0.317901611328125, 0.3444671630859375, 0.37103271484375, 0.3975982666015625, 0.424163818359375, 0.4507293701171875, 0.477294921875, 0.5038604736328125, 0.530426025390625, 0.5569915771484375, 0.58355712890625, 0.6101226806640625, 0.636688232421875, 0.6632537841796875, 0.6898193359375, 0.7163848876953125, 0.742950439453125, 0.7695159912109375, 0.79608154296875, 0.8226470947265625, 0.849212646484375, 0.8757781982421875, 0.90234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 4.0, 3.0, 11.0, 12.0, 15.0, 26.0, 36.0, 27.0, 47.0, 62.0, 85.0, 118.0, 192.0, 299.0, 551.0, 1428.0, 4477.0, 17825.0, 80634.0, 314997.0, 441268.0, 142915.0, 31959.0, 7522.0, 2161.0, 789.0, 358.0, 200.0, 148.0, 105.0, 71.0, 46.0, 55.0, 28.0, 21.0, 14.0, 11.0, 10.0, 8.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.51171875, -1.4632568359375, -1.414794921875, -1.3663330078125, -1.31787109375, -1.2694091796875, -1.220947265625, -1.1724853515625, -1.1240234375, -1.0755615234375, -1.027099609375, -0.9786376953125, -0.93017578125, -0.8817138671875, -0.833251953125, -0.7847900390625, -0.736328125, -0.6878662109375, -0.639404296875, -0.5909423828125, -0.54248046875, -0.4940185546875, -0.445556640625, -0.3970947265625, -0.3486328125, -0.3001708984375, -0.251708984375, -0.2032470703125, -0.15478515625, -0.1063232421875, -0.057861328125, -0.0093994140625, 0.0390625, 0.0875244140625, 0.135986328125, 0.1844482421875, 0.23291015625, 0.2813720703125, 0.329833984375, 0.3782958984375, 0.4267578125, 0.4752197265625, 0.523681640625, 0.5721435546875, 0.62060546875, 0.6690673828125, 0.717529296875, 0.7659912109375, 0.814453125, 0.8629150390625, 0.911376953125, 0.9598388671875, 1.00830078125, 1.0567626953125, 1.105224609375, 1.1536865234375, 1.2021484375, 1.2506103515625, 1.299072265625, 1.3475341796875, 1.39599609375, 1.4444580078125, 1.492919921875, 1.5413818359375, 1.58984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 1.0, 13.0, 6.0, 14.0, 11.0, 13.0, 21.0, 16.0, 26.0, 28.0, 17.0, 39.0, 33.0, 28.0, 40.0, 41.0, 24.0, 38.0, 36.0, 49.0, 47.0, 37.0, 47.0, 48.0, 43.0, 29.0, 36.0, 19.0, 30.0, 32.0, 20.0, 19.0, 21.0, 12.0, 14.0, 9.0, 4.0, 7.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.880859375, -1.8241424560546875, -1.767425537109375, -1.7107086181640625, -1.65399169921875, -1.5972747802734375, -1.540557861328125, -1.4838409423828125, -1.4271240234375, -1.3704071044921875, -1.313690185546875, -1.2569732666015625, -1.20025634765625, -1.1435394287109375, -1.086822509765625, -1.0301055908203125, -0.973388671875, -0.9166717529296875, -0.859954833984375, -0.8032379150390625, -0.74652099609375, -0.6898040771484375, -0.633087158203125, -0.5763702392578125, -0.5196533203125, -0.4629364013671875, -0.406219482421875, -0.3495025634765625, -0.29278564453125, -0.2360687255859375, -0.179351806640625, -0.1226348876953125, -0.06591796875, -0.0092010498046875, 0.047515869140625, 0.1042327880859375, 0.16094970703125, 0.2176666259765625, 0.274383544921875, 0.3311004638671875, 0.3878173828125, 0.4445343017578125, 0.501251220703125, 0.5579681396484375, 0.61468505859375, 0.6714019775390625, 0.728118896484375, 0.7848358154296875, 0.841552734375, 0.8982696533203125, 0.954986572265625, 1.0117034912109375, 1.06842041015625, 1.1251373291015625, 1.181854248046875, 1.2385711669921875, 1.2952880859375, 1.3520050048828125, 1.408721923828125, 1.4654388427734375, 1.52215576171875, 1.5788726806640625, 1.635589599609375, 1.6923065185546875, 1.7490234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 10.0, 8.0, 19.0, 32.0, 42.0, 69.0, 105.0, 178.0, 308.0, 559.0, 1123.0, 3089.0, 10590.0, 61957.0, 712128.0, 226757.0, 22689.0, 5320.0, 1860.0, 754.0, 400.0, 210.0, 136.0, 86.0, 43.0, 25.0, 13.0, 17.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6217727661132812, -0.5985260009765625, -0.5752792358398438, -0.552032470703125, -0.5287857055664062, -0.5055389404296875, -0.48229217529296875, -0.45904541015625, -0.43579864501953125, -0.4125518798828125, -0.38930511474609375, -0.366058349609375, -0.34281158447265625, -0.3195648193359375, -0.29631805419921875, -0.2730712890625, -0.24982452392578125, -0.2265777587890625, -0.20333099365234375, -0.180084228515625, -0.15683746337890625, -0.1335906982421875, -0.11034393310546875, -0.08709716796875, -0.06385040283203125, -0.0406036376953125, -0.01735687255859375, 0.005889892578125, 0.02913665771484375, 0.0523834228515625, 0.07563018798828125, 0.098876953125, 0.12212371826171875, 0.1453704833984375, 0.16861724853515625, 0.191864013671875, 0.21511077880859375, 0.2383575439453125, 0.26160430908203125, 0.28485107421875, 0.30809783935546875, 0.3313446044921875, 0.35459136962890625, 0.377838134765625, 0.40108489990234375, 0.4243316650390625, 0.44757843017578125, 0.4708251953125, 0.49407196044921875, 0.5173187255859375, 0.5405654907226562, 0.563812255859375, 0.5870590209960938, 0.6103057861328125, 0.6335525512695312, 0.65679931640625, 0.6800460815429688, 0.7032928466796875, 0.7265396118164062, 0.749786376953125, 0.7730331420898438, 0.7962799072265625, 0.8195266723632812, 0.8427734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 4.0, 16.0, 13.0, 16.0, 31.0, 23.0, 36.0, 67.0, 113.0, 145.0, 148.0, 123.0, 75.0, 37.0, 22.0, 19.0, 15.0, 22.0, 8.0, 8.0, 9.0, 6.0, 5.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011658668518066406, -0.00011258013546466827, -0.00010857358574867249, -0.0001045670360326767, -0.00010056048631668091, -9.655393660068512e-05, -9.254738688468933e-05, -8.854083716869354e-05, -8.453428745269775e-05, -8.052773773670197e-05, -7.652118802070618e-05, -7.251463830471039e-05, -6.85080885887146e-05, -6.450153887271881e-05, -6.049498915672302e-05, -5.6488439440727234e-05, -5.2481889724731445e-05, -4.847534000873566e-05, -4.446879029273987e-05, -4.046224057674408e-05, -3.645569086074829e-05, -3.24491411447525e-05, -2.8442591428756714e-05, -2.4436041712760925e-05, -2.0429491996765137e-05, -1.6422942280769348e-05, -1.241639256477356e-05, -8.409842848777771e-06, -4.403293132781982e-06, -3.9674341678619385e-07, 3.6098062992095947e-06, 7.616356015205383e-06, 1.1622905731201172e-05, 1.562945544719696e-05, 1.963600516319275e-05, 2.3642554879188538e-05, 2.7649104595184326e-05, 3.1655654311180115e-05, 3.56622040271759e-05, 3.966875374317169e-05, 4.367530345916748e-05, 4.768185317516327e-05, 5.168840289115906e-05, 5.5694952607154846e-05, 5.9701502323150635e-05, 6.370805203914642e-05, 6.771460175514221e-05, 7.1721151471138e-05, 7.572770118713379e-05, 7.973425090312958e-05, 8.374080061912537e-05, 8.774735033512115e-05, 9.175390005111694e-05, 9.576044976711273e-05, 9.976699948310852e-05, 0.00010377354919910431, 0.0001077800989151001, 0.00011178664863109589, 0.00011579319834709167, 0.00011979974806308746, 0.00012380629777908325, 0.00012781284749507904, 0.00013181939721107483, 0.00013582594692707062, 0.0001398324966430664]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 12.0, 12.0, 17.0, 16.0, 23.0, 31.0, 50.0, 83.0, 166.0, 301.0, 741.0, 2283.0, 11353.0, 151390.0, 830452.0, 43644.0, 5571.0, 1382.0, 475.0, 218.0, 117.0, 72.0, 51.0, 31.0, 20.0, 14.0, 11.0, 9.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.9472732543945312, -0.9170074462890625, -0.8867416381835938, -0.856475830078125, -0.8262100219726562, -0.7959442138671875, -0.7656784057617188, -0.73541259765625, -0.7051467895507812, -0.6748809814453125, -0.6446151733398438, -0.614349365234375, -0.5840835571289062, -0.5538177490234375, -0.5235519409179688, -0.4932861328125, -0.46302032470703125, -0.4327545166015625, -0.40248870849609375, -0.372222900390625, -0.34195709228515625, -0.3116912841796875, -0.28142547607421875, -0.25115966796875, -0.22089385986328125, -0.1906280517578125, -0.16036224365234375, -0.130096435546875, -0.09983062744140625, -0.0695648193359375, -0.03929901123046875, -0.009033203125, 0.02123260498046875, 0.0514984130859375, 0.08176422119140625, 0.112030029296875, 0.14229583740234375, 0.1725616455078125, 0.20282745361328125, 0.23309326171875, 0.26335906982421875, 0.2936248779296875, 0.32389068603515625, 0.354156494140625, 0.38442230224609375, 0.4146881103515625, 0.44495391845703125, 0.4752197265625, 0.5054855346679688, 0.5357513427734375, 0.5660171508789062, 0.596282958984375, 0.6265487670898438, 0.6568145751953125, 0.6870803833007812, 0.71734619140625, 0.7476119995117188, 0.7778778076171875, 0.8081436157226562, 0.838409423828125, 0.8686752319335938, 0.8989410400390625, 0.9292068481445312, 0.95947265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 3.0, 4.0, 14.0, 8.0, 24.0, 32.0, 53.0, 76.0, 117.0, 137.0, 159.0, 133.0, 98.0, 46.0, 37.0, 19.0, 8.0, 10.0, 10.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0859375, -1.0595550537109375, -1.033172607421875, -1.0067901611328125, -0.98040771484375, -0.9540252685546875, -0.927642822265625, -0.9012603759765625, -0.8748779296875, -0.8484954833984375, -0.822113037109375, -0.7957305908203125, -0.76934814453125, -0.7429656982421875, -0.716583251953125, -0.6902008056640625, -0.663818359375, -0.6374359130859375, -0.611053466796875, -0.5846710205078125, -0.55828857421875, -0.5319061279296875, -0.505523681640625, -0.4791412353515625, -0.4527587890625, -0.4263763427734375, -0.399993896484375, -0.3736114501953125, -0.34722900390625, -0.3208465576171875, -0.294464111328125, -0.2680816650390625, -0.24169921875, -0.2153167724609375, -0.188934326171875, -0.1625518798828125, -0.13616943359375, -0.1097869873046875, -0.083404541015625, -0.0570220947265625, -0.0306396484375, -0.0042572021484375, 0.022125244140625, 0.0485076904296875, 0.07489013671875, 0.1012725830078125, 0.127655029296875, 0.1540374755859375, 0.180419921875, 0.2068023681640625, 0.233184814453125, 0.2595672607421875, 0.28594970703125, 0.3123321533203125, 0.338714599609375, 0.3650970458984375, 0.3914794921875, 0.4178619384765625, 0.444244384765625, 0.4706268310546875, 0.49700927734375, 0.5233917236328125, 0.549774169921875, 0.5761566162109375, 0.6025390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 11.0, 29.0, 35.0, 63.0, 122.0, 186.0, 159.0, 162.0, 104.0, 74.0, 33.0, 15.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.934480667114258, -9.527825355529785, -9.121170043945312, -8.71451473236084, -8.307859420776367, -7.9012041091918945, -7.494548797607422, -7.087893486022949, -6.681238174438477, -6.274582862854004, -5.867927551269531, -5.461272239685059, -5.054616928100586, -4.647961616516113, -4.241306304931641, -3.834650754928589, -3.427995204925537, -3.0213398933410645, -2.614684581756592, -2.208029270172119, -1.801373839378357, -1.3947184085845947, -0.9880630970001221, -0.5814077854156494, -0.17475247383117676, 0.2319028675556183, 0.6385582089424133, 1.0452135801315308, 1.4518688917160034, 1.8585243225097656, 2.2651796340942383, 2.671834945678711, 3.0784902572631836, 3.4851455688476562, 3.891800880432129, 4.298456192016602, 4.705111503601074, 5.111766815185547, 5.5184221267700195, 5.925077438354492, 6.331732749938965, 6.7383880615234375, 7.14504337310791, 7.551698684692383, 7.9583539962768555, 8.365009307861328, 8.7716646194458, 9.178319931030273, 9.584976196289062, 9.991631507873535, 10.398286819458008, 10.80494213104248, 11.211597442626953, 11.618252754211426, 12.024908065795898, 12.431563377380371, 12.838218688964844, 13.244874000549316, 13.651529312133789, 14.058184623718262, 14.464839935302734, 14.871495246887207, 15.27815055847168, 15.684805870056152, 16.091461181640625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 10.0, 13.0, 5.0, 10.0, 16.0, 14.0, 21.0, 13.0, 19.0, 30.0, 21.0, 37.0, 35.0, 32.0, 27.0, 43.0, 43.0, 41.0, 38.0, 48.0, 36.0, 29.0, 52.0, 37.0, 41.0, 41.0, 34.0, 27.0, 25.0, 17.0, 23.0, 28.0, 16.0, 10.0, 9.0, 15.0, 6.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.829404830932617, -8.569636344909668, -8.309867858886719, -8.05009937286377, -7.79033088684082, -7.530562400817871, -7.270793914794922, -7.011025428771973, -6.751256942749023, -6.491488456726074, -6.231719970703125, -5.971951484680176, -5.712182998657227, -5.452414512634277, -5.192646026611328, -4.932877540588379, -4.67310905456543, -4.4133405685424805, -4.153572082519531, -3.893803596496582, -3.634035110473633, -3.3742666244506836, -3.1144981384277344, -2.854729652404785, -2.594961166381836, -2.3351926803588867, -2.0754241943359375, -1.8156557083129883, -1.555887222290039, -1.2961187362670898, -1.0363502502441406, -0.7765817642211914, -0.516812801361084, -0.25704431533813477, 0.002724170684814453, 0.26249265670776367, 0.5222611427307129, 0.7820296287536621, 1.0417981147766113, 1.3015666007995605, 1.5613350868225098, 1.821103572845459, 2.080872058868408, 2.3406405448913574, 2.6004090309143066, 2.860177516937256, 3.119946002960205, 3.3797144889831543, 3.6394829750061035, 3.8992514610290527, 4.159019947052002, 4.418788433074951, 4.6785569190979, 4.93832540512085, 5.198093891143799, 5.457862377166748, 5.717630863189697, 5.9773993492126465, 6.237167835235596, 6.496936321258545, 6.756704807281494, 7.016473293304443, 7.276241779327393, 7.536010265350342, 7.795778751373291]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 10.0, 19.0, 22.0, 39.0, 76.0, 113.0, 218.0, 394.0, 852.0, 2054.0, 7237.0, 47796.0, 4006428.0, 112372.0, 11228.0, 3030.0, 1205.0, 499.0, 284.0, 150.0, 78.0, 56.0, 28.0, 22.0, 14.0, 7.0, 6.0, 7.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.03515625, -4.9112548828125, -4.787353515625, -4.6634521484375, -4.53955078125, -4.4156494140625, -4.291748046875, -4.1678466796875, -4.0439453125, -3.9200439453125, -3.796142578125, -3.6722412109375, -3.54833984375, -3.4244384765625, -3.300537109375, -3.1766357421875, -3.052734375, -2.9288330078125, -2.804931640625, -2.6810302734375, -2.55712890625, -2.4332275390625, -2.309326171875, -2.1854248046875, -2.0615234375, -1.9376220703125, -1.813720703125, -1.6898193359375, -1.56591796875, -1.4420166015625, -1.318115234375, -1.1942138671875, -1.0703125, -0.9464111328125, -0.822509765625, -0.6986083984375, -0.57470703125, -0.4508056640625, -0.326904296875, -0.2030029296875, -0.0791015625, 0.0447998046875, 0.168701171875, 0.2926025390625, 0.41650390625, 0.5404052734375, 0.664306640625, 0.7882080078125, 0.912109375, 1.0360107421875, 1.159912109375, 1.2838134765625, 1.40771484375, 1.5316162109375, 1.655517578125, 1.7794189453125, 1.9033203125, 2.0272216796875, 2.151123046875, 2.2750244140625, 2.39892578125, 2.5228271484375, 2.646728515625, 2.7706298828125, 2.89453125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 11.0, 15.0, 21.0, 35.0, 53.0, 67.0, 73.0, 69.0, 100.0, 76.0, 67.0, 89.0, 59.0, 51.0, 46.0, 35.0, 35.0, 26.0, 21.0, 9.0, 11.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85107421875, -0.8234024047851562, -0.7957305908203125, -0.7680587768554688, -0.740386962890625, -0.7127151489257812, -0.6850433349609375, -0.6573715209960938, -0.62969970703125, -0.6020278930664062, -0.5743560791015625, -0.5466842651367188, -0.519012451171875, -0.49134063720703125, -0.4636688232421875, -0.43599700927734375, -0.4083251953125, -0.38065338134765625, -0.3529815673828125, -0.32530975341796875, -0.297637939453125, -0.26996612548828125, -0.2422943115234375, -0.21462249755859375, -0.18695068359375, -0.15927886962890625, -0.1316070556640625, -0.10393524169921875, -0.076263427734375, -0.04859161376953125, -0.0209197998046875, 0.00675201416015625, 0.034423828125, 0.06209564208984375, 0.0897674560546875, 0.11743927001953125, 0.145111083984375, 0.17278289794921875, 0.2004547119140625, 0.22812652587890625, 0.25579833984375, 0.28347015380859375, 0.3111419677734375, 0.33881378173828125, 0.366485595703125, 0.39415740966796875, 0.4218292236328125, 0.44950103759765625, 0.4771728515625, 0.5048446655273438, 0.5325164794921875, 0.5601882934570312, 0.587860107421875, 0.6155319213867188, 0.6432037353515625, 0.6708755493164062, 0.69854736328125, 0.7262191772460938, 0.7538909912109375, 0.7815628051757812, 0.809234619140625, 0.8369064331054688, 0.8645782470703125, 0.8922500610351562, 0.919921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 7.0, 19.0, 21.0, 27.0, 50.0, 81.0, 96.0, 168.0, 309.0, 540.0, 992.0, 1979.0, 4604.0, 13421.0, 57585.0, 2210765.0, 1825954.0, 55863.0, 13106.0, 4559.0, 1961.0, 953.0, 447.0, 277.0, 179.0, 105.0, 69.0, 47.0, 27.0, 28.0, 10.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.181640625, -2.1270904541015625, -2.072540283203125, -2.0179901123046875, -1.96343994140625, -1.9088897705078125, -1.854339599609375, -1.7997894287109375, -1.7452392578125, -1.6906890869140625, -1.636138916015625, -1.5815887451171875, -1.52703857421875, -1.4724884033203125, -1.417938232421875, -1.3633880615234375, -1.308837890625, -1.2542877197265625, -1.199737548828125, -1.1451873779296875, -1.09063720703125, -1.0360870361328125, -0.981536865234375, -0.9269866943359375, -0.8724365234375, -0.8178863525390625, -0.763336181640625, -0.7087860107421875, -0.65423583984375, -0.5996856689453125, -0.545135498046875, -0.4905853271484375, -0.43603515625, -0.3814849853515625, -0.326934814453125, -0.2723846435546875, -0.21783447265625, -0.1632843017578125, -0.108734130859375, -0.0541839599609375, 0.0003662109375, 0.0549163818359375, 0.109466552734375, 0.1640167236328125, 0.21856689453125, 0.2731170654296875, 0.327667236328125, 0.3822174072265625, 0.436767578125, 0.4913177490234375, 0.545867919921875, 0.6004180908203125, 0.65496826171875, 0.7095184326171875, 0.764068603515625, 0.8186187744140625, 0.8731689453125, 0.9277191162109375, 0.982269287109375, 1.0368194580078125, 1.09136962890625, 1.1459197998046875, 1.200469970703125, 1.2550201416015625, 1.3095703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 4.0, 3.0, 4.0, 10.0, 11.0, 16.0, 21.0, 40.0, 54.0, 110.0, 322.0, 2380.0, 746.0, 179.0, 71.0, 25.0, 20.0, 17.0, 10.0, 7.0, 9.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1982421875, -1.1688232421875, -1.139404296875, -1.1099853515625, -1.08056640625, -1.0511474609375, -1.021728515625, -0.9923095703125, -0.962890625, -0.9334716796875, -0.904052734375, -0.8746337890625, -0.84521484375, -0.8157958984375, -0.786376953125, -0.7569580078125, -0.7275390625, -0.6981201171875, -0.668701171875, -0.6392822265625, -0.60986328125, -0.5804443359375, -0.551025390625, -0.5216064453125, -0.4921875, -0.4627685546875, -0.433349609375, -0.4039306640625, -0.37451171875, -0.3450927734375, -0.315673828125, -0.2862548828125, -0.2568359375, -0.2274169921875, -0.197998046875, -0.1685791015625, -0.13916015625, -0.1097412109375, -0.080322265625, -0.0509033203125, -0.021484375, 0.0079345703125, 0.037353515625, 0.0667724609375, 0.09619140625, 0.1256103515625, 0.155029296875, 0.1844482421875, 0.2138671875, 0.2432861328125, 0.272705078125, 0.3021240234375, 0.33154296875, 0.3609619140625, 0.390380859375, 0.4197998046875, 0.44921875, 0.4786376953125, 0.508056640625, 0.5374755859375, 0.56689453125, 0.5963134765625, 0.625732421875, 0.6551513671875, 0.6845703125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 11.0, 31.0, 157.0, 418.0, 310.0, 73.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.776878356933594, -16.471323013305664, -16.165767669677734, -15.860213279724121, -15.554657936096191, -15.249102592468262, -14.943548202514648, -14.637992858886719, -14.332437515258789, -14.02688217163086, -13.721327781677246, -13.415772438049316, -13.110217094421387, -12.804661750793457, -12.499107360839844, -12.193552017211914, -11.887996673583984, -11.582441329956055, -11.276886940002441, -10.971331596374512, -10.665776252746582, -10.360220909118652, -10.054666519165039, -9.74911117553711, -9.443556785583496, -9.138001441955566, -8.832447052001953, -8.526891708374023, -8.221336364746094, -7.915781497955322, -7.610226631164551, -7.304671287536621, -6.999115467071533, -6.693560600280762, -6.388005256652832, -6.0824503898620605, -5.776895046234131, -5.471340179443359, -5.16578483581543, -4.860229969024658, -4.554675102233887, -4.249120235443115, -3.9435648918151855, -3.638010025024414, -3.3324546813964844, -3.026899814605713, -2.7213447093963623, -2.4157896041870117, -2.110234260559082, -1.8046791553497314, -1.4991240501403809, -1.1935690641403198, -0.8880139589309692, -0.5824588537216187, -0.2769038677215576, 0.02865123748779297, 0.33420634269714355, 0.6397614479064941, 0.9453164935112, 1.2508715391159058, 1.5564266443252563, 1.861981749534607, 2.167536735534668, 2.4730918407440186, 2.778646945953369]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 7.0, 15.0, 10.0, 24.0, 35.0, 45.0, 44.0, 41.0, 63.0, 62.0, 62.0, 68.0, 72.0, 57.0, 65.0, 73.0, 49.0, 41.0, 42.0, 37.0, 25.0, 13.0, 13.0, 10.0, 11.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.379629611968994, -3.288191318511963, -3.1967532634735107, -3.1053149700164795, -3.0138769149780273, -2.922438621520996, -2.831000566482544, -2.7395622730255127, -2.6481242179870605, -2.5566859245300293, -2.465247869491577, -2.373809576034546, -2.2823715209960938, -2.1909332275390625, -2.0994951725006104, -2.008056879043579, -1.9166187047958374, -1.8251805305480957, -1.733742356300354, -1.6423041820526123, -1.5508660078048706, -1.459427833557129, -1.3679895401000977, -1.2765514850616455, -1.1851131916046143, -1.0936750173568726, -1.0022368431091309, -0.9107986688613892, -0.8193604946136475, -0.7279223203659058, -0.6364840865135193, -0.5450459122657776, -0.45360779762268066, -0.36216962337493896, -0.27073144912719727, -0.17929324507713318, -0.08785507082939148, 0.0035831034183502197, 0.0950213074684143, 0.186459481716156, 0.2778976559638977, 0.3693358302116394, 0.4607740044593811, 0.5522122383117676, 0.6436504125595093, 0.735088586807251, 0.8265267610549927, 0.9179649353027344, 1.009403109550476, 1.1008412837982178, 1.1922794580459595, 1.2837176322937012, 1.3751558065414429, 1.4665939807891846, 1.5580322742462158, 1.649470329284668, 1.7409086227416992, 1.832346796989441, 1.9237849712371826, 2.015223264694214, 2.106661319732666, 2.1980996131896973, 2.2895376682281494, 2.3809759616851807, 2.472414016723633]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 0.0, 4.0, 4.0, 8.0, 5.0, 9.0, 13.0, 17.0, 18.0, 31.0, 44.0, 70.0, 101.0, 145.0, 226.0, 382.0, 694.0, 1174.0, 2128.0, 4512.0, 10653.0, 28054.0, 90443.0, 291228.0, 393666.0, 151827.0, 44724.0, 15393.0, 6324.0, 2879.0, 1542.0, 845.0, 479.0, 303.0, 202.0, 119.0, 90.0, 53.0, 47.0, 26.0, 22.0, 14.0, 10.0, 12.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.880859375, -1.8224639892578125, -1.764068603515625, -1.7056732177734375, -1.64727783203125, -1.5888824462890625, -1.530487060546875, -1.4720916748046875, -1.4136962890625, -1.3553009033203125, -1.296905517578125, -1.2385101318359375, -1.18011474609375, -1.1217193603515625, -1.063323974609375, -1.0049285888671875, -0.946533203125, -0.8881378173828125, -0.829742431640625, -0.7713470458984375, -0.71295166015625, -0.6545562744140625, -0.596160888671875, -0.5377655029296875, -0.4793701171875, -0.4209747314453125, -0.362579345703125, -0.3041839599609375, -0.24578857421875, -0.1873931884765625, -0.128997802734375, -0.0706024169921875, -0.01220703125, 0.0461883544921875, 0.104583740234375, 0.1629791259765625, 0.22137451171875, 0.2797698974609375, 0.338165283203125, 0.3965606689453125, 0.4549560546875, 0.5133514404296875, 0.571746826171875, 0.6301422119140625, 0.68853759765625, 0.7469329833984375, 0.805328369140625, 0.8637237548828125, 0.922119140625, 0.9805145263671875, 1.038909912109375, 1.0973052978515625, 1.15570068359375, 1.2140960693359375, 1.272491455078125, 1.3308868408203125, 1.3892822265625, 1.4476776123046875, 1.506072998046875, 1.5644683837890625, 1.62286376953125, 1.6812591552734375, 1.739654541015625, 1.7980499267578125, 1.8564453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 8.0, 10.0, 11.0, 12.0, 25.0, 53.0, 54.0, 65.0, 72.0, 77.0, 87.0, 89.0, 70.0, 69.0, 60.0, 52.0, 34.0, 36.0, 35.0, 25.0, 17.0, 9.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.849609375, -0.82257080078125, -0.7955322265625, -0.76849365234375, -0.741455078125, -0.71441650390625, -0.6873779296875, -0.66033935546875, -0.63330078125, -0.60626220703125, -0.5792236328125, -0.55218505859375, -0.525146484375, -0.49810791015625, -0.4710693359375, -0.44403076171875, -0.4169921875, -0.38995361328125, -0.3629150390625, -0.33587646484375, -0.308837890625, -0.28179931640625, -0.2547607421875, -0.22772216796875, -0.20068359375, -0.17364501953125, -0.1466064453125, -0.11956787109375, -0.092529296875, -0.06549072265625, -0.0384521484375, -0.01141357421875, 0.015625, 0.04266357421875, 0.0697021484375, 0.09674072265625, 0.123779296875, 0.15081787109375, 0.1778564453125, 0.20489501953125, 0.23193359375, 0.25897216796875, 0.2860107421875, 0.31304931640625, 0.340087890625, 0.36712646484375, 0.3941650390625, 0.42120361328125, 0.4482421875, 0.47528076171875, 0.5023193359375, 0.52935791015625, 0.556396484375, 0.58343505859375, 0.6104736328125, 0.63751220703125, 0.66455078125, 0.69158935546875, 0.7186279296875, 0.74566650390625, 0.772705078125, 0.79974365234375, 0.8267822265625, 0.85382080078125, 0.880859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 3.0, 11.0, 12.0, 13.0, 20.0, 37.0, 63.0, 85.0, 171.0, 285.0, 614.0, 1175.0, 2722.0, 8077.0, 32862.0, 174246.0, 544295.0, 226475.0, 41982.0, 9635.0, 3161.0, 1212.0, 623.0, 298.0, 181.0, 109.0, 52.0, 37.0, 36.0, 15.0, 13.0, 6.0, 3.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.244140625, -2.175262451171875, -2.10638427734375, -2.037506103515625, -1.9686279296875, -1.899749755859375, -1.83087158203125, -1.761993408203125, -1.693115234375, -1.624237060546875, -1.55535888671875, -1.486480712890625, -1.4176025390625, -1.348724365234375, -1.27984619140625, -1.210968017578125, -1.14208984375, -1.073211669921875, -1.00433349609375, -0.935455322265625, -0.8665771484375, -0.797698974609375, -0.72882080078125, -0.659942626953125, -0.591064453125, -0.522186279296875, -0.45330810546875, -0.384429931640625, -0.3155517578125, -0.246673583984375, -0.17779541015625, -0.108917236328125, -0.0400390625, 0.028839111328125, 0.09771728515625, 0.166595458984375, 0.2354736328125, 0.304351806640625, 0.37322998046875, 0.442108154296875, 0.510986328125, 0.579864501953125, 0.64874267578125, 0.717620849609375, 0.7864990234375, 0.855377197265625, 0.92425537109375, 0.993133544921875, 1.06201171875, 1.130889892578125, 1.19976806640625, 1.268646240234375, 1.3375244140625, 1.406402587890625, 1.47528076171875, 1.544158935546875, 1.613037109375, 1.681915283203125, 1.75079345703125, 1.819671630859375, 1.8885498046875, 1.957427978515625, 2.02630615234375, 2.095184326171875, 2.1640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 3.0, 6.0, 12.0, 12.0, 19.0, 25.0, 41.0, 33.0, 34.0, 45.0, 53.0, 65.0, 63.0, 50.0, 51.0, 50.0, 56.0, 53.0, 59.0, 50.0, 40.0, 32.0, 36.0, 23.0, 20.0, 10.0, 9.0, 11.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.818359375, -2.717864990234375, -2.61737060546875, -2.516876220703125, -2.4163818359375, -2.315887451171875, -2.21539306640625, -2.114898681640625, -2.014404296875, -1.913909912109375, -1.81341552734375, -1.712921142578125, -1.6124267578125, -1.511932373046875, -1.41143798828125, -1.310943603515625, -1.21044921875, -1.109954833984375, -1.00946044921875, -0.908966064453125, -0.8084716796875, -0.707977294921875, -0.60748291015625, -0.506988525390625, -0.406494140625, -0.305999755859375, -0.20550537109375, -0.105010986328125, -0.0045166015625, 0.095977783203125, 0.19647216796875, 0.296966552734375, 0.3974609375, 0.497955322265625, 0.59844970703125, 0.698944091796875, 0.7994384765625, 0.899932861328125, 1.00042724609375, 1.100921630859375, 1.201416015625, 1.301910400390625, 1.40240478515625, 1.502899169921875, 1.6033935546875, 1.703887939453125, 1.80438232421875, 1.904876708984375, 2.00537109375, 2.105865478515625, 2.20635986328125, 2.306854248046875, 2.4073486328125, 2.507843017578125, 2.60833740234375, 2.708831787109375, 2.809326171875, 2.909820556640625, 3.01031494140625, 3.110809326171875, 3.2113037109375, 3.311798095703125, 3.41229248046875, 3.512786865234375, 3.61328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 4.0, 11.0, 22.0, 23.0, 44.0, 82.0, 105.0, 159.0, 329.0, 625.0, 1498.0, 4094.0, 14271.0, 111273.0, 852673.0, 48935.0, 9146.0, 2915.0, 1156.0, 508.0, 263.0, 161.0, 94.0, 57.0, 29.0, 14.0, 19.0, 6.0, 10.0, 3.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.11431884765625, -2.0489501953125, -1.98358154296875, -1.918212890625, -1.85284423828125, -1.7874755859375, -1.72210693359375, -1.65673828125, -1.59136962890625, -1.5260009765625, -1.46063232421875, -1.395263671875, -1.32989501953125, -1.2645263671875, -1.19915771484375, -1.1337890625, -1.06842041015625, -1.0030517578125, -0.93768310546875, -0.872314453125, -0.80694580078125, -0.7415771484375, -0.67620849609375, -0.61083984375, -0.54547119140625, -0.4801025390625, -0.41473388671875, -0.349365234375, -0.28399658203125, -0.2186279296875, -0.15325927734375, -0.087890625, -0.02252197265625, 0.0428466796875, 0.10821533203125, 0.173583984375, 0.23895263671875, 0.3043212890625, 0.36968994140625, 0.43505859375, 0.50042724609375, 0.5657958984375, 0.63116455078125, 0.696533203125, 0.76190185546875, 0.8272705078125, 0.89263916015625, 0.9580078125, 1.02337646484375, 1.0887451171875, 1.15411376953125, 1.219482421875, 1.28485107421875, 1.3502197265625, 1.41558837890625, 1.48095703125, 1.54632568359375, 1.6116943359375, 1.67706298828125, 1.742431640625, 1.80780029296875, 1.8731689453125, 1.93853759765625, 2.00390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 5.0, 8.0, 8.0, 13.0, 21.0, 36.0, 37.0, 45.0, 72.0, 104.0, 191.0, 143.0, 70.0, 65.0, 45.0, 44.0, 29.0, 9.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024306774139404297, -0.0002354104071855545, -0.00022775307297706604, -0.00022009573876857758, -0.0002124384045600891, -0.00020478107035160065, -0.00019712373614311218, -0.00018946640193462372, -0.00018180906772613525, -0.0001741517335176468, -0.00016649439930915833, -0.00015883706510066986, -0.0001511797308921814, -0.00014352239668369293, -0.00013586506247520447, -0.000128207728266716, -0.00012055039405822754, -0.00011289305984973907, -0.00010523572564125061, -9.757839143276215e-05, -8.992105722427368e-05, -8.226372301578522e-05, -7.460638880729675e-05, -6.694905459880829e-05, -5.9291720390319824e-05, -5.163438618183136e-05, -4.3977051973342896e-05, -3.631971776485443e-05, -2.8662383556365967e-05, -2.1005049347877502e-05, -1.3347715139389038e-05, -5.690380930900574e-06, 1.9669532775878906e-06, 9.624287486076355e-06, 1.728162169456482e-05, 2.4938955903053284e-05, 3.259629011154175e-05, 4.025362432003021e-05, 4.791095852851868e-05, 5.556829273700714e-05, 6.32256269454956e-05, 7.088296115398407e-05, 7.854029536247253e-05, 8.6197629570961e-05, 9.385496377944946e-05, 0.00010151229798793793, 0.00010916963219642639, 0.00011682696640491486, 0.00012448430061340332, 0.00013214163482189178, 0.00013979896903038025, 0.0001474563032388687, 0.00015511363744735718, 0.00016277097165584564, 0.0001704283058643341, 0.00017808564007282257, 0.00018574297428131104, 0.0001934003084897995, 0.00020105764269828796, 0.00020871497690677643, 0.0002163723111152649, 0.00022402964532375336, 0.00023168697953224182, 0.00023934431374073029, 0.00024700164794921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 7.0, 6.0, 20.0, 31.0, 44.0, 47.0, 80.0, 126.0, 294.0, 772.0, 2848.0, 17741.0, 676890.0, 332861.0, 13160.0, 2393.0, 648.0, 230.0, 133.0, 91.0, 50.0, 25.0, 22.0, 15.0, 7.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9034423828125, -1.816650390625, -1.7298583984375, -1.64306640625, -1.5562744140625, -1.469482421875, -1.3826904296875, -1.2958984375, -1.2091064453125, -1.122314453125, -1.0355224609375, -0.94873046875, -0.8619384765625, -0.775146484375, -0.6883544921875, -0.6015625, -0.5147705078125, -0.427978515625, -0.3411865234375, -0.25439453125, -0.1676025390625, -0.080810546875, 0.0059814453125, 0.0927734375, 0.1795654296875, 0.266357421875, 0.3531494140625, 0.43994140625, 0.5267333984375, 0.613525390625, 0.7003173828125, 0.787109375, 0.8739013671875, 0.960693359375, 1.0474853515625, 1.13427734375, 1.2210693359375, 1.307861328125, 1.3946533203125, 1.4814453125, 1.5682373046875, 1.655029296875, 1.7418212890625, 1.82861328125, 1.9154052734375, 2.002197265625, 2.0889892578125, 2.17578125, 2.2625732421875, 2.349365234375, 2.4361572265625, 2.52294921875, 2.6097412109375, 2.696533203125, 2.7833251953125, 2.8701171875, 2.9569091796875, 3.043701171875, 3.1304931640625, 3.21728515625, 3.3040771484375, 3.390869140625, 3.4776611328125, 3.564453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 8.0, 14.0, 34.0, 62.0, 91.0, 156.0, 185.0, 163.0, 100.0, 39.0, 33.0, 26.0, 12.0, 7.0, 9.0, 5.0, 4.0, 5.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6386871337890625, -1.583038330078125, -1.5273895263671875, -1.47174072265625, -1.4160919189453125, -1.360443115234375, -1.3047943115234375, -1.2491455078125, -1.1934967041015625, -1.137847900390625, -1.0821990966796875, -1.02655029296875, -0.9709014892578125, -0.915252685546875, -0.8596038818359375, -0.803955078125, -0.7483062744140625, -0.692657470703125, -0.6370086669921875, -0.58135986328125, -0.5257110595703125, -0.470062255859375, -0.4144134521484375, -0.3587646484375, -0.3031158447265625, -0.247467041015625, -0.1918182373046875, -0.13616943359375, -0.0805206298828125, -0.024871826171875, 0.0307769775390625, 0.08642578125, 0.1420745849609375, 0.197723388671875, 0.2533721923828125, 0.30902099609375, 0.3646697998046875, 0.420318603515625, 0.4759674072265625, 0.5316162109375, 0.5872650146484375, 0.642913818359375, 0.6985626220703125, 0.75421142578125, 0.8098602294921875, 0.865509033203125, 0.9211578369140625, 0.976806640625, 1.0324554443359375, 1.088104248046875, 1.1437530517578125, 1.19940185546875, 1.2550506591796875, 1.310699462890625, 1.3663482666015625, 1.4219970703125, 1.4776458740234375, 1.533294677734375, 1.5889434814453125, 1.64459228515625, 1.7002410888671875, 1.755889892578125, 1.8115386962890625, 1.8671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 13.0, 51.0, 125.0, 265.0, 278.0, 166.0, 65.0, 21.0, 11.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.588333129882812, -19.393722534179688, -18.199111938476562, -17.004501342773438, -15.809890747070312, -14.615280151367188, -13.420669555664062, -12.226058959960938, -11.031448364257812, -9.836837768554688, -8.642227172851562, -7.4476165771484375, -6.2530059814453125, -5.0583953857421875, -3.8637847900390625, -2.6691741943359375, -1.4745635986328125, -0.2799530029296875, 0.9146575927734375, 2.1092681884765625, 3.3038787841796875, 4.4984893798828125, 5.6930999755859375, 6.8877105712890625, 8.082321166992188, 9.276931762695312, 10.471542358398438, 11.666152954101562, 12.860763549804688, 14.055374145507812, 15.249984741210938, 16.444595336914062, 17.639202117919922, 18.833812713623047, 20.028423309326172, 21.223033905029297, 22.417644500732422, 23.612255096435547, 24.806865692138672, 26.001476287841797, 27.196086883544922, 28.390697479248047, 29.585308074951172, 30.779918670654297, 31.974529266357422, 33.16913986206055, 34.36375045776367, 35.5583610534668, 36.75297164916992, 37.94758224487305, 39.14219284057617, 40.3368034362793, 41.53141403198242, 42.72602462768555, 43.92063522338867, 45.1152458190918, 46.30985641479492, 47.50446701049805, 48.69907760620117, 49.8936882019043, 51.08829879760742, 52.28290939331055, 53.47751998901367, 54.6721305847168, 55.86674118041992]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 8.0, 5.0, 9.0, 11.0, 13.0, 11.0, 18.0, 24.0, 26.0, 23.0, 34.0, 30.0, 26.0, 29.0, 36.0, 36.0, 39.0, 53.0, 50.0, 43.0, 44.0, 41.0, 41.0, 36.0, 30.0, 42.0, 25.0, 30.0, 23.0, 30.0, 31.0, 21.0, 8.0, 9.0, 13.0, 10.0, 6.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.494140625, -15.037921905517578, -14.58170223236084, -14.125482559204102, -13.66926383972168, -13.213045120239258, -12.75682544708252, -12.300605773925781, -11.84438705444336, -11.388168334960938, -10.9319486618042, -10.475728988647461, -10.019510269165039, -9.563291549682617, -9.107071876525879, -8.65085220336914, -8.194633483886719, -7.738414287567139, -7.282195091247559, -6.8259758949279785, -6.369756698608398, -5.913537502288818, -5.457318305969238, -5.001099109649658, -4.544879913330078, -4.088660717010498, -3.632441520690918, -3.176222324371338, -2.720003128051758, -2.2637839317321777, -1.8075647354125977, -1.3513455390930176, -0.8951253890991211, -0.438906192779541, 0.017313003540039062, 0.47353219985961914, 0.9297513961791992, 1.3859705924987793, 1.8421897888183594, 2.2984089851379395, 2.7546281814575195, 3.2108473777770996, 3.6670665740966797, 4.12328577041626, 4.57950496673584, 5.03572416305542, 5.491943359375, 5.94816255569458, 6.40438175201416, 6.86060094833374, 7.31682014465332, 7.7730393409729, 8.22925853729248, 8.685478210449219, 9.14169692993164, 9.597915649414062, 10.0541353225708, 10.510354995727539, 10.966573715209961, 11.422792434692383, 11.879012107849121, 12.33523178100586, 12.791450500488281, 13.247669219970703, 13.703888893127441]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 20.0, 28.0, 51.0, 90.0, 163.0, 359.0, 887.0, 2323.0, 7913.0, 55837.0, 3962705.0, 145743.0, 12706.0, 3333.0, 1154.0, 503.0, 201.0, 101.0, 63.0, 37.0, 16.0, 11.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.47979736328125, -4.3541259765625, -4.22845458984375, -4.102783203125, -3.97711181640625, -3.8514404296875, -3.72576904296875, -3.60009765625, -3.47442626953125, -3.3487548828125, -3.22308349609375, -3.097412109375, -2.97174072265625, -2.8460693359375, -2.72039794921875, -2.5947265625, -2.46905517578125, -2.3433837890625, -2.21771240234375, -2.092041015625, -1.96636962890625, -1.8406982421875, -1.71502685546875, -1.58935546875, -1.46368408203125, -1.3380126953125, -1.21234130859375, -1.086669921875, -0.96099853515625, -0.8353271484375, -0.70965576171875, -0.583984375, -0.45831298828125, -0.3326416015625, -0.20697021484375, -0.081298828125, 0.04437255859375, 0.1700439453125, 0.29571533203125, 0.42138671875, 0.54705810546875, 0.6727294921875, 0.79840087890625, 0.924072265625, 1.04974365234375, 1.1754150390625, 1.30108642578125, 1.4267578125, 1.55242919921875, 1.6781005859375, 1.80377197265625, 1.929443359375, 2.05511474609375, 2.1807861328125, 2.30645751953125, 2.43212890625, 2.55780029296875, 2.6834716796875, 2.80914306640625, 2.934814453125, 3.06048583984375, 3.1861572265625, 3.31182861328125, 3.4375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 6.0, 12.0, 7.0, 23.0, 28.0, 40.0, 42.0, 39.0, 51.0, 67.0, 59.0, 75.0, 71.0, 63.0, 66.0, 53.0, 56.0, 45.0, 44.0, 23.0, 34.0, 22.0, 21.0, 7.0, 13.0, 5.0, 9.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.873687744140625, -0.84600830078125, -0.818328857421875, -0.7906494140625, -0.762969970703125, -0.73529052734375, -0.707611083984375, -0.679931640625, -0.652252197265625, -0.62457275390625, -0.596893310546875, -0.5692138671875, -0.541534423828125, -0.51385498046875, -0.486175537109375, -0.45849609375, -0.430816650390625, -0.40313720703125, -0.375457763671875, -0.3477783203125, -0.320098876953125, -0.29241943359375, -0.264739990234375, -0.237060546875, -0.209381103515625, -0.18170166015625, -0.154022216796875, -0.1263427734375, -0.098663330078125, -0.07098388671875, -0.043304443359375, -0.015625, 0.012054443359375, 0.03973388671875, 0.067413330078125, 0.0950927734375, 0.122772216796875, 0.15045166015625, 0.178131103515625, 0.205810546875, 0.233489990234375, 0.26116943359375, 0.288848876953125, 0.3165283203125, 0.344207763671875, 0.37188720703125, 0.399566650390625, 0.42724609375, 0.454925537109375, 0.48260498046875, 0.510284423828125, 0.5379638671875, 0.565643310546875, 0.59332275390625, 0.621002197265625, 0.648681640625, 0.676361083984375, 0.70404052734375, 0.731719970703125, 0.7593994140625, 0.787078857421875, 0.81475830078125, 0.842437744140625, 0.8701171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 16.0, 27.0, 29.0, 38.0, 55.0, 82.0, 159.0, 258.0, 548.0, 1056.0, 2420.0, 6917.0, 27441.0, 272120.0, 3745940.0, 111238.0, 17204.0, 4921.0, 1924.0, 848.0, 406.0, 236.0, 129.0, 72.0, 42.0, 29.0, 28.0, 22.0, 11.0, 10.0, 11.0, 7.0, 8.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.204193115234375, -2.12908935546875, -2.053985595703125, -1.9788818359375, -1.903778076171875, -1.82867431640625, -1.753570556640625, -1.678466796875, -1.603363037109375, -1.52825927734375, -1.453155517578125, -1.3780517578125, -1.302947998046875, -1.22784423828125, -1.152740478515625, -1.07763671875, -1.002532958984375, -0.92742919921875, -0.852325439453125, -0.7772216796875, -0.702117919921875, -0.62701416015625, -0.551910400390625, -0.476806640625, -0.401702880859375, -0.32659912109375, -0.251495361328125, -0.1763916015625, -0.101287841796875, -0.02618408203125, 0.048919677734375, 0.1240234375, 0.199127197265625, 0.27423095703125, 0.349334716796875, 0.4244384765625, 0.499542236328125, 0.57464599609375, 0.649749755859375, 0.724853515625, 0.799957275390625, 0.87506103515625, 0.950164794921875, 1.0252685546875, 1.100372314453125, 1.17547607421875, 1.250579833984375, 1.32568359375, 1.400787353515625, 1.47589111328125, 1.550994873046875, 1.6260986328125, 1.701202392578125, 1.77630615234375, 1.851409912109375, 1.926513671875, 2.001617431640625, 2.07672119140625, 2.151824951171875, 2.2269287109375, 2.302032470703125, 2.37713623046875, 2.452239990234375, 2.52734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 5.0, 8.0, 16.0, 18.0, 37.0, 87.0, 184.0, 979.0, 2249.0, 275.0, 104.0, 44.0, 27.0, 6.0, 9.0, 8.0, 6.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.431640625, -2.3777923583984375, -2.323944091796875, -2.2700958251953125, -2.21624755859375, -2.1623992919921875, -2.108551025390625, -2.0547027587890625, -2.0008544921875, -1.9470062255859375, -1.893157958984375, -1.8393096923828125, -1.78546142578125, -1.7316131591796875, -1.677764892578125, -1.6239166259765625, -1.570068359375, -1.5162200927734375, -1.462371826171875, -1.4085235595703125, -1.35467529296875, -1.3008270263671875, -1.246978759765625, -1.1931304931640625, -1.1392822265625, -1.0854339599609375, -1.031585693359375, -0.9777374267578125, -0.92388916015625, -0.8700408935546875, -0.816192626953125, -0.7623443603515625, -0.70849609375, -0.6546478271484375, -0.600799560546875, -0.5469512939453125, -0.49310302734375, -0.4392547607421875, -0.385406494140625, -0.3315582275390625, -0.2777099609375, -0.2238616943359375, -0.170013427734375, -0.1161651611328125, -0.06231689453125, -0.0084686279296875, 0.045379638671875, 0.0992279052734375, 0.153076171875, 0.2069244384765625, 0.260772705078125, 0.3146209716796875, 0.36846923828125, 0.4223175048828125, 0.476165771484375, 0.5300140380859375, 0.5838623046875, 0.6377105712890625, 0.691558837890625, 0.7454071044921875, 0.79925537109375, 0.8531036376953125, 0.906951904296875, 0.9608001708984375, 1.0146484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 8.0, 35.0, 129.0, 272.0, 324.0, 159.0, 59.0, 15.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.818504333496094, -16.46736717224121, -16.116230010986328, -15.765093803405762, -15.413956642150879, -15.062820434570312, -14.71168327331543, -14.360546112060547, -14.009408950805664, -13.658271789550781, -13.307135581970215, -12.955998420715332, -12.60486125946045, -12.253725051879883, -11.902587890625, -11.551450729370117, -11.20031452178955, -10.849177360534668, -10.498041152954102, -10.146903991699219, -9.795766830444336, -9.444629669189453, -9.093493461608887, -8.742356300354004, -8.391220092773438, -8.040082931518555, -7.68894624710083, -7.3378095626831055, -6.986672401428223, -6.635535717010498, -6.284399032592773, -5.933261871337891, -5.582123756408691, -5.230987071990967, -4.879849910736084, -4.528713226318359, -4.177576065063477, -3.826439380645752, -3.4753026962280273, -3.1241657733917236, -2.77302885055542, -2.421891927719116, -2.0707550048828125, -1.719618320465088, -1.3684813976287842, -1.0173444747924805, -0.6662077903747559, -0.31507086753845215, 0.03606605529785156, 0.3872029185295105, 0.7383397817611694, 1.0894765853881836, 1.4406135082244873, 1.791750431060791, 2.1428871154785156, 2.4940240383148193, 2.845160961151123, 3.1962978839874268, 3.5474348068237305, 3.898571491241455, 4.24970817565918, 4.6008453369140625, 4.951982021331787, 5.303118705749512, 5.6542558670043945]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 5.0, 14.0, 11.0, 10.0, 11.0, 19.0, 24.0, 35.0, 25.0, 35.0, 34.0, 43.0, 39.0, 51.0, 39.0, 48.0, 53.0, 51.0, 40.0, 53.0, 45.0, 41.0, 33.0, 33.0, 36.0, 22.0, 29.0, 18.0, 25.0, 11.0, 16.0, 5.0, 7.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2170538902282715, -3.113553762435913, -3.010053873062134, -2.9065537452697754, -2.803053617477417, -2.6995534896850586, -2.5960536003112793, -2.492553472518921, -2.3890533447265625, -2.285553216934204, -2.182053327560425, -2.0785531997680664, -1.975053071975708, -1.8715530633926392, -1.7680530548095703, -1.664552927017212, -1.5610530376434326, -1.4575530290603638, -1.3540529012680054, -1.2505528926849365, -1.1470527648925781, -1.0435527563095093, -0.9400527477264404, -0.8365526795387268, -0.7330526113510132, -0.6295525431632996, -0.5260524749755859, -0.4225524663925171, -0.31905239820480347, -0.21555233001708984, -0.112052321434021, -0.008552253246307373, 0.09494757652282715, 0.19844762980937958, 0.301947683095932, 0.40544772148132324, 0.5089477896690369, 0.6124478578567505, 0.7159478664398193, 0.819447934627533, 0.9229480028152466, 1.0264480113983154, 1.1299481391906738, 1.2334481477737427, 1.3369481563568115, 1.44044828414917, 1.5439482927322388, 1.6474483013153076, 1.750948429107666, 1.8544484376907349, 1.9579485654830933, 2.061448574066162, 2.1649487018585205, 2.268448829650879, 2.371948719024658, 2.4754488468170166, 2.578948974609375, 2.6824491024017334, 2.7859489917755127, 2.889449119567871, 2.9929492473602295, 3.096449375152588, 3.199949264526367, 3.3034493923187256, 3.406949281692505]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 15.0, 14.0, 16.0, 27.0, 59.0, 87.0, 120.0, 195.0, 269.0, 523.0, 847.0, 1585.0, 3056.0, 6419.0, 15054.0, 39926.0, 110807.0, 266228.0, 327849.0, 170982.0, 62831.0, 23090.0, 9373.0, 4251.0, 2090.0, 1094.0, 653.0, 381.0, 232.0, 148.0, 94.0, 64.0, 50.0, 31.0, 21.0, 18.0, 8.0, 4.0, 4.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.896484375, -1.8376312255859375, -1.778778076171875, -1.7199249267578125, -1.66107177734375, -1.6022186279296875, -1.543365478515625, -1.4845123291015625, -1.4256591796875, -1.3668060302734375, -1.307952880859375, -1.2490997314453125, -1.19024658203125, -1.1313934326171875, -1.072540283203125, -1.0136871337890625, -0.954833984375, -0.8959808349609375, -0.837127685546875, -0.7782745361328125, -0.71942138671875, -0.6605682373046875, -0.601715087890625, -0.5428619384765625, -0.4840087890625, -0.4251556396484375, -0.366302490234375, -0.3074493408203125, -0.24859619140625, -0.1897430419921875, -0.130889892578125, -0.0720367431640625, -0.01318359375, 0.0456695556640625, 0.104522705078125, 0.1633758544921875, 0.22222900390625, 0.2810821533203125, 0.339935302734375, 0.3987884521484375, 0.4576416015625, 0.5164947509765625, 0.575347900390625, 0.6342010498046875, 0.69305419921875, 0.7519073486328125, 0.810760498046875, 0.8696136474609375, 0.928466796875, 0.9873199462890625, 1.046173095703125, 1.1050262451171875, 1.16387939453125, 1.2227325439453125, 1.281585693359375, 1.3404388427734375, 1.3992919921875, 1.4581451416015625, 1.516998291015625, 1.5758514404296875, 1.63470458984375, 1.6935577392578125, 1.752410888671875, 1.8112640380859375, 1.8701171875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 6.0, 7.0, 10.0, 14.0, 21.0, 13.0, 39.0, 34.0, 52.0, 56.0, 35.0, 70.0, 63.0, 71.0, 69.0, 73.0, 53.0, 46.0, 57.0, 38.0, 30.0, 34.0, 31.0, 22.0, 17.0, 9.0, 8.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8935546875, -0.8665237426757812, -0.8394927978515625, -0.8124618530273438, -0.785430908203125, -0.7583999633789062, -0.7313690185546875, -0.7043380737304688, -0.67730712890625, -0.6502761840820312, -0.6232452392578125, -0.5962142944335938, -0.569183349609375, -0.5421524047851562, -0.5151214599609375, -0.48809051513671875, -0.4610595703125, -0.43402862548828125, -0.4069976806640625, -0.37996673583984375, -0.352935791015625, -0.32590484619140625, -0.2988739013671875, -0.27184295654296875, -0.24481201171875, -0.21778106689453125, -0.1907501220703125, -0.16371917724609375, -0.136688232421875, -0.10965728759765625, -0.0826263427734375, -0.05559539794921875, -0.028564453125, -0.00153350830078125, 0.0254974365234375, 0.05252838134765625, 0.079559326171875, 0.10659027099609375, 0.1336212158203125, 0.16065216064453125, 0.18768310546875, 0.21471405029296875, 0.2417449951171875, 0.26877593994140625, 0.295806884765625, 0.32283782958984375, 0.3498687744140625, 0.37689971923828125, 0.4039306640625, 0.43096160888671875, 0.4579925537109375, 0.48502349853515625, 0.512054443359375, 0.5390853881835938, 0.5661163330078125, 0.5931472778320312, 0.62017822265625, 0.6472091674804688, 0.6742401123046875, 0.7012710571289062, 0.728302001953125, 0.7553329467773438, 0.7823638916015625, 0.8093948364257812, 0.83642578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 4.0, 4.0, 9.0, 10.0, 18.0, 25.0, 29.0, 40.0, 55.0, 79.0, 115.0, 178.0, 328.0, 588.0, 1274.0, 2912.0, 8006.0, 24228.0, 83448.0, 280857.0, 419922.0, 159142.0, 44545.0, 13935.0, 4857.0, 1976.0, 834.0, 398.0, 227.0, 148.0, 104.0, 59.0, 50.0, 25.0, 26.0, 18.0, 16.0, 16.0, 12.0, 7.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.404296875, -2.3341064453125, -2.263916015625, -2.1937255859375, -2.12353515625, -2.0533447265625, -1.983154296875, -1.9129638671875, -1.8427734375, -1.7725830078125, -1.702392578125, -1.6322021484375, -1.56201171875, -1.4918212890625, -1.421630859375, -1.3514404296875, -1.28125, -1.2110595703125, -1.140869140625, -1.0706787109375, -1.00048828125, -0.9302978515625, -0.860107421875, -0.7899169921875, -0.7197265625, -0.6495361328125, -0.579345703125, -0.5091552734375, -0.43896484375, -0.3687744140625, -0.298583984375, -0.2283935546875, -0.158203125, -0.0880126953125, -0.017822265625, 0.0523681640625, 0.12255859375, 0.1927490234375, 0.262939453125, 0.3331298828125, 0.4033203125, 0.4735107421875, 0.543701171875, 0.6138916015625, 0.68408203125, 0.7542724609375, 0.824462890625, 0.8946533203125, 0.96484375, 1.0350341796875, 1.105224609375, 1.1754150390625, 1.24560546875, 1.3157958984375, 1.385986328125, 1.4561767578125, 1.5263671875, 1.5965576171875, 1.666748046875, 1.7369384765625, 1.80712890625, 1.8773193359375, 1.947509765625, 2.0177001953125, 2.087890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 7.0, 7.0, 3.0, 11.0, 16.0, 13.0, 7.0, 16.0, 18.0, 22.0, 24.0, 27.0, 32.0, 24.0, 39.0, 34.0, 30.0, 43.0, 39.0, 42.0, 42.0, 47.0, 57.0, 36.0, 40.0, 36.0, 27.0, 28.0, 30.0, 22.0, 19.0, 21.0, 19.0, 16.0, 16.0, 14.0, 12.0, 16.0, 10.0, 4.0, 5.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.0078125, -2.908111572265625, -2.80841064453125, -2.708709716796875, -2.6090087890625, -2.509307861328125, -2.40960693359375, -2.309906005859375, -2.210205078125, -2.110504150390625, -2.01080322265625, -1.911102294921875, -1.8114013671875, -1.711700439453125, -1.61199951171875, -1.512298583984375, -1.41259765625, -1.312896728515625, -1.21319580078125, -1.113494873046875, -1.0137939453125, -0.914093017578125, -0.81439208984375, -0.714691162109375, -0.614990234375, -0.515289306640625, -0.41558837890625, -0.315887451171875, -0.2161865234375, -0.116485595703125, -0.01678466796875, 0.082916259765625, 0.1826171875, 0.282318115234375, 0.38201904296875, 0.481719970703125, 0.5814208984375, 0.681121826171875, 0.78082275390625, 0.880523681640625, 0.980224609375, 1.079925537109375, 1.17962646484375, 1.279327392578125, 1.3790283203125, 1.478729248046875, 1.57843017578125, 1.678131103515625, 1.77783203125, 1.877532958984375, 1.97723388671875, 2.076934814453125, 2.1766357421875, 2.276336669921875, 2.37603759765625, 2.475738525390625, 2.575439453125, 2.675140380859375, 2.77484130859375, 2.874542236328125, 2.9742431640625, 3.073944091796875, 3.17364501953125, 3.273345947265625, 3.373046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 9.0, 15.0, 17.0, 28.0, 29.0, 34.0, 74.0, 90.0, 163.0, 314.0, 679.0, 1809.0, 6650.0, 46565.0, 645196.0, 316710.0, 23310.0, 4375.0, 1303.0, 493.0, 268.0, 137.0, 89.0, 61.0, 41.0, 18.0, 21.0, 11.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.017578125, -1.949981689453125, -1.88238525390625, -1.814788818359375, -1.7471923828125, -1.679595947265625, -1.61199951171875, -1.544403076171875, -1.476806640625, -1.409210205078125, -1.34161376953125, -1.274017333984375, -1.2064208984375, -1.138824462890625, -1.07122802734375, -1.003631591796875, -0.93603515625, -0.868438720703125, -0.80084228515625, -0.733245849609375, -0.6656494140625, -0.598052978515625, -0.53045654296875, -0.462860107421875, -0.395263671875, -0.327667236328125, -0.26007080078125, -0.192474365234375, -0.1248779296875, -0.057281494140625, 0.01031494140625, 0.077911376953125, 0.1455078125, 0.213104248046875, 0.28070068359375, 0.348297119140625, 0.4158935546875, 0.483489990234375, 0.55108642578125, 0.618682861328125, 0.686279296875, 0.753875732421875, 0.82147216796875, 0.889068603515625, 0.9566650390625, 1.024261474609375, 1.09185791015625, 1.159454345703125, 1.22705078125, 1.294647216796875, 1.36224365234375, 1.429840087890625, 1.4974365234375, 1.565032958984375, 1.63262939453125, 1.700225830078125, 1.767822265625, 1.835418701171875, 1.90301513671875, 1.970611572265625, 2.0382080078125, 2.105804443359375, 2.17340087890625, 2.240997314453125, 2.30859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 15.0, 37.0, 48.0, 111.0, 146.0, 160.0, 172.0, 132.0, 80.0, 46.0, 24.0, 8.0, 9.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023412704467773438, -0.00022094696760177612, -0.00020776689052581787, -0.00019458681344985962, -0.00018140673637390137, -0.00016822665929794312, -0.00015504658222198486, -0.0001418665051460266, -0.00012868642807006836, -0.00011550635099411011, -0.00010232627391815186, -8.91461968421936e-05, -7.596611976623535e-05, -6.27860426902771e-05, -4.960596561431885e-05, -3.6425888538360596e-05, -2.3245811462402344e-05, -1.0065734386444092e-05, 3.11434268951416e-06, 1.6294419765472412e-05, 2.9474496841430664e-05, 4.2654573917388916e-05, 5.583465099334717e-05, 6.901472806930542e-05, 8.219480514526367e-05, 9.537488222122192e-05, 0.00010855495929718018, 0.00012173503637313843, 0.00013491511344909668, 0.00014809519052505493, 0.00016127526760101318, 0.00017445534467697144, 0.0001876354217529297, 0.00020081549882888794, 0.0002139955759048462, 0.00022717565298080444, 0.0002403557300567627, 0.00025353580713272095, 0.0002667158842086792, 0.00027989596128463745, 0.0002930760383605957, 0.00030625611543655396, 0.0003194361925125122, 0.00033261626958847046, 0.0003457963466644287, 0.00035897642374038696, 0.0003721565008163452, 0.00038533657789230347, 0.0003985166549682617, 0.00041169673204421997, 0.0004248768091201782, 0.0004380568861961365, 0.0004512369632720947, 0.000464417040348053, 0.00047759711742401123, 0.0004907771944999695, 0.0005039572715759277, 0.000517137348651886, 0.0005303174257278442, 0.0005434975028038025, 0.0005566775798797607, 0.000569857656955719, 0.0005830377340316772, 0.0005962178111076355, 0.0006093978881835938]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 13.0, 20.0, 25.0, 40.0, 60.0, 94.0, 162.0, 323.0, 622.0, 1412.0, 3807.0, 15670.0, 93574.0, 544062.0, 325685.0, 48817.0, 9252.0, 2708.0, 1007.0, 482.0, 288.0, 161.0, 89.0, 63.0, 26.0, 20.0, 20.0, 5.0, 13.0, 2.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.716796875, -1.6701812744140625, -1.623565673828125, -1.5769500732421875, -1.53033447265625, -1.4837188720703125, -1.437103271484375, -1.3904876708984375, -1.3438720703125, -1.2972564697265625, -1.250640869140625, -1.2040252685546875, -1.15740966796875, -1.1107940673828125, -1.064178466796875, -1.0175628662109375, -0.970947265625, -0.9243316650390625, -0.877716064453125, -0.8311004638671875, -0.78448486328125, -0.7378692626953125, -0.691253662109375, -0.6446380615234375, -0.5980224609375, -0.5514068603515625, -0.504791259765625, -0.4581756591796875, -0.41156005859375, -0.3649444580078125, -0.318328857421875, -0.2717132568359375, -0.22509765625, -0.1784820556640625, -0.131866455078125, -0.0852508544921875, -0.03863525390625, 0.0079803466796875, 0.054595947265625, 0.1012115478515625, 0.1478271484375, 0.1944427490234375, 0.241058349609375, 0.2876739501953125, 0.33428955078125, 0.3809051513671875, 0.427520751953125, 0.4741363525390625, 0.520751953125, 0.5673675537109375, 0.613983154296875, 0.6605987548828125, 0.70721435546875, 0.7538299560546875, 0.800445556640625, 0.8470611572265625, 0.8936767578125, 0.9402923583984375, 0.986907958984375, 1.0335235595703125, 1.08013916015625, 1.1267547607421875, 1.173370361328125, 1.2199859619140625, 1.2666015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 3.0, 10.0, 9.0, 13.0, 24.0, 31.0, 33.0, 56.0, 72.0, 88.0, 121.0, 131.0, 89.0, 87.0, 55.0, 44.0, 42.0, 26.0, 19.0, 10.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.771484375, -1.710723876953125, -1.64996337890625, -1.589202880859375, -1.5284423828125, -1.467681884765625, -1.40692138671875, -1.346160888671875, -1.285400390625, -1.224639892578125, -1.16387939453125, -1.103118896484375, -1.0423583984375, -0.981597900390625, -0.92083740234375, -0.860076904296875, -0.79931640625, -0.738555908203125, -0.67779541015625, -0.617034912109375, -0.5562744140625, -0.495513916015625, -0.43475341796875, -0.373992919921875, -0.313232421875, -0.252471923828125, -0.19171142578125, -0.130950927734375, -0.0701904296875, -0.009429931640625, 0.05133056640625, 0.112091064453125, 0.1728515625, 0.233612060546875, 0.29437255859375, 0.355133056640625, 0.4158935546875, 0.476654052734375, 0.53741455078125, 0.598175048828125, 0.658935546875, 0.719696044921875, 0.78045654296875, 0.841217041015625, 0.9019775390625, 0.962738037109375, 1.02349853515625, 1.084259033203125, 1.14501953125, 1.205780029296875, 1.26654052734375, 1.327301025390625, 1.3880615234375, 1.448822021484375, 1.50958251953125, 1.570343017578125, 1.631103515625, 1.691864013671875, 1.75262451171875, 1.813385009765625, 1.8741455078125, 1.934906005859375, 1.99566650390625, 2.056427001953125, 2.1171875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 8.0, 24.0, 69.0, 140.0, 263.0, 244.0, 158.0, 66.0, 21.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.57878494262695, -49.133033752441406, -47.68728256225586, -46.24152755737305, -44.7957763671875, -43.35002517700195, -41.904273986816406, -40.458518981933594, -39.01276779174805, -37.5670166015625, -36.12126541137695, -34.67551040649414, -33.229759216308594, -31.784008026123047, -30.3382568359375, -28.89250373840332, -27.446752548217773, -26.001001358032227, -24.555248260498047, -23.1094970703125, -21.66374397277832, -20.217992782592773, -18.772239685058594, -17.326488494873047, -15.880736351013184, -14.43498420715332, -12.989232063293457, -11.543479919433594, -10.097728729248047, -8.651975631713867, -7.20622444152832, -5.760472297668457, -4.314720153808594, -2.8689680099487305, -1.4232161045074463, 0.02253580093383789, 1.4682879447937012, 2.9140400886535645, 4.3597917556762695, 5.805543899536133, 7.251296043395996, 8.69704818725586, 10.142800331115723, 11.588552474975586, 13.034303665161133, 14.480056762695312, 15.92580795288086, 17.371559143066406, 18.817312240600586, 20.263063430786133, 21.708816528320312, 23.15456771850586, 24.60032081604004, 26.046072006225586, 27.491825103759766, 28.937576293945312, 30.38332748413086, 31.829078674316406, 33.27482986450195, 34.720584869384766, 36.16633605957031, 37.61208724975586, 39.057838439941406, 40.50359344482422, 41.949344635009766]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 11.0, 7.0, 15.0, 13.0, 18.0, 21.0, 17.0, 26.0, 28.0, 32.0, 28.0, 34.0, 43.0, 50.0, 44.0, 42.0, 43.0, 45.0, 52.0, 39.0, 48.0, 37.0, 35.0, 39.0, 25.0, 21.0, 20.0, 23.0, 22.0, 18.0, 17.0, 13.0, 12.0, 12.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.579700469970703, -20.926462173461914, -20.273223876953125, -19.619985580444336, -18.966747283935547, -18.313507080078125, -17.660268783569336, -17.007030487060547, -16.353792190551758, -15.700553894042969, -15.04731559753418, -14.394076347351074, -13.740838050842285, -13.087599754333496, -12.43436050415039, -11.781122207641602, -11.127883911132812, -10.474645614624023, -9.821407318115234, -9.168168067932129, -8.51492977142334, -7.861691474914551, -7.2084527015686035, -6.555213928222656, -5.901975631713867, -5.248737335205078, -4.595498561859131, -3.9422600269317627, -3.2890214920043945, -2.6357829570770264, -1.9825444221496582, -1.329305648803711, -0.6760654449462891, -0.0228269100189209, 0.6304116249084473, 1.2836501598358154, 1.9368886947631836, 2.5901272296905518, 3.24336576461792, 3.896604537963867, 4.549842834472656, 5.203081130981445, 5.856319904327393, 6.50955867767334, 7.162796974182129, 7.816035270690918, 8.469274520874023, 9.122512817382812, 9.775751113891602, 10.42898941040039, 11.08222770690918, 11.735466957092285, 12.388705253601074, 13.041943550109863, 13.695182800292969, 14.348421096801758, 15.001659393310547, 15.654897689819336, 16.308135986328125, 16.961374282836914, 17.614612579345703, 18.267852783203125, 18.921091079711914, 19.574329376220703, 20.227567672729492]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 13.0, 6.0, 20.0, 40.0, 60.0, 142.0, 229.0, 442.0, 967.0, 2304.0, 7212.0, 29721.0, 362122.0, 3731229.0, 44657.0, 9797.0, 3038.0, 1168.0, 528.0, 276.0, 124.0, 63.0, 53.0, 23.0, 13.0, 8.0, 6.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0], "bins": [-4.078125, -3.9835357666015625, -3.888946533203125, -3.7943572998046875, -3.69976806640625, -3.6051788330078125, -3.510589599609375, -3.4160003662109375, -3.3214111328125, -3.2268218994140625, -3.132232666015625, -3.0376434326171875, -2.94305419921875, -2.8484649658203125, -2.753875732421875, -2.6592864990234375, -2.564697265625, -2.4701080322265625, -2.375518798828125, -2.2809295654296875, -2.18634033203125, -2.0917510986328125, -1.997161865234375, -1.9025726318359375, -1.8079833984375, -1.7133941650390625, -1.618804931640625, -1.5242156982421875, -1.42962646484375, -1.3350372314453125, -1.240447998046875, -1.1458587646484375, -1.05126953125, -0.9566802978515625, -0.862091064453125, -0.7675018310546875, -0.67291259765625, -0.5783233642578125, -0.483734130859375, -0.3891448974609375, -0.2945556640625, -0.1999664306640625, -0.105377197265625, -0.0107879638671875, 0.08380126953125, 0.1783905029296875, 0.272979736328125, 0.3675689697265625, 0.462158203125, 0.5567474365234375, 0.651336669921875, 0.7459259033203125, 0.84051513671875, 0.9351043701171875, 1.029693603515625, 1.1242828369140625, 1.2188720703125, 1.3134613037109375, 1.408050537109375, 1.5026397705078125, 1.59722900390625, 1.6918182373046875, 1.786407470703125, 1.8809967041015625, 1.9755859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 8.0, 8.0, 7.0, 14.0, 16.0, 11.0, 23.0, 18.0, 36.0, 43.0, 44.0, 62.0, 48.0, 64.0, 50.0, 58.0, 53.0, 50.0, 60.0, 48.0, 50.0, 39.0, 40.0, 28.0, 24.0, 21.0, 21.0, 14.0, 13.0, 9.0, 3.0, 3.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9501953125, -0.9193878173828125, -0.888580322265625, -0.8577728271484375, -0.82696533203125, -0.7961578369140625, -0.765350341796875, -0.7345428466796875, -0.7037353515625, -0.6729278564453125, -0.642120361328125, -0.6113128662109375, -0.58050537109375, -0.5496978759765625, -0.518890380859375, -0.4880828857421875, -0.457275390625, -0.4264678955078125, -0.395660400390625, -0.3648529052734375, -0.33404541015625, -0.3032379150390625, -0.272430419921875, -0.2416229248046875, -0.2108154296875, -0.1800079345703125, -0.149200439453125, -0.1183929443359375, -0.08758544921875, -0.0567779541015625, -0.025970458984375, 0.0048370361328125, 0.03564453125, 0.0664520263671875, 0.097259521484375, 0.1280670166015625, 0.15887451171875, 0.1896820068359375, 0.220489501953125, 0.2512969970703125, 0.2821044921875, 0.3129119873046875, 0.343719482421875, 0.3745269775390625, 0.40533447265625, 0.4361419677734375, 0.466949462890625, 0.4977569580078125, 0.528564453125, 0.5593719482421875, 0.590179443359375, 0.6209869384765625, 0.65179443359375, 0.6826019287109375, 0.713409423828125, 0.7442169189453125, 0.7750244140625, 0.8058319091796875, 0.836639404296875, 0.8674468994140625, 0.89825439453125, 0.9290618896484375, 0.959869384765625, 0.9906768798828125, 1.021484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 4.0, 15.0, 20.0, 22.0, 39.0, 51.0, 75.0, 91.0, 142.0, 181.0, 271.0, 370.0, 544.0, 749.0, 1145.0, 1546.0, 2661.0, 4332.0, 7246.0, 13279.0, 28076.0, 78881.0, 459419.0, 3359636.0, 149589.0, 42923.0, 18242.0, 9288.0, 5491.0, 3403.0, 2076.0, 1423.0, 880.0, 641.0, 429.0, 352.0, 225.0, 135.0, 104.0, 80.0, 52.0, 37.0, 35.0, 18.0, 15.0, 12.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.001953125, -0.9698638916015625, -0.937774658203125, -0.9056854248046875, -0.87359619140625, -0.8415069580078125, -0.809417724609375, -0.7773284912109375, -0.7452392578125, -0.7131500244140625, -0.681060791015625, -0.6489715576171875, -0.61688232421875, -0.5847930908203125, -0.552703857421875, -0.5206146240234375, -0.488525390625, -0.4564361572265625, -0.424346923828125, -0.3922576904296875, -0.36016845703125, -0.3280792236328125, -0.295989990234375, -0.2639007568359375, -0.2318115234375, -0.1997222900390625, -0.167633056640625, -0.1355438232421875, -0.10345458984375, -0.0713653564453125, -0.039276123046875, -0.0071868896484375, 0.02490234375, 0.0569915771484375, 0.089080810546875, 0.1211700439453125, 0.15325927734375, 0.1853485107421875, 0.217437744140625, 0.2495269775390625, 0.2816162109375, 0.3137054443359375, 0.345794677734375, 0.3778839111328125, 0.40997314453125, 0.4420623779296875, 0.474151611328125, 0.5062408447265625, 0.538330078125, 0.5704193115234375, 0.602508544921875, 0.6345977783203125, 0.66668701171875, 0.6987762451171875, 0.730865478515625, 0.7629547119140625, 0.7950439453125, 0.8271331787109375, 0.859222412109375, 0.8913116455078125, 0.92340087890625, 0.9554901123046875, 0.987579345703125, 1.0196685791015625, 1.0517578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 16.0, 11.0, 25.0, 35.0, 58.0, 107.0, 339.0, 2773.0, 363.0, 138.0, 60.0, 38.0, 21.0, 16.0, 12.0, 6.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.440673828125, -0.4275054931640625, -0.414337158203125, -0.4011688232421875, -0.38800048828125, -0.3748321533203125, -0.361663818359375, -0.3484954833984375, -0.3353271484375, -0.3221588134765625, -0.308990478515625, -0.2958221435546875, -0.28265380859375, -0.2694854736328125, -0.256317138671875, -0.2431488037109375, -0.22998046875, -0.2168121337890625, -0.203643798828125, -0.1904754638671875, -0.17730712890625, -0.1641387939453125, -0.150970458984375, -0.1378021240234375, -0.1246337890625, -0.1114654541015625, -0.098297119140625, -0.0851287841796875, -0.07196044921875, -0.0587921142578125, -0.045623779296875, -0.0324554443359375, -0.019287109375, -0.0061187744140625, 0.007049560546875, 0.0202178955078125, 0.03338623046875, 0.0465545654296875, 0.059722900390625, 0.0728912353515625, 0.0860595703125, 0.0992279052734375, 0.112396240234375, 0.1255645751953125, 0.13873291015625, 0.1519012451171875, 0.165069580078125, 0.1782379150390625, 0.19140625, 0.2045745849609375, 0.217742919921875, 0.2309112548828125, 0.24407958984375, 0.2572479248046875, 0.270416259765625, 0.2835845947265625, 0.2967529296875, 0.3099212646484375, 0.323089599609375, 0.3362579345703125, 0.34942626953125, 0.3625946044921875, 0.375762939453125, 0.3889312744140625, 0.402099609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 39.0, 62.0, 133.0, 186.0, 241.0, 162.0, 88.0, 45.0, 23.0, 12.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8826694488525391, -0.786632776260376, -0.6905961036682129, -0.5945594310760498, -0.4985227584838867, -0.40248608589172363, -0.30644941329956055, -0.21041274070739746, -0.11437606811523438, -0.01833939552307129, 0.0776972770690918, 0.17373394966125488, 0.26977062225341797, 0.36580729484558105, 0.46184396743774414, 0.5578806400299072, 0.6539173126220703, 0.7499539852142334, 0.8459906578063965, 0.9420273303985596, 1.0380640029907227, 1.1341006755828857, 1.2301373481750488, 1.326174020767212, 1.422210693359375, 1.518247365951538, 1.6142840385437012, 1.7103207111358643, 1.8063573837280273, 1.9023940563201904, 1.9984307289123535, 2.0944674015045166, 2.1905040740966797, 2.2865407466888428, 2.382577419281006, 2.478614091873169, 2.574650764465332, 2.670687437057495, 2.766724109649658, 2.8627607822418213, 2.9587974548339844, 3.0548341274261475, 3.1508708000183105, 3.2469074726104736, 3.3429441452026367, 3.4389808177948, 3.535017490386963, 3.631054162979126, 3.727090835571289, 3.823127508163452, 3.9191641807556152, 4.015200614929199, 4.111237525939941, 4.207274436950684, 4.303310871124268, 4.399347305297852, 4.495384216308594, 4.591421127319336, 4.68745756149292, 4.783493995666504, 4.879530906677246, 4.975567817687988, 5.071604251861572, 5.167640686035156, 5.263677597045898]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 6.0, 12.0, 12.0, 9.0, 15.0, 20.0, 21.0, 34.0, 26.0, 26.0, 28.0, 42.0, 37.0, 40.0, 49.0, 45.0, 41.0, 42.0, 56.0, 36.0, 39.0, 37.0, 37.0, 25.0, 27.0, 17.0, 32.0, 34.0, 30.0, 25.0, 17.0, 23.0, 11.0, 18.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3344950675964355, -1.2939614057540894, -1.2534278631210327, -1.2128942012786865, -1.1723606586456299, -1.1318269968032837, -1.091293454170227, -1.0507597923278809, -1.0102262496948242, -0.9696926474571228, -0.9291590452194214, -0.88862544298172, -0.8480918407440186, -0.8075582385063171, -0.7670246362686157, -0.7264909744262695, -0.6859573721885681, -0.6454237699508667, -0.6048901677131653, -0.5643565654754639, -0.5238229632377625, -0.48328936100006104, -0.44275572896003723, -0.4022221267223358, -0.3616885244846344, -0.321154922246933, -0.28062132000923157, -0.24008770287036896, -0.19955410063266754, -0.15902049839496613, -0.11848688125610352, -0.0779532790184021, -0.037419676780700684, 0.003113929182291031, 0.043647535145282745, 0.08418114483356476, 0.12471474707126617, 0.1652483493089676, 0.2057819664478302, 0.24631556868553162, 0.28684917092323303, 0.32738277316093445, 0.36791637539863586, 0.40845000743865967, 0.4489836096763611, 0.4895172119140625, 0.5300508141517639, 0.5705844163894653, 0.6111180186271667, 0.6516516208648682, 0.6921852231025696, 0.732718825340271, 0.7732524275779724, 0.8137860298156738, 0.85431969165802, 0.8948532342910767, 0.9353868961334229, 0.9759204983711243, 1.0164541006088257, 1.0569877624511719, 1.0975213050842285, 1.1380549669265747, 1.1785885095596313, 1.2191221714019775, 1.2596557140350342]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 13.0, 17.0, 21.0, 29.0, 64.0, 83.0, 142.0, 281.0, 515.0, 943.0, 2114.0, 4939.0, 13401.0, 42529.0, 151439.0, 387435.0, 305036.0, 96011.0, 27403.0, 9179.0, 3615.0, 1610.0, 787.0, 374.0, 213.0, 128.0, 84.0, 41.0, 32.0, 23.0, 11.0, 8.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.541015625, -2.463592529296875, -2.38616943359375, -2.308746337890625, -2.2313232421875, -2.153900146484375, -2.07647705078125, -1.999053955078125, -1.921630859375, -1.844207763671875, -1.76678466796875, -1.689361572265625, -1.6119384765625, -1.534515380859375, -1.45709228515625, -1.379669189453125, -1.30224609375, -1.224822998046875, -1.14739990234375, -1.069976806640625, -0.9925537109375, -0.915130615234375, -0.83770751953125, -0.760284423828125, -0.682861328125, -0.605438232421875, -0.52801513671875, -0.450592041015625, -0.3731689453125, -0.295745849609375, -0.21832275390625, -0.140899658203125, -0.0634765625, 0.013946533203125, 0.09136962890625, 0.168792724609375, 0.2462158203125, 0.323638916015625, 0.40106201171875, 0.478485107421875, 0.555908203125, 0.633331298828125, 0.71075439453125, 0.788177490234375, 0.8656005859375, 0.943023681640625, 1.02044677734375, 1.097869873046875, 1.17529296875, 1.252716064453125, 1.33013916015625, 1.407562255859375, 1.4849853515625, 1.562408447265625, 1.63983154296875, 1.717254638671875, 1.794677734375, 1.872100830078125, 1.94952392578125, 2.026947021484375, 2.1043701171875, 2.181793212890625, 2.25921630859375, 2.336639404296875, 2.4140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 9.0, 24.0, 17.0, 28.0, 26.0, 34.0, 44.0, 47.0, 54.0, 52.0, 47.0, 57.0, 59.0, 68.0, 65.0, 51.0, 37.0, 43.0, 39.0, 41.0, 20.0, 24.0, 23.0, 14.0, 18.0, 12.0, 5.0, 2.0, 5.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94677734375, -0.9155807495117188, -0.8843841552734375, -0.8531875610351562, -0.821990966796875, -0.7907943725585938, -0.7595977783203125, -0.7284011840820312, -0.69720458984375, -0.6660079956054688, -0.6348114013671875, -0.6036148071289062, -0.572418212890625, -0.5412216186523438, -0.5100250244140625, -0.47882843017578125, -0.4476318359375, -0.41643524169921875, -0.3852386474609375, -0.35404205322265625, -0.322845458984375, -0.29164886474609375, -0.2604522705078125, -0.22925567626953125, -0.19805908203125, -0.16686248779296875, -0.1356658935546875, -0.10446929931640625, -0.073272705078125, -0.04207611083984375, -0.0108795166015625, 0.02031707763671875, 0.051513671875, 0.08271026611328125, 0.1139068603515625, 0.14510345458984375, 0.176300048828125, 0.20749664306640625, 0.2386932373046875, 0.26988983154296875, 0.30108642578125, 0.33228302001953125, 0.3634796142578125, 0.39467620849609375, 0.425872802734375, 0.45706939697265625, 0.4882659912109375, 0.5194625854492188, 0.5506591796875, 0.5818557739257812, 0.6130523681640625, 0.6442489624023438, 0.675445556640625, 0.7066421508789062, 0.7378387451171875, 0.7690353393554688, 0.80023193359375, 0.8314285278320312, 0.8626251220703125, 0.8938217163085938, 0.925018310546875, 0.9562149047851562, 0.9874114990234375, 1.0186080932617188, 1.0498046875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 7.0, 12.0, 9.0, 19.0, 23.0, 38.0, 51.0, 95.0, 225.0, 448.0, 1317.0, 5193.0, 31461.0, 438206.0, 526591.0, 36745.0, 5665.0, 1502.0, 473.0, 207.0, 100.0, 57.0, 33.0, 17.0, 16.0, 10.0, 6.0, 10.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.111083984375, -4.94091796875, -4.770751953125, -4.6005859375, -4.430419921875, -4.26025390625, -4.090087890625, -3.919921875, -3.749755859375, -3.57958984375, -3.409423828125, -3.2392578125, -3.069091796875, -2.89892578125, -2.728759765625, -2.55859375, -2.388427734375, -2.21826171875, -2.048095703125, -1.8779296875, -1.707763671875, -1.53759765625, -1.367431640625, -1.197265625, -1.027099609375, -0.85693359375, -0.686767578125, -0.5166015625, -0.346435546875, -0.17626953125, -0.006103515625, 0.1640625, 0.334228515625, 0.50439453125, 0.674560546875, 0.8447265625, 1.014892578125, 1.18505859375, 1.355224609375, 1.525390625, 1.695556640625, 1.86572265625, 2.035888671875, 2.2060546875, 2.376220703125, 2.54638671875, 2.716552734375, 2.88671875, 3.056884765625, 3.22705078125, 3.397216796875, 3.5673828125, 3.737548828125, 3.90771484375, 4.077880859375, 4.248046875, 4.418212890625, 4.58837890625, 4.758544921875, 4.9287109375, 5.098876953125, 5.26904296875, 5.439208984375, 5.609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 8.0, 8.0, 18.0, 11.0, 20.0, 23.0, 21.0, 43.0, 33.0, 42.0, 38.0, 47.0, 56.0, 56.0, 55.0, 57.0, 62.0, 51.0, 46.0, 51.0, 36.0, 39.0, 31.0, 36.0, 26.0, 20.0, 14.0, 11.0, 4.0, 6.0, 8.0, 1.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.46978759765625, -6.2755126953125, -6.08123779296875, -5.886962890625, -5.69268798828125, -5.4984130859375, -5.30413818359375, -5.10986328125, -4.91558837890625, -4.7213134765625, -4.52703857421875, -4.332763671875, -4.13848876953125, -3.9442138671875, -3.74993896484375, -3.5556640625, -3.36138916015625, -3.1671142578125, -2.97283935546875, -2.778564453125, -2.58428955078125, -2.3900146484375, -2.19573974609375, -2.00146484375, -1.80718994140625, -1.6129150390625, -1.41864013671875, -1.224365234375, -1.03009033203125, -0.8358154296875, -0.64154052734375, -0.447265625, -0.25299072265625, -0.0587158203125, 0.13555908203125, 0.329833984375, 0.52410888671875, 0.7183837890625, 0.91265869140625, 1.10693359375, 1.30120849609375, 1.4954833984375, 1.68975830078125, 1.884033203125, 2.07830810546875, 2.2725830078125, 2.46685791015625, 2.6611328125, 2.85540771484375, 3.0496826171875, 3.24395751953125, 3.438232421875, 3.63250732421875, 3.8267822265625, 4.02105712890625, 4.21533203125, 4.40960693359375, 4.6038818359375, 4.79815673828125, 4.992431640625, 5.18670654296875, 5.3809814453125, 5.57525634765625, 5.76953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 9.0, 9.0, 17.0, 9.0, 22.0, 37.0, 39.0, 58.0, 110.0, 193.0, 399.0, 1009.0, 3780.0, 39646.0, 920731.0, 75131.0, 5129.0, 1216.0, 450.0, 191.0, 120.0, 59.0, 57.0, 32.0, 18.0, 13.0, 12.0, 15.0, 3.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.51171875, -3.40716552734375, -3.3026123046875, -3.19805908203125, -3.093505859375, -2.98895263671875, -2.8843994140625, -2.77984619140625, -2.67529296875, -2.57073974609375, -2.4661865234375, -2.36163330078125, -2.257080078125, -2.15252685546875, -2.0479736328125, -1.94342041015625, -1.8388671875, -1.73431396484375, -1.6297607421875, -1.52520751953125, -1.420654296875, -1.31610107421875, -1.2115478515625, -1.10699462890625, -1.00244140625, -0.89788818359375, -0.7933349609375, -0.68878173828125, -0.584228515625, -0.47967529296875, -0.3751220703125, -0.27056884765625, -0.166015625, -0.06146240234375, 0.0430908203125, 0.14764404296875, 0.252197265625, 0.35675048828125, 0.4613037109375, 0.56585693359375, 0.67041015625, 0.77496337890625, 0.8795166015625, 0.98406982421875, 1.088623046875, 1.19317626953125, 1.2977294921875, 1.40228271484375, 1.5068359375, 1.61138916015625, 1.7159423828125, 1.82049560546875, 1.925048828125, 2.02960205078125, 2.1341552734375, 2.23870849609375, 2.34326171875, 2.44781494140625, 2.5523681640625, 2.65692138671875, 2.761474609375, 2.86602783203125, 2.9705810546875, 3.07513427734375, 3.1796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 16.0, 31.0, 41.0, 87.0, 121.0, 153.0, 150.0, 118.0, 105.0, 71.0, 44.0, 26.0, 12.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004963874816894531, -0.000485224649310112, -0.0004740618169307709, -0.00046289898455142975, -0.0004517361521720886, -0.0004405733197927475, -0.00042941048741340637, -0.00041824765503406525, -0.0004070848226547241, -0.000395921990275383, -0.00038475915789604187, -0.00037359632551670074, -0.0003624334931373596, -0.0003512706607580185, -0.00034010782837867737, -0.00032894499599933624, -0.0003177821636199951, -0.000306619331240654, -0.00029545649886131287, -0.00028429366648197174, -0.0002731308341026306, -0.0002619680017232895, -0.00025080516934394836, -0.00023964233696460724, -0.0002284795045852661, -0.000217316672205925, -0.00020615383982658386, -0.00019499100744724274, -0.0001838281750679016, -0.00017266534268856049, -0.00016150251030921936, -0.00015033967792987823, -0.0001391768455505371, -0.00012801401317119598, -0.00011685118079185486, -0.00010568834841251373, -9.452551603317261e-05, -8.336268365383148e-05, -7.219985127449036e-05, -6.103701889514923e-05, -4.9874186515808105e-05, -3.871135413646698e-05, -2.7548521757125854e-05, -1.638568937778473e-05, -5.2228569984436035e-06, 5.939975380897522e-06, 1.7102807760238647e-05, 2.8265640139579773e-05, 3.94284725189209e-05, 5.0591304898262024e-05, 6.175413727760315e-05, 7.291696965694427e-05, 8.40798020362854e-05, 9.524263441562653e-05, 0.00010640546679496765, 0.00011756829917430878, 0.0001287311315536499, 0.00013989396393299103, 0.00015105679631233215, 0.00016221962869167328, 0.0001733824610710144, 0.00018454529345035553, 0.00019570812582969666, 0.00020687095820903778, 0.0002180337905883789]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 4.0, 14.0, 21.0, 38.0, 80.0, 164.0, 363.0, 921.0, 3811.0, 32183.0, 792330.0, 205679.0, 10019.0, 1882.0, 588.0, 243.0, 87.0, 49.0, 25.0, 21.0, 16.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.455352783203125, -2.37554931640625, -2.295745849609375, -2.2159423828125, -2.136138916015625, -2.05633544921875, -1.976531982421875, -1.896728515625, -1.816925048828125, -1.73712158203125, -1.657318115234375, -1.5775146484375, -1.497711181640625, -1.41790771484375, -1.338104248046875, -1.25830078125, -1.178497314453125, -1.09869384765625, -1.018890380859375, -0.9390869140625, -0.859283447265625, -0.77947998046875, -0.699676513671875, -0.619873046875, -0.540069580078125, -0.46026611328125, -0.380462646484375, -0.3006591796875, -0.220855712890625, -0.14105224609375, -0.061248779296875, 0.0185546875, 0.098358154296875, 0.17816162109375, 0.257965087890625, 0.3377685546875, 0.417572021484375, 0.49737548828125, 0.577178955078125, 0.656982421875, 0.736785888671875, 0.81658935546875, 0.896392822265625, 0.9761962890625, 1.055999755859375, 1.13580322265625, 1.215606689453125, 1.29541015625, 1.375213623046875, 1.45501708984375, 1.534820556640625, 1.6146240234375, 1.694427490234375, 1.77423095703125, 1.854034423828125, 1.933837890625, 2.013641357421875, 2.09344482421875, 2.173248291015625, 2.2530517578125, 2.332855224609375, 2.41265869140625, 2.492462158203125, 2.572265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 3.0, 11.0, 14.0, 22.0, 38.0, 62.0, 109.0, 182.0, 214.0, 139.0, 90.0, 36.0, 24.0, 23.0, 10.0, 7.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.681640625, -3.555694580078125, -3.42974853515625, -3.303802490234375, -3.1778564453125, -3.051910400390625, -2.92596435546875, -2.800018310546875, -2.674072265625, -2.548126220703125, -2.42218017578125, -2.296234130859375, -2.1702880859375, -2.044342041015625, -1.91839599609375, -1.792449951171875, -1.66650390625, -1.540557861328125, -1.41461181640625, -1.288665771484375, -1.1627197265625, -1.036773681640625, -0.91082763671875, -0.784881591796875, -0.658935546875, -0.532989501953125, -0.40704345703125, -0.281097412109375, -0.1551513671875, -0.029205322265625, 0.09674072265625, 0.222686767578125, 0.3486328125, 0.474578857421875, 0.60052490234375, 0.726470947265625, 0.8524169921875, 0.978363037109375, 1.10430908203125, 1.230255126953125, 1.356201171875, 1.482147216796875, 1.60809326171875, 1.734039306640625, 1.8599853515625, 1.985931396484375, 2.11187744140625, 2.237823486328125, 2.36376953125, 2.489715576171875, 2.61566162109375, 2.741607666015625, 2.8675537109375, 2.993499755859375, 3.11944580078125, 3.245391845703125, 3.371337890625, 3.497283935546875, 3.62322998046875, 3.749176025390625, 3.8751220703125, 4.001068115234375, 4.12701416015625, 4.252960205078125, 4.37890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 16.0, 30.0, 33.0, 60.0, 104.0, 119.0, 175.0, 170.0, 107.0, 73.0, 52.0, 27.0, 13.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.422245025634766, -20.298860549926758, -19.175474166870117, -18.05208969116211, -16.92870330810547, -15.805318832397461, -14.681934356689453, -13.558548927307129, -12.435163497924805, -11.31177806854248, -10.188392639160156, -9.065008163452148, -7.941622734069824, -6.8182373046875, -5.694852352142334, -4.571467399597168, -3.4480819702148438, -2.3246967792510986, -1.2013115882873535, -0.0779263973236084, 1.0454587936401367, 2.168844223022461, 3.292229175567627, 4.415614128112793, 5.538999557495117, 6.662384986877441, 7.785769939422607, 8.909154891967773, 10.032540321350098, 11.155925750732422, 12.27931022644043, 13.402695655822754, 14.526081085205078, 15.649466514587402, 16.772851943969727, 17.896236419677734, 19.019622802734375, 20.143007278442383, 21.26639175415039, 22.38977813720703, 23.51316261291504, 24.636547088623047, 25.759933471679688, 26.883317947387695, 28.006702423095703, 29.130088806152344, 30.25347328186035, 31.37685775756836, 32.500244140625, 33.62363052368164, 34.747013092041016, 35.870399475097656, 36.9937858581543, 38.11717224121094, 39.24055480957031, 40.36394119262695, 41.487327575683594, 42.610713958740234, 43.73409652709961, 44.85748291015625, 45.98086929321289, 47.10425567626953, 48.227638244628906, 49.35102462768555, 50.47440719604492]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 5.0, 9.0, 11.0, 16.0, 27.0, 18.0, 23.0, 36.0, 39.0, 64.0, 76.0, 78.0, 79.0, 85.0, 77.0, 66.0, 48.0, 55.0, 37.0, 36.0, 24.0, 22.0, 17.0, 9.0, 11.0, 10.0, 7.0, 4.0, 5.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.73468017578125, -45.36898422241211, -44.00328826904297, -42.63759231567383, -41.27189636230469, -39.90619659423828, -38.54050064086914, -37.1748046875, -35.80910873413086, -34.44341278076172, -33.07771682739258, -31.712018966674805, -30.346323013305664, -28.980627059936523, -27.61492919921875, -26.24923324584961, -24.88353729248047, -23.517841339111328, -22.152145385742188, -20.786447525024414, -19.420751571655273, -18.055055618286133, -16.68935775756836, -15.323661804199219, -13.957965850830078, -12.592269897460938, -11.22657299041748, -9.860876083374023, -8.495180130004883, -7.129483699798584, -5.763787269592285, -4.398090362548828, -3.032398223876953, -1.6667017936706543, -0.30100536346435547, 1.0646910667419434, 2.430387496948242, 3.796083927154541, 5.16178035736084, 6.527477264404297, 7.8931732177734375, 9.258869171142578, 10.624566078186035, 11.990262985229492, 13.355958938598633, 14.721654891967773, 16.087352752685547, 17.453048706054688, 18.818744659423828, 20.18444061279297, 21.55013656616211, 22.915834426879883, 24.281530380249023, 25.647226333618164, 27.012924194335938, 28.378620147705078, 29.74431610107422, 31.11001205444336, 32.4757080078125, 33.84140396118164, 35.20709991455078, 36.57279968261719, 37.93849563598633, 39.30419158935547, 40.66988754272461]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 12.0, 7.0, 11.0, 24.0, 43.0, 53.0, 105.0, 143.0, 193.0, 457.0, 962.0, 2006.0, 5521.0, 20177.0, 157249.0, 3884740.0, 98796.0, 15559.0, 4581.0, 1725.0, 813.0, 397.0, 238.0, 163.0, 88.0, 68.0, 35.0, 32.0, 18.0, 18.0, 8.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.330078125, -3.2205810546875, -3.111083984375, -3.0015869140625, -2.89208984375, -2.7825927734375, -2.673095703125, -2.5635986328125, -2.4541015625, -2.3446044921875, -2.235107421875, -2.1256103515625, -2.01611328125, -1.9066162109375, -1.797119140625, -1.6876220703125, -1.578125, -1.4686279296875, -1.359130859375, -1.2496337890625, -1.14013671875, -1.0306396484375, -0.921142578125, -0.8116455078125, -0.7021484375, -0.5926513671875, -0.483154296875, -0.3736572265625, -0.26416015625, -0.1546630859375, -0.045166015625, 0.0643310546875, 0.173828125, 0.2833251953125, 0.392822265625, 0.5023193359375, 0.61181640625, 0.7213134765625, 0.830810546875, 0.9403076171875, 1.0498046875, 1.1593017578125, 1.268798828125, 1.3782958984375, 1.48779296875, 1.5972900390625, 1.706787109375, 1.8162841796875, 1.92578125, 2.0352783203125, 2.144775390625, 2.2542724609375, 2.36376953125, 2.4732666015625, 2.582763671875, 2.6922607421875, 2.8017578125, 2.9112548828125, 3.020751953125, 3.1302490234375, 3.23974609375, 3.3492431640625, 3.458740234375, 3.5682373046875, 3.677734375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 13.0, 10.0, 22.0, 25.0, 29.0, 46.0, 55.0, 60.0, 80.0, 91.0, 85.0, 88.0, 62.0, 55.0, 63.0, 47.0, 37.0, 31.0, 17.0, 18.0, 11.0, 13.0, 5.0, 3.0, 4.0, 3.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.5028839111328125, -1.454010009765625, -1.4051361083984375, -1.35626220703125, -1.3073883056640625, -1.258514404296875, -1.2096405029296875, -1.1607666015625, -1.1118927001953125, -1.063018798828125, -1.0141448974609375, -0.96527099609375, -0.9163970947265625, -0.867523193359375, -0.8186492919921875, -0.769775390625, -0.7209014892578125, -0.672027587890625, -0.6231536865234375, -0.57427978515625, -0.5254058837890625, -0.476531982421875, -0.4276580810546875, -0.3787841796875, -0.3299102783203125, -0.281036376953125, -0.2321624755859375, -0.18328857421875, -0.1344146728515625, -0.085540771484375, -0.0366668701171875, 0.01220703125, 0.0610809326171875, 0.109954833984375, 0.1588287353515625, 0.20770263671875, 0.2565765380859375, 0.305450439453125, 0.3543243408203125, 0.4031982421875, 0.4520721435546875, 0.500946044921875, 0.5498199462890625, 0.59869384765625, 0.6475677490234375, 0.696441650390625, 0.7453155517578125, 0.794189453125, 0.8430633544921875, 0.891937255859375, 0.9408111572265625, 0.98968505859375, 1.0385589599609375, 1.087432861328125, 1.1363067626953125, 1.1851806640625, 1.2340545654296875, 1.282928466796875, 1.3318023681640625, 1.38067626953125, 1.4295501708984375, 1.478424072265625, 1.5272979736328125, 1.576171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 5.0, 18.0, 21.0, 25.0, 39.0, 67.0, 100.0, 148.0, 259.0, 393.0, 670.0, 1311.0, 2680.0, 6134.0, 15619.0, 49210.0, 248084.0, 3527426.0, 262869.0, 51281.0, 15946.0, 6205.0, 2694.0, 1277.0, 744.0, 414.0, 250.0, 131.0, 72.0, 60.0, 42.0, 24.0, 17.0, 19.0, 10.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.400390625, -2.330841064453125, -2.26129150390625, -2.191741943359375, -2.1221923828125, -2.052642822265625, -1.98309326171875, -1.913543701171875, -1.843994140625, -1.774444580078125, -1.70489501953125, -1.635345458984375, -1.5657958984375, -1.496246337890625, -1.42669677734375, -1.357147216796875, -1.28759765625, -1.218048095703125, -1.14849853515625, -1.078948974609375, -1.0093994140625, -0.939849853515625, -0.87030029296875, -0.800750732421875, -0.731201171875, -0.661651611328125, -0.59210205078125, -0.522552490234375, -0.4530029296875, -0.383453369140625, -0.31390380859375, -0.244354248046875, -0.1748046875, -0.105255126953125, -0.03570556640625, 0.033843994140625, 0.1033935546875, 0.172943115234375, 0.24249267578125, 0.312042236328125, 0.381591796875, 0.451141357421875, 0.52069091796875, 0.590240478515625, 0.6597900390625, 0.729339599609375, 0.79888916015625, 0.868438720703125, 0.93798828125, 1.007537841796875, 1.07708740234375, 1.146636962890625, 1.2161865234375, 1.285736083984375, 1.35528564453125, 1.424835205078125, 1.494384765625, 1.563934326171875, 1.63348388671875, 1.703033447265625, 1.7725830078125, 1.842132568359375, 1.91168212890625, 1.981231689453125, 2.05078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 12.0, 5.0, 15.0, 45.0, 52.0, 108.0, 184.0, 638.0, 2420.0, 286.0, 126.0, 53.0, 43.0, 24.0, 16.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7998046875, -0.770416259765625, -0.74102783203125, -0.711639404296875, -0.6822509765625, -0.652862548828125, -0.62347412109375, -0.594085693359375, -0.564697265625, -0.535308837890625, -0.50592041015625, -0.476531982421875, -0.4471435546875, -0.417755126953125, -0.38836669921875, -0.358978271484375, -0.32958984375, -0.300201416015625, -0.27081298828125, -0.241424560546875, -0.2120361328125, -0.182647705078125, -0.15325927734375, -0.123870849609375, -0.094482421875, -0.065093994140625, -0.03570556640625, -0.006317138671875, 0.0230712890625, 0.052459716796875, 0.08184814453125, 0.111236572265625, 0.140625, 0.170013427734375, 0.19940185546875, 0.228790283203125, 0.2581787109375, 0.287567138671875, 0.31695556640625, 0.346343994140625, 0.375732421875, 0.405120849609375, 0.43450927734375, 0.463897705078125, 0.4932861328125, 0.522674560546875, 0.55206298828125, 0.581451416015625, 0.61083984375, 0.640228271484375, 0.66961669921875, 0.699005126953125, 0.7283935546875, 0.757781982421875, 0.78717041015625, 0.816558837890625, 0.845947265625, 0.875335693359375, 0.90472412109375, 0.934112548828125, 0.9635009765625, 0.992889404296875, 1.02227783203125, 1.051666259765625, 1.0810546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 8.0, 15.0, 57.0, 141.0, 251.0, 294.0, 165.0, 53.0, 17.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.483149528503418, -2.2165772914886475, -1.9500048160552979, -1.6834325790405273, -1.4168602228164673, -1.1502878665924072, -0.8837156295776367, -0.6171432733535767, -0.3505709171295166, -0.08399859070777893, 0.18257373571395874, 0.449146032333374, 0.7157183885574341, 0.9822907447814941, 1.2488629817962646, 1.5154353380203247, 1.7820076942443848, 2.0485799312591553, 2.315152406692505, 2.5817246437072754, 2.848297119140625, 3.1148693561553955, 3.381441593170166, 3.6480140686035156, 3.914586305618286, 4.181158542633057, 4.447731018066406, 4.714303016662598, 4.980875492095947, 5.247447967529297, 5.514019966125488, 5.780592441558838, 6.0471649169921875, 6.313737392425537, 6.5803093910217285, 6.846881866455078, 7.113454341888428, 7.380026817321777, 7.646598815917969, 7.913171291351318, 8.179743766784668, 8.44631576538086, 8.712888717651367, 8.979460716247559, 9.24603271484375, 9.512605667114258, 9.77917766571045, 10.04574966430664, 10.312322616577148, 10.57889461517334, 10.845467567443848, 11.112039566040039, 11.37861156463623, 11.645184516906738, 11.91175651550293, 12.178328514099121, 12.444900512695312, 12.711472511291504, 12.978045463562012, 13.244617462158203, 13.511189460754395, 13.777762413024902, 14.044334411621094, 14.310906410217285, 14.577479362487793]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 9.0, 9.0, 13.0, 12.0, 26.0, 22.0, 20.0, 29.0, 35.0, 32.0, 38.0, 48.0, 43.0, 40.0, 47.0, 50.0, 49.0, 34.0, 35.0, 49.0, 51.0, 36.0, 46.0, 30.0, 39.0, 23.0, 30.0, 18.0, 13.0, 16.0, 11.0, 10.0, 4.0, 5.0, 6.0, 6.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2696189880371094, -2.195716619491577, -2.121814250946045, -2.0479118824005127, -1.9740095138549805, -1.9001071453094482, -1.8262046575546265, -1.7523022890090942, -1.678399920463562, -1.6044975519180298, -1.5305951833724976, -1.4566928148269653, -1.3827903270721436, -1.3088879585266113, -1.234985589981079, -1.1610832214355469, -1.0871808528900146, -1.0132784843444824, -0.9393761157989502, -0.8654736876487732, -0.791571319103241, -0.7176689505577087, -0.6437665224075317, -0.5698641538619995, -0.4959617853164673, -0.42205941677093506, -0.34815701842308044, -0.27425462007522583, -0.2003522515296936, -0.12644988298416138, -0.05254748463630676, 0.02135491371154785, 0.09525728225708008, 0.1691596657037735, 0.24306204915046692, 0.31696444749832153, 0.39086681604385376, 0.464769184589386, 0.538671612739563, 0.6125739812850952, 0.6864763498306274, 0.7603787183761597, 0.8342810869216919, 0.9081835150718689, 0.9820858836174011, 1.0559883117675781, 1.1298906803131104, 1.2037930488586426, 1.2776954174041748, 1.351597785949707, 1.4255001544952393, 1.4994025230407715, 1.5733048915863037, 1.647207260131836, 1.7211097478866577, 1.79501211643219, 1.8689144849777222, 1.9428168535232544, 2.016719341278076, 2.0906217098236084, 2.1645240783691406, 2.238426446914673, 2.312328815460205, 2.3862311840057373, 2.4601335525512695]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 5.0, 11.0, 29.0, 41.0, 83.0, 114.0, 239.0, 420.0, 1009.0, 2546.0, 7911.0, 30576.0, 158404.0, 507119.0, 268968.0, 52860.0, 12087.0, 3589.0, 1336.0, 587.0, 262.0, 137.0, 76.0, 56.0, 29.0, 17.0, 14.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.44970703125, -2.3642578125, -2.27880859375, -2.193359375, -2.10791015625, -2.0224609375, -1.93701171875, -1.8515625, -1.76611328125, -1.6806640625, -1.59521484375, -1.509765625, -1.42431640625, -1.3388671875, -1.25341796875, -1.16796875, -1.08251953125, -0.9970703125, -0.91162109375, -0.826171875, -0.74072265625, -0.6552734375, -0.56982421875, -0.484375, -0.39892578125, -0.3134765625, -0.22802734375, -0.142578125, -0.05712890625, 0.0283203125, 0.11376953125, 0.19921875, 0.28466796875, 0.3701171875, 0.45556640625, 0.541015625, 0.62646484375, 0.7119140625, 0.79736328125, 0.8828125, 0.96826171875, 1.0537109375, 1.13916015625, 1.224609375, 1.31005859375, 1.3955078125, 1.48095703125, 1.56640625, 1.65185546875, 1.7373046875, 1.82275390625, 1.908203125, 1.99365234375, 2.0791015625, 2.16455078125, 2.25, 2.33544921875, 2.4208984375, 2.50634765625, 2.591796875, 2.67724609375, 2.7626953125, 2.84814453125, 2.93359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 4.0, 3.0, 14.0, 28.0, 31.0, 34.0, 45.0, 42.0, 65.0, 74.0, 77.0, 83.0, 91.0, 81.0, 53.0, 56.0, 52.0, 38.0, 24.0, 23.0, 17.0, 12.0, 8.0, 11.0, 6.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.544921875, -1.4964447021484375, -1.447967529296875, -1.3994903564453125, -1.35101318359375, -1.3025360107421875, -1.254058837890625, -1.2055816650390625, -1.1571044921875, -1.1086273193359375, -1.060150146484375, -1.0116729736328125, -0.96319580078125, -0.9147186279296875, -0.866241455078125, -0.8177642822265625, -0.769287109375, -0.7208099365234375, -0.672332763671875, -0.6238555908203125, -0.57537841796875, -0.5269012451171875, -0.478424072265625, -0.4299468994140625, -0.3814697265625, -0.3329925537109375, -0.284515380859375, -0.2360382080078125, -0.18756103515625, -0.1390838623046875, -0.090606689453125, -0.0421295166015625, 0.00634765625, 0.0548248291015625, 0.103302001953125, 0.1517791748046875, 0.20025634765625, 0.2487335205078125, 0.297210693359375, 0.3456878662109375, 0.3941650390625, 0.4426422119140625, 0.491119384765625, 0.5395965576171875, 0.58807373046875, 0.6365509033203125, 0.685028076171875, 0.7335052490234375, 0.781982421875, 0.8304595947265625, 0.878936767578125, 0.9274139404296875, 0.97589111328125, 1.0243682861328125, 1.072845458984375, 1.1213226318359375, 1.1697998046875, 1.2182769775390625, 1.266754150390625, 1.3152313232421875, 1.36370849609375, 1.4121856689453125, 1.460662841796875, 1.5091400146484375, 1.5576171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 5.0, 11.0, 21.0, 28.0, 50.0, 87.0, 116.0, 261.0, 803.0, 2847.0, 20281.0, 582553.0, 422048.0, 15753.0, 2347.0, 708.0, 254.0, 144.0, 75.0, 41.0, 31.0, 16.0, 7.0, 12.0, 8.0, 7.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.63433837890625, -5.4327392578125, -5.23114013671875, -5.029541015625, -4.82794189453125, -4.6263427734375, -4.42474365234375, -4.22314453125, -4.02154541015625, -3.8199462890625, -3.61834716796875, -3.416748046875, -3.21514892578125, -3.0135498046875, -2.81195068359375, -2.6103515625, -2.40875244140625, -2.2071533203125, -2.00555419921875, -1.803955078125, -1.60235595703125, -1.4007568359375, -1.19915771484375, -0.99755859375, -0.79595947265625, -0.5943603515625, -0.39276123046875, -0.191162109375, 0.01043701171875, 0.2120361328125, 0.41363525390625, 0.615234375, 0.81683349609375, 1.0184326171875, 1.22003173828125, 1.421630859375, 1.62322998046875, 1.8248291015625, 2.02642822265625, 2.22802734375, 2.42962646484375, 2.6312255859375, 2.83282470703125, 3.034423828125, 3.23602294921875, 3.4376220703125, 3.63922119140625, 3.8408203125, 4.04241943359375, 4.2440185546875, 4.44561767578125, 4.647216796875, 4.84881591796875, 5.0504150390625, 5.25201416015625, 5.45361328125, 5.65521240234375, 5.8568115234375, 6.05841064453125, 6.260009765625, 6.46160888671875, 6.6632080078125, 6.86480712890625, 7.06640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 9.0, 11.0, 12.0, 14.0, 28.0, 28.0, 26.0, 28.0, 37.0, 52.0, 45.0, 64.0, 48.0, 53.0, 58.0, 54.0, 35.0, 48.0, 46.0, 52.0, 34.0, 31.0, 30.0, 26.0, 21.0, 23.0, 15.0, 13.0, 14.0, 3.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.40234375, -6.2005615234375, -5.998779296875, -5.7969970703125, -5.59521484375, -5.3934326171875, -5.191650390625, -4.9898681640625, -4.7880859375, -4.5863037109375, -4.384521484375, -4.1827392578125, -3.98095703125, -3.7791748046875, -3.577392578125, -3.3756103515625, -3.173828125, -2.9720458984375, -2.770263671875, -2.5684814453125, -2.36669921875, -2.1649169921875, -1.963134765625, -1.7613525390625, -1.5595703125, -1.3577880859375, -1.156005859375, -0.9542236328125, -0.75244140625, -0.5506591796875, -0.348876953125, -0.1470947265625, 0.0546875, 0.2564697265625, 0.458251953125, 0.6600341796875, 0.86181640625, 1.0635986328125, 1.265380859375, 1.4671630859375, 1.6689453125, 1.8707275390625, 2.072509765625, 2.2742919921875, 2.47607421875, 2.6778564453125, 2.879638671875, 3.0814208984375, 3.283203125, 3.4849853515625, 3.686767578125, 3.8885498046875, 4.09033203125, 4.2921142578125, 4.493896484375, 4.6956787109375, 4.8974609375, 5.0992431640625, 5.301025390625, 5.5028076171875, 5.70458984375, 5.9063720703125, 6.108154296875, 6.3099365234375, 6.51171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 8.0, 6.0, 12.0, 17.0, 27.0, 46.0, 54.0, 79.0, 138.0, 207.0, 387.0, 1197.0, 6030.0, 317703.0, 710735.0, 9281.0, 1502.0, 468.0, 256.0, 115.0, 74.0, 61.0, 31.0, 20.0, 16.0, 17.0, 13.0, 9.0, 13.0, 8.0, 1.0, 5.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.82421875, -5.66717529296875, -5.5101318359375, -5.35308837890625, -5.196044921875, -5.03900146484375, -4.8819580078125, -4.72491455078125, -4.56787109375, -4.41082763671875, -4.2537841796875, -4.09674072265625, -3.939697265625, -3.78265380859375, -3.6256103515625, -3.46856689453125, -3.3115234375, -3.15447998046875, -2.9974365234375, -2.84039306640625, -2.683349609375, -2.52630615234375, -2.3692626953125, -2.21221923828125, -2.05517578125, -1.89813232421875, -1.7410888671875, -1.58404541015625, -1.427001953125, -1.26995849609375, -1.1129150390625, -0.95587158203125, -0.798828125, -0.64178466796875, -0.4847412109375, -0.32769775390625, -0.170654296875, -0.01361083984375, 0.1434326171875, 0.30047607421875, 0.45751953125, 0.61456298828125, 0.7716064453125, 0.92864990234375, 1.085693359375, 1.24273681640625, 1.3997802734375, 1.55682373046875, 1.7138671875, 1.87091064453125, 2.0279541015625, 2.18499755859375, 2.342041015625, 2.49908447265625, 2.6561279296875, 2.81317138671875, 2.97021484375, 3.12725830078125, 3.2843017578125, 3.44134521484375, 3.598388671875, 3.75543212890625, 3.9124755859375, 4.06951904296875, 4.2265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 2.0, 6.0, 14.0, 17.0, 18.0, 26.0, 49.0, 67.0, 82.0, 108.0, 112.0, 106.0, 108.0, 64.0, 61.0, 45.0, 35.0, 27.0, 15.0, 10.0, 6.0, 3.0, 0.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003006458282470703, -0.00029153376817703247, -0.00028242170810699463, -0.0002733096480369568, -0.00026419758796691895, -0.0002550855278968811, -0.00024597346782684326, -0.00023686140775680542, -0.00022774934768676758, -0.00021863728761672974, -0.0002095252275466919, -0.00020041316747665405, -0.0001913011074066162, -0.00018218904733657837, -0.00017307698726654053, -0.00016396492719650269, -0.00015485286712646484, -0.000145740807056427, -0.00013662874698638916, -0.00012751668691635132, -0.00011840462684631348, -0.00010929256677627563, -0.00010018050670623779, -9.106844663619995e-05, -8.195638656616211e-05, -7.284432649612427e-05, -6.373226642608643e-05, -5.4620206356048584e-05, -4.550814628601074e-05, -3.63960862159729e-05, -2.728402614593506e-05, -1.8171966075897217e-05, -9.059906005859375e-06, 5.21540641784668e-08, 9.164214134216309e-06, 1.827627420425415e-05, 2.7388334274291992e-05, 3.6500394344329834e-05, 4.5612454414367676e-05, 5.472451448440552e-05, 6.383657455444336e-05, 7.29486346244812e-05, 8.206069469451904e-05, 9.117275476455688e-05, 0.00010028481483459473, 0.00010939687490463257, 0.00011850893497467041, 0.00012762099504470825, 0.0001367330551147461, 0.00014584511518478394, 0.00015495717525482178, 0.00016406923532485962, 0.00017318129539489746, 0.0001822933554649353, 0.00019140541553497314, 0.00020051747560501099, 0.00020962953567504883, 0.00021874159574508667, 0.0002278536558151245, 0.00023696571588516235, 0.0002460777759552002, 0.00025518983602523804, 0.0002643018960952759, 0.0002734139561653137, 0.00028252601623535156]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 8.0, 3.0, 14.0, 8.0, 28.0, 57.0, 131.0, 273.0, 789.0, 3578.0, 62596.0, 937760.0, 39270.0, 2901.0, 670.0, 232.0, 118.0, 47.0, 28.0, 14.0, 11.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16796875, -3.04345703125, -2.9189453125, -2.79443359375, -2.669921875, -2.54541015625, -2.4208984375, -2.29638671875, -2.171875, -2.04736328125, -1.9228515625, -1.79833984375, -1.673828125, -1.54931640625, -1.4248046875, -1.30029296875, -1.17578125, -1.05126953125, -0.9267578125, -0.80224609375, -0.677734375, -0.55322265625, -0.4287109375, -0.30419921875, -0.1796875, -0.05517578125, 0.0693359375, 0.19384765625, 0.318359375, 0.44287109375, 0.5673828125, 0.69189453125, 0.81640625, 0.94091796875, 1.0654296875, 1.18994140625, 1.314453125, 1.43896484375, 1.5634765625, 1.68798828125, 1.8125, 1.93701171875, 2.0615234375, 2.18603515625, 2.310546875, 2.43505859375, 2.5595703125, 2.68408203125, 2.80859375, 2.93310546875, 3.0576171875, 3.18212890625, 3.306640625, 3.43115234375, 3.5556640625, 3.68017578125, 3.8046875, 3.92919921875, 4.0537109375, 4.17822265625, 4.302734375, 4.42724609375, 4.5517578125, 4.67626953125, 4.80078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 11.0, 28.0, 61.0, 116.0, 169.0, 205.0, 173.0, 101.0, 52.0, 29.0, 10.0, 6.0, 12.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.94244384765625, -4.7950439453125, -4.64764404296875, -4.500244140625, -4.35284423828125, -4.2054443359375, -4.05804443359375, -3.91064453125, -3.76324462890625, -3.6158447265625, -3.46844482421875, -3.321044921875, -3.17364501953125, -3.0262451171875, -2.87884521484375, -2.7314453125, -2.58404541015625, -2.4366455078125, -2.28924560546875, -2.141845703125, -1.99444580078125, -1.8470458984375, -1.69964599609375, -1.55224609375, -1.40484619140625, -1.2574462890625, -1.11004638671875, -0.962646484375, -0.81524658203125, -0.6678466796875, -0.52044677734375, -0.373046875, -0.22564697265625, -0.0782470703125, 0.06915283203125, 0.216552734375, 0.36395263671875, 0.5113525390625, 0.65875244140625, 0.80615234375, 0.95355224609375, 1.1009521484375, 1.24835205078125, 1.395751953125, 1.54315185546875, 1.6905517578125, 1.83795166015625, 1.9853515625, 2.13275146484375, 2.2801513671875, 2.42755126953125, 2.574951171875, 2.72235107421875, 2.8697509765625, 3.01715087890625, 3.16455078125, 3.31195068359375, 3.4593505859375, 3.60675048828125, 3.754150390625, 3.90155029296875, 4.0489501953125, 4.19635009765625, 4.34375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 20.0, 60.0, 166.0, 293.0, 249.0, 129.0, 51.0, 25.0, 1.0, 3.0, 2.0, 4.0], "bins": [-126.08174896240234, -123.81938171386719, -121.55702209472656, -119.29466247558594, -117.03229522705078, -114.76992797851562, -112.507568359375, -110.24520874023438, -107.98284149169922, -105.72047424316406, -103.45811462402344, -101.19575500488281, -98.93338775634766, -96.6710205078125, -94.40866088867188, -92.14630126953125, -89.8839340209961, -87.62156677246094, -85.35920715332031, -83.09684753417969, -80.83448028564453, -78.57211303710938, -76.30975341796875, -74.04739379882812, -71.78502655029297, -69.52265930175781, -67.26029968261719, -64.99794006347656, -62.735572814941406, -60.473209381103516, -58.210845947265625, -55.948482513427734, -53.68611145019531, -51.42374801635742, -49.16138458251953, -46.89902114868164, -44.63665771484375, -42.37429428100586, -40.11193084716797, -37.84956741333008, -35.58720397949219, -33.3248405456543, -31.062477111816406, -28.800113677978516, -26.537750244140625, -24.275386810302734, -22.013023376464844, -19.750659942626953, -17.488298416137695, -15.225934982299805, -12.963571548461914, -10.701208114624023, -8.438844680786133, -6.176481246948242, -3.9141178131103516, -1.651754379272461, 0.6106090545654297, 2.8729724884033203, 5.135335922241211, 7.397699356079102, 9.660062789916992, 11.922426223754883, 14.184789657592773, 16.447153091430664, 18.709516525268555]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 5.0, 1.0, 11.0, 16.0, 13.0, 15.0, 24.0, 25.0, 30.0, 37.0, 31.0, 55.0, 54.0, 54.0, 56.0, 47.0, 60.0, 56.0, 48.0, 54.0, 45.0, 43.0, 35.0, 35.0, 30.0, 22.0, 16.0, 12.0, 11.0, 10.0, 11.0, 6.0, 9.0, 6.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.198808670043945, -24.28268814086914, -23.36656951904297, -22.450448989868164, -21.53432846069336, -20.618207931518555, -19.70208740234375, -18.785968780517578, -17.869848251342773, -16.95372772216797, -16.037609100341797, -15.121488571166992, -14.205368041992188, -13.289247512817383, -12.373127937316895, -11.457008361816406, -10.540887832641602, -9.624767303466797, -8.708647727966309, -7.792527675628662, -6.876407623291016, -5.960287570953369, -5.044167518615723, -4.128047466278076, -3.2119274139404297, -2.295807361602783, -1.3796873092651367, -0.46356725692749023, 0.45255279541015625, 1.3686728477478027, 2.284792900085449, 3.2009129524230957, 4.117034912109375, 5.0331549644470215, 5.949275016784668, 6.8653950691223145, 7.781515121459961, 8.697635650634766, 9.613755226135254, 10.529874801635742, 11.445995330810547, 12.362115859985352, 13.27823543548584, 14.194355010986328, 15.110475540161133, 16.026596069335938, 16.94271469116211, 17.858835220336914, 18.77495574951172, 19.691076278686523, 20.607196807861328, 21.5233154296875, 22.439435958862305, 23.35555648803711, 24.27167510986328, 25.187795639038086, 26.10391616821289, 27.020036697387695, 27.9361572265625, 28.852275848388672, 29.768396377563477, 30.68451690673828, 31.600635528564453, 32.51675796508789, 33.43287658691406]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 15.0, 15.0, 23.0, 39.0, 59.0, 86.0, 151.0, 271.0, 577.0, 1318.0, 4090.0, 21119.0, 3938729.0, 209603.0, 12824.0, 3038.0, 1114.0, 523.0, 262.0, 123.0, 91.0, 63.0, 31.0, 24.0, 22.0, 18.0, 6.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.047119140625, -4.85205078125, -4.656982421875, -4.4619140625, -4.266845703125, -4.07177734375, -3.876708984375, -3.681640625, -3.486572265625, -3.29150390625, -3.096435546875, -2.9013671875, -2.706298828125, -2.51123046875, -2.316162109375, -2.12109375, -1.926025390625, -1.73095703125, -1.535888671875, -1.3408203125, -1.145751953125, -0.95068359375, -0.755615234375, -0.560546875, -0.365478515625, -0.17041015625, 0.024658203125, 0.2197265625, 0.414794921875, 0.60986328125, 0.804931640625, 1.0, 1.195068359375, 1.39013671875, 1.585205078125, 1.7802734375, 1.975341796875, 2.17041015625, 2.365478515625, 2.560546875, 2.755615234375, 2.95068359375, 3.145751953125, 3.3408203125, 3.535888671875, 3.73095703125, 3.926025390625, 4.12109375, 4.316162109375, 4.51123046875, 4.706298828125, 4.9013671875, 5.096435546875, 5.29150390625, 5.486572265625, 5.681640625, 5.876708984375, 6.07177734375, 6.266845703125, 6.4619140625, 6.656982421875, 6.85205078125, 7.047119140625, 7.2421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 14.0, 19.0, 31.0, 37.0, 42.0, 82.0, 101.0, 119.0, 129.0, 100.0, 98.0, 67.0, 39.0, 30.0, 29.0, 19.0, 9.0, 6.0, 6.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.04522705078125, -1.9732666015625, -1.90130615234375, -1.829345703125, -1.75738525390625, -1.6854248046875, -1.61346435546875, -1.54150390625, -1.46954345703125, -1.3975830078125, -1.32562255859375, -1.253662109375, -1.18170166015625, -1.1097412109375, -1.03778076171875, -0.9658203125, -0.89385986328125, -0.8218994140625, -0.74993896484375, -0.677978515625, -0.60601806640625, -0.5340576171875, -0.46209716796875, -0.39013671875, -0.31817626953125, -0.2462158203125, -0.17425537109375, -0.102294921875, -0.03033447265625, 0.0416259765625, 0.11358642578125, 0.185546875, 0.25750732421875, 0.3294677734375, 0.40142822265625, 0.473388671875, 0.54534912109375, 0.6173095703125, 0.68927001953125, 0.76123046875, 0.83319091796875, 0.9051513671875, 0.97711181640625, 1.049072265625, 1.12103271484375, 1.1929931640625, 1.26495361328125, 1.3369140625, 1.40887451171875, 1.4808349609375, 1.55279541015625, 1.624755859375, 1.69671630859375, 1.7686767578125, 1.84063720703125, 1.91259765625, 1.98455810546875, 2.0565185546875, 2.12847900390625, 2.200439453125, 2.27239990234375, 2.3443603515625, 2.41632080078125, 2.48828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 12.0, 13.0, 25.0, 38.0, 47.0, 63.0, 98.0, 160.0, 276.0, 439.0, 875.0, 2077.0, 6404.0, 27909.0, 427098.0, 3674546.0, 41059.0, 8282.0, 2512.0, 1014.0, 507.0, 269.0, 204.0, 113.0, 87.0, 54.0, 29.0, 27.0, 11.0, 8.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.1728515625, -3.029296875, -2.8857421875, -2.7421875, -2.5986328125, -2.455078125, -2.3115234375, -2.16796875, -2.0244140625, -1.880859375, -1.7373046875, -1.59375, -1.4501953125, -1.306640625, -1.1630859375, -1.01953125, -0.8759765625, -0.732421875, -0.5888671875, -0.4453125, -0.3017578125, -0.158203125, -0.0146484375, 0.12890625, 0.2724609375, 0.416015625, 0.5595703125, 0.703125, 0.8466796875, 0.990234375, 1.1337890625, 1.27734375, 1.4208984375, 1.564453125, 1.7080078125, 1.8515625, 1.9951171875, 2.138671875, 2.2822265625, 2.42578125, 2.5693359375, 2.712890625, 2.8564453125, 3.0, 3.1435546875, 3.287109375, 3.4306640625, 3.57421875, 3.7177734375, 3.861328125, 4.0048828125, 4.1484375, 4.2919921875, 4.435546875, 4.5791015625, 4.72265625, 4.8662109375, 5.009765625, 5.1533203125, 5.296875, 5.4404296875, 5.583984375, 5.7275390625, 5.87109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 15.0, 13.0, 40.0, 90.0, 354.0, 3239.0, 194.0, 72.0, 26.0, 12.0, 8.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33203125, -1.277130126953125, -1.22222900390625, -1.167327880859375, -1.1124267578125, -1.057525634765625, -1.00262451171875, -0.947723388671875, -0.892822265625, -0.837921142578125, -0.78302001953125, -0.728118896484375, -0.6732177734375, -0.618316650390625, -0.56341552734375, -0.508514404296875, -0.45361328125, -0.398712158203125, -0.34381103515625, -0.288909912109375, -0.2340087890625, -0.179107666015625, -0.12420654296875, -0.069305419921875, -0.014404296875, 0.040496826171875, 0.09539794921875, 0.150299072265625, 0.2052001953125, 0.260101318359375, 0.31500244140625, 0.369903564453125, 0.4248046875, 0.479705810546875, 0.53460693359375, 0.589508056640625, 0.6444091796875, 0.699310302734375, 0.75421142578125, 0.809112548828125, 0.864013671875, 0.918914794921875, 0.97381591796875, 1.028717041015625, 1.0836181640625, 1.138519287109375, 1.19342041015625, 1.248321533203125, 1.30322265625, 1.358123779296875, 1.41302490234375, 1.467926025390625, 1.5228271484375, 1.577728271484375, 1.63262939453125, 1.687530517578125, 1.742431640625, 1.797332763671875, 1.85223388671875, 1.907135009765625, 1.9620361328125, 2.016937255859375, 2.07183837890625, 2.126739501953125, 2.181640625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 16.0, 12.0, 23.0, 52.0, 71.0, 97.0, 102.0, 137.0, 131.0, 108.0, 83.0, 59.0, 36.0, 35.0, 12.0, 10.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6954848766326904, -3.576456308364868, -3.457427501678467, -3.3383989334106445, -3.2193703651428223, -3.100341558456421, -2.9813129901885986, -2.8622841835021973, -2.743255615234375, -2.6242270469665527, -2.5051982402801514, -2.386169672012329, -2.2671408653259277, -2.1481122970581055, -2.029083728790283, -1.9100550413131714, -1.7910263538360596, -1.6719976663589478, -1.552968978881836, -1.4339404106140137, -1.3149117231369019, -1.19588303565979, -1.0768544673919678, -0.957825779914856, -0.8387970924377441, -0.7197684049606323, -0.6007397770881653, -0.48171111941337585, -0.3626824617385864, -0.2436537742614746, -0.12462514638900757, -0.005596518516540527, 0.11343240737915039, 0.23246106505393982, 0.35148972272872925, 0.4705183804035187, 0.5895470380783081, 0.7085757255554199, 0.827604353427887, 0.946632981300354, 1.0656616687774658, 1.1846903562545776, 1.3037190437316895, 1.4227476119995117, 1.5417762994766235, 1.6608049869537354, 1.7798335552215576, 1.8988622426986694, 2.0178909301757812, 2.1369194984436035, 2.255948305130005, 2.374976873397827, 2.4940056800842285, 2.613034248352051, 2.732062816619873, 2.8510913848876953, 2.9701201915740967, 3.089148759841919, 3.2081775665283203, 3.3272061347961426, 3.446234703063965, 3.565263509750366, 3.6842920780181885, 3.80332088470459, 3.922349452972412]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 6.0, 3.0, 7.0, 16.0, 9.0, 6.0, 13.0, 22.0, 21.0, 23.0, 29.0, 23.0, 27.0, 47.0, 29.0, 18.0, 29.0, 41.0, 40.0, 33.0, 45.0, 26.0, 29.0, 35.0, 28.0, 34.0, 28.0, 29.0, 37.0, 39.0, 29.0, 25.0, 24.0, 21.0, 23.0, 10.0, 16.0, 8.0, 15.0, 11.0, 8.0, 10.0, 6.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.894153118133545, -1.8360918760299683, -1.778030514717102, -1.7199692726135254, -1.6619079113006592, -1.6038466691970825, -1.5457854270935059, -1.4877240657806396, -1.429662823677063, -1.3716015815734863, -1.3135402202606201, -1.2554789781570435, -1.1974176168441772, -1.1393563747406006, -1.0812950134277344, -1.0232337713241577, -0.9651724696159363, -0.9071111679077148, -0.8490498661994934, -0.790988564491272, -0.7329273223876953, -0.6748660206794739, -0.6168047189712524, -0.5587434768676758, -0.5006821155548096, -0.44262081384658813, -0.3845595419406891, -0.32649824023246765, -0.2684369683265686, -0.21037566661834717, -0.15231436491012573, -0.09425309300422668, -0.03619182109832764, 0.021869469434022903, 0.07993075996637344, 0.13799205422401428, 0.19605334103107452, 0.25411462783813477, 0.3121759295463562, 0.37023720145225525, 0.4282985031604767, 0.4863598048686981, 0.5444210767745972, 0.6024823784828186, 0.66054368019104, 0.7186049222946167, 0.7766662836074829, 0.8347275257110596, 0.892788827419281, 0.9508501291275024, 1.008911371231079, 1.0669727325439453, 1.125033974647522, 1.1830952167510986, 1.2411565780639648, 1.2992178201675415, 1.3572791814804077, 1.4153404235839844, 1.4734017848968506, 1.5314630270004272, 1.5895243883132935, 1.6475856304168701, 1.7056469917297363, 1.763708233833313, 1.8217694759368896]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 12.0, 17.0, 19.0, 29.0, 45.0, 89.0, 147.0, 230.0, 355.0, 737.0, 1409.0, 3249.0, 9299.0, 39376.0, 271359.0, 576519.0, 115610.0, 19817.0, 5582.0, 2227.0, 1061.0, 560.0, 300.0, 203.0, 105.0, 57.0, 39.0, 25.0, 22.0, 12.0, 10.0, 10.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.63958740234375, -2.5428466796875, -2.44610595703125, -2.349365234375, -2.25262451171875, -2.1558837890625, -2.05914306640625, -1.96240234375, -1.86566162109375, -1.7689208984375, -1.67218017578125, -1.575439453125, -1.47869873046875, -1.3819580078125, -1.28521728515625, -1.1884765625, -1.09173583984375, -0.9949951171875, -0.89825439453125, -0.801513671875, -0.70477294921875, -0.6080322265625, -0.51129150390625, -0.41455078125, -0.31781005859375, -0.2210693359375, -0.12432861328125, -0.027587890625, 0.06915283203125, 0.1658935546875, 0.26263427734375, 0.359375, 0.45611572265625, 0.5528564453125, 0.64959716796875, 0.746337890625, 0.84307861328125, 0.9398193359375, 1.03656005859375, 1.13330078125, 1.23004150390625, 1.3267822265625, 1.42352294921875, 1.520263671875, 1.61700439453125, 1.7137451171875, 1.81048583984375, 1.9072265625, 2.00396728515625, 2.1007080078125, 2.19744873046875, 2.294189453125, 2.39093017578125, 2.4876708984375, 2.58441162109375, 2.68115234375, 2.77789306640625, 2.8746337890625, 2.97137451171875, 3.068115234375, 3.16485595703125, 3.2615966796875, 3.35833740234375, 3.455078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 10.0, 23.0, 23.0, 35.0, 56.0, 74.0, 81.0, 93.0, 114.0, 105.0, 91.0, 67.0, 62.0, 42.0, 36.0, 26.0, 17.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.961212158203125, -1.89312744140625, -1.825042724609375, -1.7569580078125, -1.688873291015625, -1.62078857421875, -1.552703857421875, -1.484619140625, -1.416534423828125, -1.34844970703125, -1.280364990234375, -1.2122802734375, -1.144195556640625, -1.07611083984375, -1.008026123046875, -0.93994140625, -0.871856689453125, -0.80377197265625, -0.735687255859375, -0.6676025390625, -0.599517822265625, -0.53143310546875, -0.463348388671875, -0.395263671875, -0.327178955078125, -0.25909423828125, -0.191009521484375, -0.1229248046875, -0.054840087890625, 0.01324462890625, 0.081329345703125, 0.1494140625, 0.217498779296875, 0.28558349609375, 0.353668212890625, 0.4217529296875, 0.489837646484375, 0.55792236328125, 0.626007080078125, 0.694091796875, 0.762176513671875, 0.83026123046875, 0.898345947265625, 0.9664306640625, 1.034515380859375, 1.10260009765625, 1.170684814453125, 1.23876953125, 1.306854248046875, 1.37493896484375, 1.443023681640625, 1.5111083984375, 1.579193115234375, 1.64727783203125, 1.715362548828125, 1.783447265625, 1.851531982421875, 1.91961669921875, 1.987701416015625, 2.0557861328125, 2.123870849609375, 2.19195556640625, 2.260040283203125, 2.328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 12.0, 11.0, 15.0, 22.0, 27.0, 28.0, 36.0, 44.0, 77.0, 100.0, 132.0, 211.0, 383.0, 629.0, 1194.0, 3179.0, 13048.0, 108982.0, 693000.0, 198979.0, 20651.0, 4302.0, 1522.0, 681.0, 406.0, 271.0, 155.0, 116.0, 80.0, 59.0, 41.0, 36.0, 26.0, 17.0, 18.0, 17.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.434356689453125, -3.32574462890625, -3.217132568359375, -3.1085205078125, -2.999908447265625, -2.89129638671875, -2.782684326171875, -2.674072265625, -2.565460205078125, -2.45684814453125, -2.348236083984375, -2.2396240234375, -2.131011962890625, -2.02239990234375, -1.913787841796875, -1.80517578125, -1.696563720703125, -1.58795166015625, -1.479339599609375, -1.3707275390625, -1.262115478515625, -1.15350341796875, -1.044891357421875, -0.936279296875, -0.827667236328125, -0.71905517578125, -0.610443115234375, -0.5018310546875, -0.393218994140625, -0.28460693359375, -0.175994873046875, -0.0673828125, 0.041229248046875, 0.14984130859375, 0.258453369140625, 0.3670654296875, 0.475677490234375, 0.58428955078125, 0.692901611328125, 0.801513671875, 0.910125732421875, 1.01873779296875, 1.127349853515625, 1.2359619140625, 1.344573974609375, 1.45318603515625, 1.561798095703125, 1.67041015625, 1.779022216796875, 1.88763427734375, 1.996246337890625, 2.1048583984375, 2.213470458984375, 2.32208251953125, 2.430694580078125, 2.539306640625, 2.647918701171875, 2.75653076171875, 2.865142822265625, 2.9737548828125, 3.082366943359375, 3.19097900390625, 3.299591064453125, 3.408203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 5.0, 8.0, 5.0, 7.0, 11.0, 11.0, 6.0, 13.0, 14.0, 28.0, 20.0, 29.0, 32.0, 40.0, 41.0, 38.0, 43.0, 53.0, 45.0, 49.0, 37.0, 49.0, 29.0, 48.0, 37.0, 39.0, 47.0, 35.0, 40.0, 20.0, 25.0, 27.0, 14.0, 6.0, 8.0, 7.0, 10.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.709716796875, -4.54833984375, -4.386962890625, -4.2255859375, -4.064208984375, -3.90283203125, -3.741455078125, -3.580078125, -3.418701171875, -3.25732421875, -3.095947265625, -2.9345703125, -2.773193359375, -2.61181640625, -2.450439453125, -2.2890625, -2.127685546875, -1.96630859375, -1.804931640625, -1.6435546875, -1.482177734375, -1.32080078125, -1.159423828125, -0.998046875, -0.836669921875, -0.67529296875, -0.513916015625, -0.3525390625, -0.191162109375, -0.02978515625, 0.131591796875, 0.29296875, 0.454345703125, 0.61572265625, 0.777099609375, 0.9384765625, 1.099853515625, 1.26123046875, 1.422607421875, 1.583984375, 1.745361328125, 1.90673828125, 2.068115234375, 2.2294921875, 2.390869140625, 2.55224609375, 2.713623046875, 2.875, 3.036376953125, 3.19775390625, 3.359130859375, 3.5205078125, 3.681884765625, 3.84326171875, 4.004638671875, 4.166015625, 4.327392578125, 4.48876953125, 4.650146484375, 4.8115234375, 4.972900390625, 5.13427734375, 5.295654296875, 5.45703125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 9.0, 12.0, 20.0, 55.0, 82.0, 217.0, 1025.0, 17369.0, 1015857.0, 12636.0, 879.0, 234.0, 70.0, 45.0, 17.0, 6.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.74609375, -4.53485107421875, -4.3236083984375, -4.11236572265625, -3.901123046875, -3.68988037109375, -3.4786376953125, -3.26739501953125, -3.05615234375, -2.84490966796875, -2.6336669921875, -2.42242431640625, -2.211181640625, -1.99993896484375, -1.7886962890625, -1.57745361328125, -1.3662109375, -1.15496826171875, -0.9437255859375, -0.73248291015625, -0.521240234375, -0.30999755859375, -0.0987548828125, 0.11248779296875, 0.32373046875, 0.53497314453125, 0.7462158203125, 0.95745849609375, 1.168701171875, 1.37994384765625, 1.5911865234375, 1.80242919921875, 2.013671875, 2.22491455078125, 2.4361572265625, 2.64739990234375, 2.858642578125, 3.06988525390625, 3.2811279296875, 3.49237060546875, 3.70361328125, 3.91485595703125, 4.1260986328125, 4.33734130859375, 4.548583984375, 4.75982666015625, 4.9710693359375, 5.18231201171875, 5.3935546875, 5.60479736328125, 5.8160400390625, 6.02728271484375, 6.238525390625, 6.44976806640625, 6.6610107421875, 6.87225341796875, 7.08349609375, 7.29473876953125, 7.5059814453125, 7.71722412109375, 7.928466796875, 8.13970947265625, 8.3509521484375, 8.56219482421875, 8.7734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 10.0, 17.0, 29.0, 35.0, 84.0, 109.0, 159.0, 208.0, 150.0, 89.0, 60.0, 36.0, 14.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031757354736328125, -0.00030259788036346436, -0.00028762221336364746, -0.00027264654636383057, -0.00025767087936401367, -0.00024269521236419678, -0.00022771954536437988, -0.000212743878364563, -0.0001977682113647461, -0.0001827925443649292, -0.0001678168773651123, -0.0001528412103652954, -0.00013786554336547852, -0.00012288987636566162, -0.00010791420936584473, -9.293854236602783e-05, -7.796287536621094e-05, -6.298720836639404e-05, -4.801154136657715e-05, -3.3035874366760254e-05, -1.806020736694336e-05, -3.084540367126465e-06, 1.189112663269043e-05, 2.6866793632507324e-05, 4.184246063232422e-05, 5.681812763214111e-05, 7.179379463195801e-05, 8.67694616317749e-05, 0.0001017451286315918, 0.00011672079563140869, 0.00013169646263122559, 0.00014667212963104248, 0.00016164779663085938, 0.00017662346363067627, 0.00019159913063049316, 0.00020657479763031006, 0.00022155046463012695, 0.00023652613162994385, 0.00025150179862976074, 0.00026647746562957764, 0.00028145313262939453, 0.0002964287996292114, 0.0003114044666290283, 0.0003263801336288452, 0.0003413558006286621, 0.000356331467628479, 0.0003713071346282959, 0.0003862828016281128, 0.0004012584686279297, 0.0004162341356277466, 0.0004312098026275635, 0.00044618546962738037, 0.00046116113662719727, 0.00047613680362701416, 0.0004911124706268311, 0.000506088137626648, 0.0005210638046264648, 0.0005360394716262817, 0.0005510151386260986, 0.0005659908056259155, 0.0005809664726257324, 0.0005959421396255493, 0.0006109178066253662, 0.0006258934736251831, 0.000640869140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 4.0, 14.0, 16.0, 31.0, 45.0, 94.0, 185.0, 461.0, 1202.0, 5191.0, 72657.0, 898844.0, 63056.0, 4747.0, 1137.0, 419.0, 192.0, 100.0, 60.0, 27.0, 16.0, 16.0, 6.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.420318603515625, -2.32891845703125, -2.237518310546875, -2.1461181640625, -2.054718017578125, -1.96331787109375, -1.871917724609375, -1.780517578125, -1.689117431640625, -1.59771728515625, -1.506317138671875, -1.4149169921875, -1.323516845703125, -1.23211669921875, -1.140716552734375, -1.04931640625, -0.957916259765625, -0.86651611328125, -0.775115966796875, -0.6837158203125, -0.592315673828125, -0.50091552734375, -0.409515380859375, -0.318115234375, -0.226715087890625, -0.13531494140625, -0.043914794921875, 0.0474853515625, 0.138885498046875, 0.23028564453125, 0.321685791015625, 0.4130859375, 0.504486083984375, 0.59588623046875, 0.687286376953125, 0.7786865234375, 0.870086669921875, 0.96148681640625, 1.052886962890625, 1.144287109375, 1.235687255859375, 1.32708740234375, 1.418487548828125, 1.5098876953125, 1.601287841796875, 1.69268798828125, 1.784088134765625, 1.87548828125, 1.966888427734375, 2.05828857421875, 2.149688720703125, 2.2410888671875, 2.332489013671875, 2.42388916015625, 2.515289306640625, 2.606689453125, 2.698089599609375, 2.78948974609375, 2.880889892578125, 2.9722900390625, 3.063690185546875, 3.15509033203125, 3.246490478515625, 3.337890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 7.0, 14.0, 15.0, 29.0, 33.0, 43.0, 55.0, 89.0, 85.0, 102.0, 83.0, 102.0, 78.0, 68.0, 55.0, 34.0, 26.0, 19.0, 13.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.61328125, -1.551239013671875, -1.48919677734375, -1.427154541015625, -1.3651123046875, -1.303070068359375, -1.24102783203125, -1.178985595703125, -1.116943359375, -1.054901123046875, -0.99285888671875, -0.930816650390625, -0.8687744140625, -0.806732177734375, -0.74468994140625, -0.682647705078125, -0.62060546875, -0.558563232421875, -0.49652099609375, -0.434478759765625, -0.3724365234375, -0.310394287109375, -0.24835205078125, -0.186309814453125, -0.124267578125, -0.062225341796875, -0.00018310546875, 0.061859130859375, 0.1239013671875, 0.185943603515625, 0.24798583984375, 0.310028076171875, 0.3720703125, 0.434112548828125, 0.49615478515625, 0.558197021484375, 0.6202392578125, 0.682281494140625, 0.74432373046875, 0.806365966796875, 0.868408203125, 0.930450439453125, 0.99249267578125, 1.054534912109375, 1.1165771484375, 1.178619384765625, 1.24066162109375, 1.302703857421875, 1.36474609375, 1.426788330078125, 1.48883056640625, 1.550872802734375, 1.6129150390625, 1.674957275390625, 1.73699951171875, 1.799041748046875, 1.861083984375, 1.923126220703125, 1.98516845703125, 2.047210693359375, 2.1092529296875, 2.171295166015625, 2.23333740234375, 2.295379638671875, 2.357421875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 8.0, 24.0, 97.0, 224.0, 355.0, 205.0, 69.0, 17.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.28843688964844, -53.35307312011719, -51.41770935058594, -49.48234558105469, -47.54698181152344, -45.61161804199219, -43.67625427246094, -41.74089050292969, -39.80552673339844, -37.87016296386719, -35.93479919433594, -33.99943542480469, -32.06407165527344, -30.128707885742188, -28.19334602355957, -26.25798225402832, -24.322620391845703, -22.387256622314453, -20.451892852783203, -18.516529083251953, -16.581165313720703, -14.64580249786377, -12.710439682006836, -10.775075912475586, -8.839712142944336, -6.904348373413086, -4.968985080718994, -3.0336217880249023, -1.0982580184936523, 0.8371057510375977, 2.7724685668945312, 4.707832336425781, 6.643196105957031, 8.578559875488281, 10.513923645019531, 12.449286460876465, 14.384650230407715, 16.32001495361328, 18.2553768157959, 20.19074058532715, 22.1261043548584, 24.06146812438965, 25.9968318939209, 27.932193756103516, 29.867557525634766, 31.802921295166016, 33.738285064697266, 35.673648834228516, 37.609012603759766, 39.544376373291016, 41.479740142822266, 43.415103912353516, 45.350467681884766, 47.285831451416016, 49.22119140625, 51.15655517578125, 53.0919189453125, 55.02728271484375, 56.962646484375, 58.89801025390625, 60.8333740234375, 62.76873779296875, 64.7041015625, 66.63946533203125, 68.5748291015625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 6.0, 10.0, 10.0, 17.0, 17.0, 20.0, 31.0, 18.0, 22.0, 31.0, 42.0, 44.0, 48.0, 47.0, 58.0, 65.0, 53.0, 55.0, 60.0, 44.0, 41.0, 42.0, 32.0, 36.0, 32.0, 19.0, 17.0, 15.0, 12.0, 14.0, 7.0, 7.0, 4.0, 4.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.206832885742188, -26.4228515625, -25.638870239257812, -24.854888916015625, -24.070907592773438, -23.286928176879883, -22.502946853637695, -21.718965530395508, -20.93498420715332, -20.151002883911133, -19.367021560668945, -18.583040237426758, -17.799060821533203, -17.015079498291016, -16.231098175048828, -15.44711685180664, -14.663135528564453, -13.879154205322266, -13.095172882080078, -12.311192512512207, -11.52721118927002, -10.743229866027832, -9.959249496459961, -9.175268173217773, -8.391286849975586, -7.607305526733398, -6.823324680328369, -6.03934383392334, -5.255362510681152, -4.471381187438965, -3.6874003410339355, -2.9034194946289062, -2.1194400787353516, -1.3354589939117432, -0.5514779090881348, 0.23250317573547363, 1.016484260559082, 1.8004653453826904, 2.584446430206299, 3.368427276611328, 4.152408599853516, 4.936389923095703, 5.720370769500732, 6.504351615905762, 7.288332939147949, 8.072314262390137, 8.856294631958008, 9.640275955200195, 10.424257278442383, 11.20823860168457, 11.992219924926758, 12.776200294494629, 13.560181617736816, 14.344162940979004, 15.128143310546875, 15.912124633789062, 16.69610595703125, 17.480087280273438, 18.264068603515625, 19.048049926757812, 19.83203125, 20.616010665893555, 21.399991989135742, 22.18397331237793, 22.967954635620117]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 1.0, 5.0, 5.0, 11.0, 11.0, 21.0, 29.0, 30.0, 57.0, 96.0, 164.0, 243.0, 482.0, 962.0, 2120.0, 5865.0, 22339.0, 167520.0, 3856749.0, 110793.0, 17652.0, 5110.0, 1933.0, 904.0, 442.0, 227.0, 160.0, 101.0, 60.0, 54.0, 34.0, 25.0, 21.0, 14.0, 5.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.790802001953125, -2.68902587890625, -2.587249755859375, -2.4854736328125, -2.383697509765625, -2.28192138671875, -2.180145263671875, -2.078369140625, -1.976593017578125, -1.87481689453125, -1.773040771484375, -1.6712646484375, -1.569488525390625, -1.46771240234375, -1.365936279296875, -1.26416015625, -1.162384033203125, -1.06060791015625, -0.958831787109375, -0.8570556640625, -0.755279541015625, -0.65350341796875, -0.551727294921875, -0.449951171875, -0.348175048828125, -0.24639892578125, -0.144622802734375, -0.0428466796875, 0.058929443359375, 0.16070556640625, 0.262481689453125, 0.3642578125, 0.466033935546875, 0.56781005859375, 0.669586181640625, 0.7713623046875, 0.873138427734375, 0.97491455078125, 1.076690673828125, 1.178466796875, 1.280242919921875, 1.38201904296875, 1.483795166015625, 1.5855712890625, 1.687347412109375, 1.78912353515625, 1.890899658203125, 1.99267578125, 2.094451904296875, 2.19622802734375, 2.298004150390625, 2.3997802734375, 2.501556396484375, 2.60333251953125, 2.705108642578125, 2.806884765625, 2.908660888671875, 3.01043701171875, 3.112213134765625, 3.2139892578125, 3.315765380859375, 3.41754150390625, 3.519317626953125, 3.62109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 5.0, 4.0, 7.0, 9.0, 15.0, 21.0, 18.0, 30.0, 50.0, 67.0, 85.0, 108.0, 97.0, 112.0, 87.0, 86.0, 57.0, 50.0, 23.0, 26.0, 13.0, 11.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7900390625, -1.7256622314453125, -1.661285400390625, -1.5969085693359375, -1.53253173828125, -1.4681549072265625, -1.403778076171875, -1.3394012451171875, -1.2750244140625, -1.2106475830078125, -1.146270751953125, -1.0818939208984375, -1.01751708984375, -0.9531402587890625, -0.888763427734375, -0.8243865966796875, -0.760009765625, -0.6956329345703125, -0.631256103515625, -0.5668792724609375, -0.50250244140625, -0.4381256103515625, -0.373748779296875, -0.3093719482421875, -0.2449951171875, -0.1806182861328125, -0.116241455078125, -0.0518646240234375, 0.01251220703125, 0.0768890380859375, 0.141265869140625, 0.2056427001953125, 0.27001953125, 0.3343963623046875, 0.398773193359375, 0.4631500244140625, 0.52752685546875, 0.5919036865234375, 0.656280517578125, 0.7206573486328125, 0.7850341796875, 0.8494110107421875, 0.913787841796875, 0.9781646728515625, 1.04254150390625, 1.1069183349609375, 1.171295166015625, 1.2356719970703125, 1.300048828125, 1.3644256591796875, 1.428802490234375, 1.4931793212890625, 1.55755615234375, 1.6219329833984375, 1.686309814453125, 1.7506866455078125, 1.8150634765625, 1.8794403076171875, 1.943817138671875, 2.0081939697265625, 2.07257080078125, 2.1369476318359375, 2.201324462890625, 2.2657012939453125, 2.330078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 12.0, 12.0, 29.0, 33.0, 65.0, 96.0, 136.0, 226.0, 424.0, 726.0, 1375.0, 2703.0, 5972.0, 15727.0, 56238.0, 386401.0, 3495107.0, 174367.0, 34422.0, 10901.0, 4557.0, 2182.0, 1010.0, 575.0, 327.0, 219.0, 153.0, 98.0, 56.0, 43.0, 27.0, 16.0, 12.0, 6.0, 7.0, 10.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3046875, -2.237548828125, -2.17041015625, -2.103271484375, -2.0361328125, -1.968994140625, -1.90185546875, -1.834716796875, -1.767578125, -1.700439453125, -1.63330078125, -1.566162109375, -1.4990234375, -1.431884765625, -1.36474609375, -1.297607421875, -1.23046875, -1.163330078125, -1.09619140625, -1.029052734375, -0.9619140625, -0.894775390625, -0.82763671875, -0.760498046875, -0.693359375, -0.626220703125, -0.55908203125, -0.491943359375, -0.4248046875, -0.357666015625, -0.29052734375, -0.223388671875, -0.15625, -0.089111328125, -0.02197265625, 0.045166015625, 0.1123046875, 0.179443359375, 0.24658203125, 0.313720703125, 0.380859375, 0.447998046875, 0.51513671875, 0.582275390625, 0.6494140625, 0.716552734375, 0.78369140625, 0.850830078125, 0.91796875, 0.985107421875, 1.05224609375, 1.119384765625, 1.1865234375, 1.253662109375, 1.32080078125, 1.387939453125, 1.455078125, 1.522216796875, 1.58935546875, 1.656494140625, 1.7236328125, 1.790771484375, 1.85791015625, 1.925048828125, 1.9921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 17.0, 21.0, 31.0, 46.0, 105.0, 190.0, 375.0, 2305.0, 531.0, 196.0, 95.0, 48.0, 36.0, 24.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8750686645507812, -0.8326568603515625, -0.7902450561523438, -0.747833251953125, -0.7054214477539062, -0.6630096435546875, -0.6205978393554688, -0.57818603515625, -0.5357742309570312, -0.4933624267578125, -0.45095062255859375, -0.408538818359375, -0.36612701416015625, -0.3237152099609375, -0.28130340576171875, -0.2388916015625, -0.19647979736328125, -0.1540679931640625, -0.11165618896484375, -0.069244384765625, -0.02683258056640625, 0.0155792236328125, 0.05799102783203125, 0.10040283203125, 0.14281463623046875, 0.1852264404296875, 0.22763824462890625, 0.270050048828125, 0.31246185302734375, 0.3548736572265625, 0.39728546142578125, 0.439697265625, 0.48210906982421875, 0.5245208740234375, 0.5669326782226562, 0.609344482421875, 0.6517562866210938, 0.6941680908203125, 0.7365798950195312, 0.77899169921875, 0.8214035034179688, 0.8638153076171875, 0.9062271118164062, 0.948638916015625, 0.9910507202148438, 1.0334625244140625, 1.0758743286132812, 1.1182861328125, 1.1606979370117188, 1.2031097412109375, 1.2455215454101562, 1.287933349609375, 1.3303451538085938, 1.3727569580078125, 1.4151687622070312, 1.45758056640625, 1.4999923706054688, 1.5424041748046875, 1.5848159790039062, 1.627227783203125, 1.6696395874023438, 1.7120513916015625, 1.7544631958007812, 1.796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 12.0, 15.0, 22.0, 34.0, 50.0, 74.0, 84.0, 101.0, 102.0, 103.0, 102.0, 77.0, 64.0, 35.0, 26.0, 20.0, 19.0, 18.0, 7.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.754072666168213, -5.609649658203125, -5.465226650238037, -5.320803642272949, -5.176380634307861, -5.031957626342773, -4.8875346183776855, -4.743111610412598, -4.598688125610352, -4.454265117645264, -4.309842109680176, -4.165419101715088, -4.02099609375, -3.876573085784912, -3.732149839401245, -3.5877268314361572, -3.4433040618896484, -3.2988810539245605, -3.1544580459594727, -3.0100350379943848, -2.865612030029297, -2.721189022064209, -2.576765775680542, -2.432342767715454, -2.287919759750366, -2.1434967517852783, -1.9990737438201904, -1.854650616645813, -1.710227608680725, -1.5658046007156372, -1.4213814735412598, -1.2769584655761719, -1.1325352191925049, -0.988112211227417, -0.8436891436576843, -0.6992660760879517, -0.5548430681228638, -0.4104200601577759, -0.2659969925880432, -0.12157392501831055, 0.022849082946777344, 0.16727212071418762, 0.3116951584815979, 0.4561181962490082, 0.6005412340164185, 0.7449642419815063, 0.889387309551239, 1.0338103771209717, 1.1782333850860596, 1.3226563930511475, 1.4670794010162354, 1.6115025281906128, 1.7559255361557007, 1.9003485441207886, 2.044771671295166, 2.189194679260254, 2.333617687225342, 2.4780406951904297, 2.6224637031555176, 2.7668867111206055, 2.9113097190856934, 3.0557327270507812, 3.2001559734344482, 3.344578981399536, 3.489001989364624]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 10.0, 10.0, 8.0, 8.0, 13.0, 12.0, 13.0, 25.0, 31.0, 33.0, 47.0, 50.0, 52.0, 50.0, 49.0, 49.0, 61.0, 45.0, 46.0, 45.0, 40.0, 41.0, 43.0, 33.0, 42.0, 28.0, 28.0, 21.0, 14.0, 14.0, 14.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9463589191436768, -3.812131643295288, -3.6779046058654785, -3.54367733001709, -3.4094502925872803, -3.2752230167388916, -3.140995979309082, -3.0067687034606934, -2.8725414276123047, -2.738314151763916, -2.6040871143341064, -2.4698598384857178, -2.335632801055908, -2.2014055252075195, -2.067178249359131, -1.9329512119293213, -1.7987241744995117, -1.6644970178604126, -1.5302698612213135, -1.3960425853729248, -1.2618155479431152, -1.1275882720947266, -0.9933611154556274, -0.8591339588165283, -0.7249068021774292, -0.5906796455383301, -0.45645245909690857, -0.32222527265548706, -0.18799811601638794, -0.05377095937728882, 0.08045625686645508, 0.2146834135055542, 0.3489103317260742, 0.48313748836517334, 0.6173646450042725, 0.7515918612480164, 0.8858190178871155, 1.0200462341308594, 1.1542733907699585, 1.2885005474090576, 1.4227277040481567, 1.5569548606872559, 1.691182017326355, 1.825409173965454, 1.9596364498138428, 2.0938634872436523, 2.228090763092041, 2.3623180389404297, 2.4965450763702393, 2.630772352218628, 2.7649993896484375, 2.899226665496826, 3.0334537029266357, 3.1676809787750244, 3.301908016204834, 3.4361352920532227, 3.5703625679016113, 3.70458984375, 3.8388168811798096, 3.9730441570281982, 4.107271194458008, 4.2414984703063965, 4.375725746154785, 4.509952545166016, 4.644179821014404]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 5.0, 10.0, 19.0, 18.0, 40.0, 54.0, 111.0, 313.0, 905.0, 3822.0, 36691.0, 730076.0, 260429.0, 12996.0, 2043.0, 600.0, 208.0, 85.0, 53.0, 23.0, 8.0, 10.0, 5.0, 5.0, 1.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.3304443359375, -6.137451171875, -5.9444580078125, -5.75146484375, -5.5584716796875, -5.365478515625, -5.1724853515625, -4.9794921875, -4.7864990234375, -4.593505859375, -4.4005126953125, -4.20751953125, -4.0145263671875, -3.821533203125, -3.6285400390625, -3.435546875, -3.2425537109375, -3.049560546875, -2.8565673828125, -2.66357421875, -2.4705810546875, -2.277587890625, -2.0845947265625, -1.8916015625, -1.6986083984375, -1.505615234375, -1.3126220703125, -1.11962890625, -0.9266357421875, -0.733642578125, -0.5406494140625, -0.34765625, -0.1546630859375, 0.038330078125, 0.2313232421875, 0.42431640625, 0.6173095703125, 0.810302734375, 1.0032958984375, 1.1962890625, 1.3892822265625, 1.582275390625, 1.7752685546875, 1.96826171875, 2.1612548828125, 2.354248046875, 2.5472412109375, 2.740234375, 2.9332275390625, 3.126220703125, 3.3192138671875, 3.51220703125, 3.7052001953125, 3.898193359375, 4.0911865234375, 4.2841796875, 4.4771728515625, 4.670166015625, 4.8631591796875, 5.05615234375, 5.2491455078125, 5.442138671875, 5.6351318359375, 5.828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 9.0, 10.0, 30.0, 29.0, 36.0, 54.0, 60.0, 85.0, 91.0, 96.0, 111.0, 89.0, 68.0, 55.0, 52.0, 34.0, 16.0, 16.0, 15.0, 7.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5424346923828125, -1.482330322265625, -1.4222259521484375, -1.36212158203125, -1.3020172119140625, -1.241912841796875, -1.1818084716796875, -1.1217041015625, -1.0615997314453125, -1.001495361328125, -0.9413909912109375, -0.88128662109375, -0.8211822509765625, -0.761077880859375, -0.7009735107421875, -0.640869140625, -0.5807647705078125, -0.520660400390625, -0.4605560302734375, -0.40045166015625, -0.3403472900390625, -0.280242919921875, -0.2201385498046875, -0.1600341796875, -0.0999298095703125, -0.039825439453125, 0.0202789306640625, 0.08038330078125, 0.1404876708984375, 0.200592041015625, 0.2606964111328125, 0.32080078125, 0.3809051513671875, 0.441009521484375, 0.5011138916015625, 0.56121826171875, 0.6213226318359375, 0.681427001953125, 0.7415313720703125, 0.8016357421875, 0.8617401123046875, 0.921844482421875, 0.9819488525390625, 1.04205322265625, 1.1021575927734375, 1.162261962890625, 1.2223663330078125, 1.282470703125, 1.3425750732421875, 1.402679443359375, 1.4627838134765625, 1.52288818359375, 1.5829925537109375, 1.643096923828125, 1.7032012939453125, 1.7633056640625, 1.8234100341796875, 1.883514404296875, 1.9436187744140625, 2.00372314453125, 2.0638275146484375, 2.123931884765625, 2.1840362548828125, 2.244140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 4.0, 8.0, 13.0, 15.0, 26.0, 28.0, 68.0, 95.0, 166.0, 272.0, 536.0, 1239.0, 3799.0, 24285.0, 556697.0, 435249.0, 20186.0, 3393.0, 1224.0, 548.0, 270.0, 151.0, 94.0, 60.0, 43.0, 16.0, 18.0, 15.0, 11.0, 3.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.9921875, -4.8309326171875, -4.669677734375, -4.5084228515625, -4.34716796875, -4.1859130859375, -4.024658203125, -3.8634033203125, -3.7021484375, -3.5408935546875, -3.379638671875, -3.2183837890625, -3.05712890625, -2.8958740234375, -2.734619140625, -2.5733642578125, -2.412109375, -2.2508544921875, -2.089599609375, -1.9283447265625, -1.76708984375, -1.6058349609375, -1.444580078125, -1.2833251953125, -1.1220703125, -0.9608154296875, -0.799560546875, -0.6383056640625, -0.47705078125, -0.3157958984375, -0.154541015625, 0.0067138671875, 0.16796875, 0.3292236328125, 0.490478515625, 0.6517333984375, 0.81298828125, 0.9742431640625, 1.135498046875, 1.2967529296875, 1.4580078125, 1.6192626953125, 1.780517578125, 1.9417724609375, 2.10302734375, 2.2642822265625, 2.425537109375, 2.5867919921875, 2.748046875, 2.9093017578125, 3.070556640625, 3.2318115234375, 3.39306640625, 3.5543212890625, 3.715576171875, 3.8768310546875, 4.0380859375, 4.1993408203125, 4.360595703125, 4.5218505859375, 4.68310546875, 4.8443603515625, 5.005615234375, 5.1668701171875, 5.328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 5.0, 10.0, 7.0, 11.0, 11.0, 10.0, 13.0, 10.0, 24.0, 18.0, 21.0, 31.0, 26.0, 41.0, 38.0, 35.0, 43.0, 48.0, 27.0, 40.0, 45.0, 38.0, 56.0, 47.0, 30.0, 39.0, 40.0, 38.0, 31.0, 29.0, 24.0, 24.0, 13.0, 15.0, 10.0, 12.0, 11.0, 6.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.48828125, -3.35858154296875, -3.2288818359375, -3.09918212890625, -2.969482421875, -2.83978271484375, -2.7100830078125, -2.58038330078125, -2.45068359375, -2.32098388671875, -2.1912841796875, -2.06158447265625, -1.931884765625, -1.80218505859375, -1.6724853515625, -1.54278564453125, -1.4130859375, -1.28338623046875, -1.1536865234375, -1.02398681640625, -0.894287109375, -0.76458740234375, -0.6348876953125, -0.50518798828125, -0.37548828125, -0.24578857421875, -0.1160888671875, 0.01361083984375, 0.143310546875, 0.27301025390625, 0.4027099609375, 0.53240966796875, 0.662109375, 0.79180908203125, 0.9215087890625, 1.05120849609375, 1.180908203125, 1.31060791015625, 1.4403076171875, 1.57000732421875, 1.69970703125, 1.82940673828125, 1.9591064453125, 2.08880615234375, 2.218505859375, 2.34820556640625, 2.4779052734375, 2.60760498046875, 2.7373046875, 2.86700439453125, 2.9967041015625, 3.12640380859375, 3.256103515625, 3.38580322265625, 3.5155029296875, 3.64520263671875, 3.77490234375, 3.90460205078125, 4.0343017578125, 4.16400146484375, 4.293701171875, 4.42340087890625, 4.5531005859375, 4.68280029296875, 4.8125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 8.0, 11.0, 21.0, 32.0, 41.0, 68.0, 128.0, 225.0, 622.0, 1472.0, 5418.0, 36299.0, 498223.0, 464109.0, 34258.0, 5085.0, 1456.0, 536.0, 229.0, 129.0, 70.0, 37.0, 23.0, 16.0, 11.0, 6.0, 9.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7825164794921875, -1.730072021484375, -1.6776275634765625, -1.62518310546875, -1.5727386474609375, -1.520294189453125, -1.4678497314453125, -1.4154052734375, -1.3629608154296875, -1.310516357421875, -1.2580718994140625, -1.20562744140625, -1.1531829833984375, -1.100738525390625, -1.0482940673828125, -0.995849609375, -0.9434051513671875, -0.890960693359375, -0.8385162353515625, -0.78607177734375, -0.7336273193359375, -0.681182861328125, -0.6287384033203125, -0.5762939453125, -0.5238494873046875, -0.471405029296875, -0.4189605712890625, -0.36651611328125, -0.3140716552734375, -0.261627197265625, -0.2091827392578125, -0.15673828125, -0.1042938232421875, -0.051849365234375, 0.0005950927734375, 0.05303955078125, 0.1054840087890625, 0.157928466796875, 0.2103729248046875, 0.2628173828125, 0.3152618408203125, 0.367706298828125, 0.4201507568359375, 0.47259521484375, 0.5250396728515625, 0.577484130859375, 0.6299285888671875, 0.682373046875, 0.7348175048828125, 0.787261962890625, 0.8397064208984375, 0.89215087890625, 0.9445953369140625, 0.997039794921875, 1.0494842529296875, 1.1019287109375, 1.1543731689453125, 1.206817626953125, 1.2592620849609375, 1.31170654296875, 1.3641510009765625, 1.416595458984375, 1.4690399169921875, 1.521484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 3.0, 7.0, 9.0, 9.0, 10.0, 11.0, 16.0, 23.0, 19.0, 29.0, 23.0, 42.0, 60.0, 56.0, 70.0, 76.0, 74.0, 83.0, 65.0, 49.0, 45.0, 36.0, 36.0, 19.0, 25.0, 21.0, 21.0, 19.0, 4.0, 8.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00018739700317382812, -0.00018121488392353058, -0.00017503276467323303, -0.00016885064542293549, -0.00016266852617263794, -0.0001564864069223404, -0.00015030428767204285, -0.0001441221684217453, -0.00013794004917144775, -0.0001317579299211502, -0.00012557581067085266, -0.00011939369142055511, -0.00011321157217025757, -0.00010702945291996002, -0.00010084733366966248, -9.466521441936493e-05, -8.848309516906738e-05, -8.230097591876984e-05, -7.611885666847229e-05, -6.993673741817474e-05, -6.37546181678772e-05, -5.757249891757965e-05, -5.1390379667282104e-05, -4.520826041698456e-05, -3.902614116668701e-05, -3.2844021916389465e-05, -2.666190266609192e-05, -2.0479783415794373e-05, -1.4297664165496826e-05, -8.11554491519928e-06, -1.9334256649017334e-06, 4.248693585395813e-06, 1.043081283569336e-05, 1.6612932085990906e-05, 2.2795051336288452e-05, 2.8977170586586e-05, 3.5159289836883545e-05, 4.134140908718109e-05, 4.752352833747864e-05, 5.3705647587776184e-05, 5.988776683807373e-05, 6.606988608837128e-05, 7.225200533866882e-05, 7.843412458896637e-05, 8.461624383926392e-05, 9.079836308956146e-05, 9.698048233985901e-05, 0.00010316260159015656, 0.0001093447208404541, 0.00011552684009075165, 0.0001217089593410492, 0.00012789107859134674, 0.0001340731978416443, 0.00014025531709194183, 0.00014643743634223938, 0.00015261955559253693, 0.00015880167484283447, 0.00016498379409313202, 0.00017116591334342957, 0.0001773480325937271, 0.00018353015184402466, 0.0001897122710943222, 0.00019589439034461975, 0.0002020765095949173, 0.00020825862884521484]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 13.0, 12.0, 24.0, 28.0, 53.0, 99.0, 178.0, 435.0, 949.0, 2734.0, 15411.0, 269132.0, 710990.0, 41099.0, 4964.0, 1336.0, 524.0, 245.0, 123.0, 77.0, 52.0, 32.0, 17.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.283538818359375, -2.22528076171875, -2.167022705078125, -2.1087646484375, -2.050506591796875, -1.99224853515625, -1.933990478515625, -1.875732421875, -1.817474365234375, -1.75921630859375, -1.700958251953125, -1.6427001953125, -1.584442138671875, -1.52618408203125, -1.467926025390625, -1.40966796875, -1.351409912109375, -1.29315185546875, -1.234893798828125, -1.1766357421875, -1.118377685546875, -1.06011962890625, -1.001861572265625, -0.943603515625, -0.885345458984375, -0.82708740234375, -0.768829345703125, -0.7105712890625, -0.652313232421875, -0.59405517578125, -0.535797119140625, -0.4775390625, -0.419281005859375, -0.36102294921875, -0.302764892578125, -0.2445068359375, -0.186248779296875, -0.12799072265625, -0.069732666015625, -0.011474609375, 0.046783447265625, 0.10504150390625, 0.163299560546875, 0.2215576171875, 0.279815673828125, 0.33807373046875, 0.396331787109375, 0.45458984375, 0.512847900390625, 0.57110595703125, 0.629364013671875, 0.6876220703125, 0.745880126953125, 0.80413818359375, 0.862396240234375, 0.920654296875, 0.978912353515625, 1.03717041015625, 1.095428466796875, 1.1536865234375, 1.211944580078125, 1.27020263671875, 1.328460693359375, 1.38671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 4.0, 10.0, 17.0, 21.0, 30.0, 42.0, 39.0, 54.0, 55.0, 67.0, 68.0, 73.0, 84.0, 74.0, 63.0, 42.0, 43.0, 46.0, 37.0, 27.0, 19.0, 19.0, 14.0, 7.0, 7.0, 3.0, 3.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3193359375, -1.2818145751953125, -1.244293212890625, -1.2067718505859375, -1.16925048828125, -1.1317291259765625, -1.094207763671875, -1.0566864013671875, -1.0191650390625, -0.9816436767578125, -0.944122314453125, -0.9066009521484375, -0.86907958984375, -0.8315582275390625, -0.794036865234375, -0.7565155029296875, -0.718994140625, -0.6814727783203125, -0.643951416015625, -0.6064300537109375, -0.56890869140625, -0.5313873291015625, -0.493865966796875, -0.4563446044921875, -0.4188232421875, -0.3813018798828125, -0.343780517578125, -0.3062591552734375, -0.26873779296875, -0.2312164306640625, -0.193695068359375, -0.1561737060546875, -0.11865234375, -0.0811309814453125, -0.043609619140625, -0.0060882568359375, 0.03143310546875, 0.0689544677734375, 0.106475830078125, 0.1439971923828125, 0.1815185546875, 0.2190399169921875, 0.256561279296875, 0.2940826416015625, 0.33160400390625, 0.3691253662109375, 0.406646728515625, 0.4441680908203125, 0.481689453125, 0.5192108154296875, 0.556732177734375, 0.5942535400390625, 0.63177490234375, 0.6692962646484375, 0.706817626953125, 0.7443389892578125, 0.7818603515625, 0.8193817138671875, 0.856903076171875, 0.8944244384765625, 0.93194580078125, 0.9694671630859375, 1.006988525390625, 1.0445098876953125, 1.08203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 33.0, 171.0, 356.0, 301.0, 99.0, 30.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-86.47315216064453, -84.4529800415039, -82.43280029296875, -80.41262817382812, -78.3924560546875, -76.37227630615234, -74.35210418701172, -72.33192443847656, -70.31175231933594, -68.29158020019531, -66.27140045166016, -64.25122833251953, -62.23105239868164, -60.21087646484375, -58.190704345703125, -56.170528411865234, -54.150352478027344, -52.13017654418945, -50.11000061035156, -48.08982849121094, -46.06965255737305, -44.049476623535156, -42.02930450439453, -40.00912857055664, -37.98895263671875, -35.96877670288086, -33.94860076904297, -31.928428649902344, -29.908252716064453, -27.888076782226562, -25.867902755737305, -23.847728729248047, -21.827552795410156, -19.807376861572266, -17.787202835083008, -15.767027854919434, -13.74685287475586, -11.726677894592285, -9.706502914428711, -7.686327934265137, -5.6661529541015625, -3.6459779739379883, -1.625802993774414, 0.39437198638916016, 2.4145469665527344, 4.434721946716309, 6.454896926879883, 8.475071907043457, 10.495246887207031, 12.515421867370605, 14.53559684753418, 16.555770874023438, 18.575946807861328, 20.59612274169922, 22.616296768188477, 24.636470794677734, 26.656646728515625, 28.676822662353516, 30.696996688842773, 32.71717071533203, 34.73734664916992, 36.75752258300781, 38.77769470214844, 40.79787063598633, 42.81804656982422]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 7.0, 8.0, 14.0, 28.0, 25.0, 19.0, 25.0, 35.0, 49.0, 37.0, 41.0, 50.0, 63.0, 65.0, 70.0, 61.0, 61.0, 65.0, 43.0, 31.0, 28.0, 36.0, 22.0, 25.0, 12.0, 13.0, 13.0, 10.0, 6.0, 6.0, 4.0, 1.0, 7.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.728443145751953, -21.991424560546875, -21.254405975341797, -20.51738739013672, -19.78036880493164, -19.043350219726562, -18.306331634521484, -17.569313049316406, -16.832294464111328, -16.09527587890625, -15.358257293701172, -14.621238708496094, -13.884220123291016, -13.147201538085938, -12.41018295288086, -11.673164367675781, -10.936144828796387, -10.199126243591309, -9.46210765838623, -8.725089073181152, -7.988070487976074, -7.251051902770996, -6.51403284072876, -5.777014255523682, -5.0399956703186035, -4.302977085113525, -3.5659584999084473, -2.82893967628479, -2.091921091079712, -1.3549025058746338, -0.6178836822509766, 0.11913490295410156, 0.8561534881591797, 1.5931720733642578, 2.330190658569336, 3.067209482192993, 3.8042280673980713, 4.54124641418457, 5.278265476226807, 6.015284061431885, 6.752302646636963, 7.489321231842041, 8.226340293884277, 8.963358879089355, 9.700377464294434, 10.437396049499512, 11.17441463470459, 11.911433219909668, 12.648451805114746, 13.385470390319824, 14.122488975524902, 14.85950756072998, 15.596526145935059, 16.333545684814453, 17.07056427001953, 17.80758285522461, 18.544601440429688, 19.281620025634766, 20.018638610839844, 20.755657196044922, 21.49267578125, 22.229694366455078, 22.966712951660156, 23.703731536865234, 24.440750122070312]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 3.0, 7.0, 4.0, 5.0, 14.0, 17.0, 20.0, 42.0, 46.0, 104.0, 185.0, 588.0, 2283.0, 19163.0, 1132759.0, 3000528.0, 33539.0, 3525.0, 791.0, 268.0, 126.0, 94.0, 62.0, 30.0, 24.0, 18.0, 7.0, 6.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.931640625, -3.81634521484375, -3.7010498046875, -3.58575439453125, -3.470458984375, -3.35516357421875, -3.2398681640625, -3.12457275390625, -3.00927734375, -2.89398193359375, -2.7786865234375, -2.66339111328125, -2.548095703125, -2.43280029296875, -2.3175048828125, -2.20220947265625, -2.0869140625, -1.97161865234375, -1.8563232421875, -1.74102783203125, -1.625732421875, -1.51043701171875, -1.3951416015625, -1.27984619140625, -1.16455078125, -1.04925537109375, -0.9339599609375, -0.81866455078125, -0.703369140625, -0.58807373046875, -0.4727783203125, -0.35748291015625, -0.2421875, -0.12689208984375, -0.0115966796875, 0.10369873046875, 0.218994140625, 0.33428955078125, 0.4495849609375, 0.56488037109375, 0.68017578125, 0.79547119140625, 0.9107666015625, 1.02606201171875, 1.141357421875, 1.25665283203125, 1.3719482421875, 1.48724365234375, 1.6025390625, 1.71783447265625, 1.8331298828125, 1.94842529296875, 2.063720703125, 2.17901611328125, 2.2943115234375, 2.40960693359375, 2.52490234375, 2.64019775390625, 2.7554931640625, 2.87078857421875, 2.986083984375, 3.10137939453125, 3.2166748046875, 3.33197021484375, 3.447265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 12.0, 14.0, 18.0, 29.0, 21.0, 23.0, 38.0, 46.0, 38.0, 61.0, 76.0, 64.0, 63.0, 82.0, 64.0, 57.0, 48.0, 43.0, 28.0, 33.0, 29.0, 24.0, 20.0, 15.0, 11.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.021484375, -0.9857330322265625, -0.949981689453125, -0.9142303466796875, -0.87847900390625, -0.8427276611328125, -0.806976318359375, -0.7712249755859375, -0.7354736328125, -0.6997222900390625, -0.663970947265625, -0.6282196044921875, -0.59246826171875, -0.5567169189453125, -0.520965576171875, -0.4852142333984375, -0.449462890625, -0.4137115478515625, -0.377960205078125, -0.3422088623046875, -0.30645751953125, -0.2707061767578125, -0.234954833984375, -0.1992034912109375, -0.1634521484375, -0.1277008056640625, -0.091949462890625, -0.0561981201171875, -0.02044677734375, 0.0153045654296875, 0.051055908203125, 0.0868072509765625, 0.12255859375, 0.1583099365234375, 0.194061279296875, 0.2298126220703125, 0.26556396484375, 0.3013153076171875, 0.337066650390625, 0.3728179931640625, 0.4085693359375, 0.4443206787109375, 0.480072021484375, 0.5158233642578125, 0.55157470703125, 0.5873260498046875, 0.623077392578125, 0.6588287353515625, 0.694580078125, 0.7303314208984375, 0.766082763671875, 0.8018341064453125, 0.83758544921875, 0.8733367919921875, 0.909088134765625, 0.9448394775390625, 0.9805908203125, 1.0163421630859375, 1.052093505859375, 1.0878448486328125, 1.12359619140625, 1.1593475341796875, 1.195098876953125, 1.2308502197265625, 1.2666015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 8.0, 10.0, 11.0, 14.0, 28.0, 40.0, 88.0, 159.0, 428.0, 1300.0, 5412.0, 35263.0, 951819.0, 3109024.0, 78262.0, 9411.0, 1998.0, 581.0, 189.0, 99.0, 34.0, 24.0, 18.0, 11.0, 8.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.125946044921875, -3.03704833984375, -2.948150634765625, -2.8592529296875, -2.770355224609375, -2.68145751953125, -2.592559814453125, -2.503662109375, -2.414764404296875, -2.32586669921875, -2.236968994140625, -2.1480712890625, -2.059173583984375, -1.97027587890625, -1.881378173828125, -1.79248046875, -1.703582763671875, -1.61468505859375, -1.525787353515625, -1.4368896484375, -1.347991943359375, -1.25909423828125, -1.170196533203125, -1.081298828125, -0.992401123046875, -0.90350341796875, -0.814605712890625, -0.7257080078125, -0.636810302734375, -0.54791259765625, -0.459014892578125, -0.3701171875, -0.281219482421875, -0.19232177734375, -0.103424072265625, -0.0145263671875, 0.074371337890625, 0.16326904296875, 0.252166748046875, 0.341064453125, 0.429962158203125, 0.51885986328125, 0.607757568359375, 0.6966552734375, 0.785552978515625, 0.87445068359375, 0.963348388671875, 1.05224609375, 1.141143798828125, 1.23004150390625, 1.318939208984375, 1.4078369140625, 1.496734619140625, 1.58563232421875, 1.674530029296875, 1.763427734375, 1.852325439453125, 1.94122314453125, 2.030120849609375, 2.1190185546875, 2.207916259765625, 2.29681396484375, 2.385711669921875, 2.474609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 16.0, 12.0, 24.0, 28.0, 52.0, 66.0, 104.0, 198.0, 330.0, 527.0, 703.0, 720.0, 494.0, 295.0, 188.0, 101.0, 52.0, 33.0, 31.0, 22.0, 14.0, 9.0, 11.0, 5.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.220703125, -2.153350830078125, -2.08599853515625, -2.018646240234375, -1.9512939453125, -1.883941650390625, -1.81658935546875, -1.749237060546875, -1.681884765625, -1.614532470703125, -1.54718017578125, -1.479827880859375, -1.4124755859375, -1.345123291015625, -1.27777099609375, -1.210418701171875, -1.14306640625, -1.075714111328125, -1.00836181640625, -0.941009521484375, -0.8736572265625, -0.806304931640625, -0.73895263671875, -0.671600341796875, -0.604248046875, -0.536895751953125, -0.46954345703125, -0.402191162109375, -0.3348388671875, -0.267486572265625, -0.20013427734375, -0.132781982421875, -0.0654296875, 0.001922607421875, 0.06927490234375, 0.136627197265625, 0.2039794921875, 0.271331787109375, 0.33868408203125, 0.406036376953125, 0.473388671875, 0.540740966796875, 0.60809326171875, 0.675445556640625, 0.7427978515625, 0.810150146484375, 0.87750244140625, 0.944854736328125, 1.01220703125, 1.079559326171875, 1.14691162109375, 1.214263916015625, 1.2816162109375, 1.348968505859375, 1.41632080078125, 1.483673095703125, 1.551025390625, 1.618377685546875, 1.68572998046875, 1.753082275390625, 1.8204345703125, 1.887786865234375, 1.95513916015625, 2.022491455078125, 2.08984375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 7.0, 7.0, 14.0, 21.0, 38.0, 59.0, 85.0, 128.0, 128.0, 149.0, 150.0, 90.0, 54.0, 20.0, 13.0, 13.0, 4.0, 4.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.2736759185791, -16.79802703857422, -16.32238006591797, -15.846731185913086, -15.371082305908203, -14.895434379577637, -14.41978645324707, -13.944137573242188, -13.468489646911621, -12.992841720581055, -12.517192840576172, -12.041544914245605, -11.565896034240723, -11.090248107910156, -10.614599227905273, -10.138951301574707, -9.66330337524414, -9.187655448913574, -8.712006568908691, -8.236358642578125, -7.7607102394104, -7.285061836242676, -6.809413433074951, -6.333765029907227, -5.858116149902344, -5.382467746734619, -4.9068193435668945, -4.431171417236328, -3.9555230140686035, -3.479874610900879, -3.0042262077331543, -2.528578042984009, -2.0529298782348633, -1.5772815942764282, -1.1016333103179932, -0.6259849071502686, -0.1503366231918335, 0.32531166076660156, 0.8009600639343262, 1.2766082286834717, 1.7522566318511963, 2.227905035018921, 2.7035531997680664, 3.179201602935791, 3.6548500061035156, 4.130497932434082, 4.606146812438965, 5.081794738769531, 5.557443141937256, 6.0330915451049805, 6.508739948272705, 6.98438835144043, 7.460036277770996, 7.935684680938721, 8.411333084106445, 8.886981010437012, 9.362629890441895, 9.838277816772461, 10.313926696777344, 10.78957462310791, 11.265223503112793, 11.74087142944336, 12.216520309448242, 12.692168235778809, 13.167816162109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 11.0, 6.0, 9.0, 13.0, 13.0, 20.0, 28.0, 21.0, 26.0, 26.0, 39.0, 41.0, 56.0, 63.0, 52.0, 57.0, 68.0, 66.0, 59.0, 46.0, 40.0, 39.0, 38.0, 39.0, 25.0, 22.0, 16.0, 17.0, 13.0, 10.0, 9.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.717267036437988, -11.328336715698242, -10.93940544128418, -10.550475120544434, -10.161544799804688, -9.772613525390625, -9.383683204650879, -8.994752883911133, -8.60582160949707, -8.216891288757324, -7.827960014343262, -7.439029693603516, -7.050098896026611, -6.661168098449707, -6.272237777709961, -5.883306980133057, -5.494376182556152, -5.105445384979248, -4.716514587402344, -4.327584266662598, -3.9386534690856934, -3.549722671508789, -3.160792112350464, -2.7718615531921387, -2.3829307556152344, -1.9940000772476196, -1.6050693988800049, -1.2161387205123901, -0.8272080421447754, -0.43827736377716064, -0.0493466854095459, 0.3395838737487793, 0.7285137176513672, 1.117444396018982, 1.5063750743865967, 1.8953057527542114, 2.284236431121826, 2.6731672286987305, 3.0620977878570557, 3.451028347015381, 3.839959144592285, 4.2288899421691895, 4.617820739746094, 5.00675106048584, 5.395681858062744, 5.784612655639648, 6.1735429763793945, 6.562473773956299, 6.951404571533203, 7.340335369110107, 7.729266166687012, 8.118196487426758, 8.50712776184082, 8.896058082580566, 9.284988403320312, 9.673919677734375, 10.062849998474121, 10.451780319213867, 10.84071159362793, 11.229641914367676, 11.618572235107422, 12.007503509521484, 12.39643383026123, 12.785364151000977, 13.174295425415039]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 6.0, 16.0, 22.0, 39.0, 34.0, 53.0, 104.0, 148.0, 221.0, 345.0, 538.0, 873.0, 1543.0, 2827.0, 5190.0, 9927.0, 20796.0, 46676.0, 115530.0, 297178.0, 320688.0, 128038.0, 51282.0, 22891.0, 10930.0, 5627.0, 2833.0, 1605.0, 974.0, 582.0, 333.0, 243.0, 148.0, 114.0, 48.0, 40.0, 31.0, 19.0, 18.0, 10.0, 5.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.21875, -1.17950439453125, -1.1402587890625, -1.10101318359375, -1.061767578125, -1.02252197265625, -0.9832763671875, -0.94403076171875, -0.90478515625, -0.86553955078125, -0.8262939453125, -0.78704833984375, -0.747802734375, -0.70855712890625, -0.6693115234375, -0.63006591796875, -0.5908203125, -0.55157470703125, -0.5123291015625, -0.47308349609375, -0.433837890625, -0.39459228515625, -0.3553466796875, -0.31610107421875, -0.27685546875, -0.23760986328125, -0.1983642578125, -0.15911865234375, -0.119873046875, -0.08062744140625, -0.0413818359375, -0.00213623046875, 0.037109375, 0.07635498046875, 0.1156005859375, 0.15484619140625, 0.194091796875, 0.23333740234375, 0.2725830078125, 0.31182861328125, 0.35107421875, 0.39031982421875, 0.4295654296875, 0.46881103515625, 0.508056640625, 0.54730224609375, 0.5865478515625, 0.62579345703125, 0.6650390625, 0.70428466796875, 0.7435302734375, 0.78277587890625, 0.822021484375, 0.86126708984375, 0.9005126953125, 0.93975830078125, 0.97900390625, 1.01824951171875, 1.0574951171875, 1.09674072265625, 1.135986328125, 1.17523193359375, 1.2144775390625, 1.25372314453125, 1.29296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 9.0, 7.0, 9.0, 9.0, 15.0, 14.0, 18.0, 22.0, 33.0, 30.0, 38.0, 48.0, 38.0, 49.0, 47.0, 45.0, 55.0, 60.0, 57.0, 63.0, 45.0, 43.0, 23.0, 37.0, 39.0, 18.0, 21.0, 16.0, 18.0, 15.0, 17.0, 9.0, 5.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.087890625, -1.059173583984375, -1.03045654296875, -1.001739501953125, -0.9730224609375, -0.944305419921875, -0.91558837890625, -0.886871337890625, -0.858154296875, -0.829437255859375, -0.80072021484375, -0.772003173828125, -0.7432861328125, -0.714569091796875, -0.68585205078125, -0.657135009765625, -0.62841796875, -0.599700927734375, -0.57098388671875, -0.542266845703125, -0.5135498046875, -0.484832763671875, -0.45611572265625, -0.427398681640625, -0.398681640625, -0.369964599609375, -0.34124755859375, -0.312530517578125, -0.2838134765625, -0.255096435546875, -0.22637939453125, -0.197662353515625, -0.1689453125, -0.140228271484375, -0.11151123046875, -0.082794189453125, -0.0540771484375, -0.025360107421875, 0.00335693359375, 0.032073974609375, 0.060791015625, 0.089508056640625, 0.11822509765625, 0.146942138671875, 0.1756591796875, 0.204376220703125, 0.23309326171875, 0.261810302734375, 0.29052734375, 0.319244384765625, 0.34796142578125, 0.376678466796875, 0.4053955078125, 0.434112548828125, 0.46282958984375, 0.491546630859375, 0.520263671875, 0.548980712890625, 0.57769775390625, 0.606414794921875, 0.6351318359375, 0.663848876953125, 0.69256591796875, 0.721282958984375, 0.75]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 15.0, 24.0, 21.0, 39.0, 50.0, 93.0, 158.0, 212.0, 418.0, 719.0, 1496.0, 4433.0, 23872.0, 399311.0, 578797.0, 30306.0, 4927.0, 1714.0, 825.0, 438.0, 255.0, 147.0, 90.0, 56.0, 33.0, 26.0, 10.0, 9.0, 12.0, 6.0, 5.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.65625, -3.54217529296875, -3.4281005859375, -3.31402587890625, -3.199951171875, -3.08587646484375, -2.9718017578125, -2.85772705078125, -2.74365234375, -2.62957763671875, -2.5155029296875, -2.40142822265625, -2.287353515625, -2.17327880859375, -2.0592041015625, -1.94512939453125, -1.8310546875, -1.71697998046875, -1.6029052734375, -1.48883056640625, -1.374755859375, -1.26068115234375, -1.1466064453125, -1.03253173828125, -0.91845703125, -0.80438232421875, -0.6903076171875, -0.57623291015625, -0.462158203125, -0.34808349609375, -0.2340087890625, -0.11993408203125, -0.005859375, 0.10821533203125, 0.2222900390625, 0.33636474609375, 0.450439453125, 0.56451416015625, 0.6785888671875, 0.79266357421875, 0.90673828125, 1.02081298828125, 1.1348876953125, 1.24896240234375, 1.363037109375, 1.47711181640625, 1.5911865234375, 1.70526123046875, 1.8193359375, 1.93341064453125, 2.0474853515625, 2.16156005859375, 2.275634765625, 2.38970947265625, 2.5037841796875, 2.61785888671875, 2.73193359375, 2.84600830078125, 2.9600830078125, 3.07415771484375, 3.188232421875, 3.30230712890625, 3.4163818359375, 3.53045654296875, 3.64453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 15.0, 9.0, 9.0, 21.0, 12.0, 15.0, 17.0, 18.0, 20.0, 24.0, 22.0, 41.0, 39.0, 39.0, 40.0, 41.0, 41.0, 56.0, 42.0, 40.0, 54.0, 41.0, 44.0, 38.0, 37.0, 32.0, 33.0, 26.0, 27.0, 18.0, 16.0, 13.0, 13.0, 13.0, 7.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.08203125, -3.96868896484375, -3.8553466796875, -3.74200439453125, -3.628662109375, -3.51531982421875, -3.4019775390625, -3.28863525390625, -3.17529296875, -3.06195068359375, -2.9486083984375, -2.83526611328125, -2.721923828125, -2.60858154296875, -2.4952392578125, -2.38189697265625, -2.2685546875, -2.15521240234375, -2.0418701171875, -1.92852783203125, -1.815185546875, -1.70184326171875, -1.5885009765625, -1.47515869140625, -1.36181640625, -1.24847412109375, -1.1351318359375, -1.02178955078125, -0.908447265625, -0.79510498046875, -0.6817626953125, -0.56842041015625, -0.455078125, -0.34173583984375, -0.2283935546875, -0.11505126953125, -0.001708984375, 0.11163330078125, 0.2249755859375, 0.33831787109375, 0.45166015625, 0.56500244140625, 0.6783447265625, 0.79168701171875, 0.905029296875, 1.01837158203125, 1.1317138671875, 1.24505615234375, 1.3583984375, 1.47174072265625, 1.5850830078125, 1.69842529296875, 1.811767578125, 1.92510986328125, 2.0384521484375, 2.15179443359375, 2.26513671875, 2.37847900390625, 2.4918212890625, 2.60516357421875, 2.718505859375, 2.83184814453125, 2.9451904296875, 3.05853271484375, 3.171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 10.0, 10.0, 16.0, 25.0, 26.0, 50.0, 81.0, 99.0, 143.0, 272.0, 466.0, 867.0, 1921.0, 4976.0, 16630.0, 75115.0, 640901.0, 251400.0, 38968.0, 10128.0, 3323.0, 1336.0, 710.0, 386.0, 249.0, 145.0, 81.0, 65.0, 41.0, 27.0, 15.0, 12.0, 12.0, 10.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.083984375, -1.049896240234375, -1.01580810546875, -0.981719970703125, -0.9476318359375, -0.913543701171875, -0.87945556640625, -0.845367431640625, -0.811279296875, -0.777191162109375, -0.74310302734375, -0.709014892578125, -0.6749267578125, -0.640838623046875, -0.60675048828125, -0.572662353515625, -0.53857421875, -0.504486083984375, -0.47039794921875, -0.436309814453125, -0.4022216796875, -0.368133544921875, -0.33404541015625, -0.299957275390625, -0.265869140625, -0.231781005859375, -0.19769287109375, -0.163604736328125, -0.1295166015625, -0.095428466796875, -0.06134033203125, -0.027252197265625, 0.0068359375, 0.040924072265625, 0.07501220703125, 0.109100341796875, 0.1431884765625, 0.177276611328125, 0.21136474609375, 0.245452880859375, 0.279541015625, 0.313629150390625, 0.34771728515625, 0.381805419921875, 0.4158935546875, 0.449981689453125, 0.48406982421875, 0.518157958984375, 0.55224609375, 0.586334228515625, 0.62042236328125, 0.654510498046875, 0.6885986328125, 0.722686767578125, 0.75677490234375, 0.790863037109375, 0.824951171875, 0.859039306640625, 0.89312744140625, 0.927215576171875, 0.9613037109375, 0.995391845703125, 1.02947998046875, 1.063568115234375, 1.09765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 5.0, 9.0, 9.0, 3.0, 13.0, 8.0, 6.0, 12.0, 19.0, 29.0, 33.0, 42.0, 54.0, 82.0, 126.0, 135.0, 104.0, 76.0, 46.0, 27.0, 19.0, 26.0, 13.0, 19.0, 13.0, 8.0, 5.0, 3.0, 7.0, 6.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002124309539794922, -0.00020540505647659302, -0.00019837915897369385, -0.00019135326147079468, -0.0001843273639678955, -0.00017730146646499634, -0.00017027556896209717, -0.000163249671459198, -0.00015622377395629883, -0.00014919787645339966, -0.0001421719789505005, -0.00013514608144760132, -0.00012812018394470215, -0.00012109428644180298, -0.00011406838893890381, -0.00010704249143600464, -0.00010001659393310547, -9.29906964302063e-05, -8.596479892730713e-05, -7.893890142440796e-05, -7.191300392150879e-05, -6.488710641860962e-05, -5.786120891571045e-05, -5.083531141281128e-05, -4.380941390991211e-05, -3.678351640701294e-05, -2.975761890411377e-05, -2.27317214012146e-05, -1.570582389831543e-05, -8.67992639541626e-06, -1.6540288925170898e-06, 5.37186861038208e-06, 1.239776611328125e-05, 1.942366361618042e-05, 2.644956111907959e-05, 3.347545862197876e-05, 4.050135612487793e-05, 4.75272536277771e-05, 5.455315113067627e-05, 6.157904863357544e-05, 6.860494613647461e-05, 7.563084363937378e-05, 8.265674114227295e-05, 8.968263864517212e-05, 9.670853614807129e-05, 0.00010373443365097046, 0.00011076033115386963, 0.0001177862286567688, 0.00012481212615966797, 0.00013183802366256714, 0.0001388639211654663, 0.00014588981866836548, 0.00015291571617126465, 0.00015994161367416382, 0.000166967511177063, 0.00017399340867996216, 0.00018101930618286133, 0.0001880452036857605, 0.00019507110118865967, 0.00020209699869155884, 0.000209122896194458, 0.00021614879369735718, 0.00022317469120025635, 0.00023020058870315552, 0.0002372264862060547]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 11.0, 13.0, 23.0, 18.0, 33.0, 69.0, 102.0, 154.0, 255.0, 402.0, 798.0, 1850.0, 4973.0, 20419.0, 162201.0, 758099.0, 80033.0, 12638.0, 3488.0, 1388.0, 687.0, 320.0, 209.0, 133.0, 78.0, 40.0, 39.0, 29.0, 13.0, 14.0, 9.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.68359375, -1.64080810546875, -1.5980224609375, -1.55523681640625, -1.512451171875, -1.46966552734375, -1.4268798828125, -1.38409423828125, -1.34130859375, -1.29852294921875, -1.2557373046875, -1.21295166015625, -1.170166015625, -1.12738037109375, -1.0845947265625, -1.04180908203125, -0.9990234375, -0.95623779296875, -0.9134521484375, -0.87066650390625, -0.827880859375, -0.78509521484375, -0.7423095703125, -0.69952392578125, -0.65673828125, -0.61395263671875, -0.5711669921875, -0.52838134765625, -0.485595703125, -0.44281005859375, -0.4000244140625, -0.35723876953125, -0.314453125, -0.27166748046875, -0.2288818359375, -0.18609619140625, -0.143310546875, -0.10052490234375, -0.0577392578125, -0.01495361328125, 0.02783203125, 0.07061767578125, 0.1134033203125, 0.15618896484375, 0.198974609375, 0.24176025390625, 0.2845458984375, 0.32733154296875, 0.3701171875, 0.41290283203125, 0.4556884765625, 0.49847412109375, 0.541259765625, 0.58404541015625, 0.6268310546875, 0.66961669921875, 0.71240234375, 0.75518798828125, 0.7979736328125, 0.84075927734375, 0.883544921875, 0.92633056640625, 0.9691162109375, 1.01190185546875, 1.0546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 12.0, 11.0, 15.0, 16.0, 26.0, 33.0, 47.0, 60.0, 92.0, 117.0, 124.0, 91.0, 92.0, 66.0, 52.0, 42.0, 27.0, 14.0, 21.0, 11.0, 8.0, 3.0, 7.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.4398345947265625, -1.394317626953125, -1.3488006591796875, -1.30328369140625, -1.2577667236328125, -1.212249755859375, -1.1667327880859375, -1.1212158203125, -1.0756988525390625, -1.030181884765625, -0.9846649169921875, -0.93914794921875, -0.8936309814453125, -0.848114013671875, -0.8025970458984375, -0.757080078125, -0.7115631103515625, -0.666046142578125, -0.6205291748046875, -0.57501220703125, -0.5294952392578125, -0.483978271484375, -0.4384613037109375, -0.3929443359375, -0.3474273681640625, -0.301910400390625, -0.2563934326171875, -0.21087646484375, -0.1653594970703125, -0.119842529296875, -0.0743255615234375, -0.02880859375, 0.0167083740234375, 0.062225341796875, 0.1077423095703125, 0.15325927734375, 0.1987762451171875, 0.244293212890625, 0.2898101806640625, 0.3353271484375, 0.3808441162109375, 0.426361083984375, 0.4718780517578125, 0.51739501953125, 0.5629119873046875, 0.608428955078125, 0.6539459228515625, 0.699462890625, 0.7449798583984375, 0.790496826171875, 0.8360137939453125, 0.88153076171875, 0.9270477294921875, 0.972564697265625, 1.0180816650390625, 1.0635986328125, 1.1091156005859375, 1.154632568359375, 1.2001495361328125, 1.24566650390625, 1.2911834716796875, 1.336700439453125, 1.3822174072265625, 1.427734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 23.0, 44.0, 108.0, 204.0, 271.0, 169.0, 77.0, 50.0, 23.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.294349670410156, -23.412368774414062, -22.53038787841797, -21.648405075073242, -20.76642417907715, -19.884443283081055, -19.00246238708496, -18.120479583740234, -17.23849868774414, -16.356517791748047, -15.474535942077637, -14.592555046081543, -13.710573196411133, -12.828592300415039, -11.946611404418945, -11.064629554748535, -10.182648658752441, -9.300667762756348, -8.418685913085938, -7.536705017089844, -6.654723167419434, -5.77274227142334, -4.890760898590088, -4.008779525756836, -3.126798152923584, -2.244816780090332, -1.3628355264663696, -0.4808542728424072, 0.4011270999908447, 1.2831082344055176, 2.1650896072387695, 3.0470709800720215, 3.9290523529052734, 4.811033725738525, 5.693015098571777, 6.574995994567871, 7.456977844238281, 8.338958740234375, 9.220939636230469, 10.102921485900879, 10.984903335571289, 11.866884231567383, 12.748866081237793, 13.630846977233887, 14.512828826904297, 15.39480972290039, 16.276790618896484, 17.158771514892578, 18.040752410888672, 18.922733306884766, 19.80471420288086, 20.686697006225586, 21.56867790222168, 22.450658798217773, 23.332639694213867, 24.214622497558594, 25.096603393554688, 25.97858428955078, 26.860565185546875, 27.7425479888916, 28.624528884887695, 29.50650978088379, 30.388490676879883, 31.27047348022461, 32.1524543762207]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 4.0, 6.0, 9.0, 13.0, 17.0, 24.0, 18.0, 21.0, 21.0, 55.0, 45.0, 45.0, 55.0, 60.0, 69.0, 62.0, 60.0, 63.0, 50.0, 36.0, 47.0, 30.0, 44.0, 28.0, 32.0, 17.0, 13.0, 17.0, 12.0, 10.0, 8.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.903369903564453, -21.318344116210938, -20.733318328857422, -20.148292541503906, -19.563264846801758, -18.978239059448242, -18.393213272094727, -17.80818748474121, -17.223161697387695, -16.63813591003418, -16.053110122680664, -15.468083381652832, -14.883057594299316, -14.298030853271484, -13.713005065917969, -13.127979278564453, -12.542952537536621, -11.957926750183105, -11.372900009155273, -10.787874221801758, -10.202848434448242, -9.617822647094727, -9.032795906066895, -8.447770118713379, -7.862743854522705, -7.277717590332031, -6.692691802978516, -6.107665538787842, -5.522639274597168, -4.937613487243652, -4.3525872230529785, -3.767561435699463, -3.182535171508789, -2.5975091457366943, -2.0124831199645996, -1.4274568557739258, -0.842430830001831, -0.25740480422973633, 0.3276214599609375, 0.9126472473144531, 1.497673511505127, 2.0826995372772217, 2.6677255630493164, 3.2527518272399902, 3.837777853012085, 4.42280387878418, 5.0078301429748535, 5.592855930328369, 6.177882194519043, 6.762908458709717, 7.347934246063232, 7.932960510253906, 8.517986297607422, 9.103012084960938, 9.68803882598877, 10.273064613342285, 10.858091354370117, 11.443117141723633, 12.028143882751465, 12.61316967010498, 13.198195457458496, 13.783222198486328, 14.368247985839844, 14.95327377319336, 15.538299560546875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 11.0, 10.0, 17.0, 15.0, 26.0, 47.0, 66.0, 95.0, 153.0, 257.0, 665.0, 5884.0, 3358418.0, 823589.0, 3943.0, 470.0, 195.0, 151.0, 72.0, 64.0, 46.0, 24.0, 20.0, 10.0, 11.0, 4.0, 8.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9375, -5.75714111328125, -5.5767822265625, -5.39642333984375, -5.216064453125, -5.03570556640625, -4.8553466796875, -4.67498779296875, -4.49462890625, -4.31427001953125, -4.1339111328125, -3.95355224609375, -3.773193359375, -3.59283447265625, -3.4124755859375, -3.23211669921875, -3.0517578125, -2.87139892578125, -2.6910400390625, -2.51068115234375, -2.330322265625, -2.14996337890625, -1.9696044921875, -1.78924560546875, -1.60888671875, -1.42852783203125, -1.2481689453125, -1.06781005859375, -0.887451171875, -0.70709228515625, -0.5267333984375, -0.34637451171875, -0.166015625, 0.01434326171875, 0.1947021484375, 0.37506103515625, 0.555419921875, 0.73577880859375, 0.9161376953125, 1.09649658203125, 1.27685546875, 1.45721435546875, 1.6375732421875, 1.81793212890625, 1.998291015625, 2.17864990234375, 2.3590087890625, 2.53936767578125, 2.7197265625, 2.90008544921875, 3.0804443359375, 3.26080322265625, 3.441162109375, 3.62152099609375, 3.8018798828125, 3.98223876953125, 4.16259765625, 4.34295654296875, 4.5233154296875, 4.70367431640625, 4.884033203125, 5.06439208984375, 5.2447509765625, 5.42510986328125, 5.60546875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 24.0, 25.0, 51.0, 76.0, 104.0, 88.0, 104.0, 93.0, 120.0, 85.0, 71.0, 46.0, 41.0, 31.0, 13.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.1842498779296875, -2.128265380859375, -2.0722808837890625, -2.01629638671875, -1.9603118896484375, -1.904327392578125, -1.8483428955078125, -1.7923583984375, -1.7363739013671875, -1.680389404296875, -1.6244049072265625, -1.56842041015625, -1.5124359130859375, -1.456451416015625, -1.4004669189453125, -1.344482421875, -1.2884979248046875, -1.232513427734375, -1.1765289306640625, -1.12054443359375, -1.0645599365234375, -1.008575439453125, -0.9525909423828125, -0.8966064453125, -0.8406219482421875, -0.784637451171875, -0.7286529541015625, -0.67266845703125, -0.6166839599609375, -0.560699462890625, -0.5047149658203125, -0.44873046875, -0.3927459716796875, -0.336761474609375, -0.2807769775390625, -0.22479248046875, -0.1688079833984375, -0.112823486328125, -0.0568389892578125, -0.0008544921875, 0.0551300048828125, 0.111114501953125, 0.1670989990234375, 0.22308349609375, 0.2790679931640625, 0.335052490234375, 0.3910369873046875, 0.447021484375, 0.5030059814453125, 0.558990478515625, 0.6149749755859375, 0.67095947265625, 0.7269439697265625, 0.782928466796875, 0.8389129638671875, 0.8948974609375, 0.9508819580078125, 1.006866455078125, 1.0628509521484375, 1.11883544921875, 1.1748199462890625, 1.230804443359375, 1.2867889404296875, 1.3427734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 3.0, 13.0, 25.0, 39.0, 86.0, 165.0, 339.0, 683.0, 1552.0, 3630.0, 10652.0, 40201.0, 283158.0, 2746249.0, 980118.0, 93157.0, 20793.0, 7069.0, 3082.0, 1495.0, 785.0, 428.0, 238.0, 153.0, 57.0, 35.0, 26.0, 14.0, 17.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.548828125, -1.504241943359375, -1.45965576171875, -1.415069580078125, -1.3704833984375, -1.325897216796875, -1.28131103515625, -1.236724853515625, -1.192138671875, -1.147552490234375, -1.10296630859375, -1.058380126953125, -1.0137939453125, -0.969207763671875, -0.92462158203125, -0.880035400390625, -0.83544921875, -0.790863037109375, -0.74627685546875, -0.701690673828125, -0.6571044921875, -0.612518310546875, -0.56793212890625, -0.523345947265625, -0.478759765625, -0.434173583984375, -0.38958740234375, -0.345001220703125, -0.3004150390625, -0.255828857421875, -0.21124267578125, -0.166656494140625, -0.1220703125, -0.077484130859375, -0.03289794921875, 0.011688232421875, 0.0562744140625, 0.100860595703125, 0.14544677734375, 0.190032958984375, 0.234619140625, 0.279205322265625, 0.32379150390625, 0.368377685546875, 0.4129638671875, 0.457550048828125, 0.50213623046875, 0.546722412109375, 0.59130859375, 0.635894775390625, 0.68048095703125, 0.725067138671875, 0.7696533203125, 0.814239501953125, 0.85882568359375, 0.903411865234375, 0.947998046875, 0.992584228515625, 1.03717041015625, 1.081756591796875, 1.1263427734375, 1.170928955078125, 1.21551513671875, 1.260101318359375, 1.3046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 6.0, 11.0, 23.0, 31.0, 38.0, 62.0, 98.0, 177.0, 263.0, 450.0, 624.0, 723.0, 561.0, 380.0, 220.0, 148.0, 90.0, 44.0, 21.0, 22.0, 21.0, 10.0, 7.0, 7.0, 4.0, 9.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.3740234375, -1.321685791015625, -1.26934814453125, -1.217010498046875, -1.1646728515625, -1.112335205078125, -1.05999755859375, -1.007659912109375, -0.955322265625, -0.902984619140625, -0.85064697265625, -0.798309326171875, -0.7459716796875, -0.693634033203125, -0.64129638671875, -0.588958740234375, -0.53662109375, -0.484283447265625, -0.43194580078125, -0.379608154296875, -0.3272705078125, -0.274932861328125, -0.22259521484375, -0.170257568359375, -0.117919921875, -0.065582275390625, -0.01324462890625, 0.039093017578125, 0.0914306640625, 0.143768310546875, 0.19610595703125, 0.248443603515625, 0.30078125, 0.353118896484375, 0.40545654296875, 0.457794189453125, 0.5101318359375, 0.562469482421875, 0.61480712890625, 0.667144775390625, 0.719482421875, 0.771820068359375, 0.82415771484375, 0.876495361328125, 0.9288330078125, 0.981170654296875, 1.03350830078125, 1.085845947265625, 1.13818359375, 1.190521240234375, 1.24285888671875, 1.295196533203125, 1.3475341796875, 1.399871826171875, 1.45220947265625, 1.504547119140625, 1.556884765625, 1.609222412109375, 1.66156005859375, 1.713897705078125, 1.7662353515625, 1.818572998046875, 1.87091064453125, 1.923248291015625, 1.9755859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 7.0, 13.0, 12.0, 69.0, 196.0, 334.0, 250.0, 84.0, 17.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.227092742919922, -19.37476348876953, -18.52243423461914, -17.67010498046875, -16.81777572631836, -15.965447425842285, -15.113118171691895, -14.26078987121582, -13.40846061706543, -12.556131362915039, -11.703802108764648, -10.851472854614258, -9.999144554138184, -9.146815299987793, -8.294486045837402, -7.44215726852417, -6.589827537536621, -5.7374982833862305, -4.885169506072998, -4.032840251922607, -3.180511236190796, -2.3281822204589844, -1.4758529663085938, -0.6235241889953613, 0.2288050651550293, 1.0811340808868408, 1.933463215827942, 2.785792350769043, 3.6381213665008545, 4.490450382232666, 5.342779636383057, 6.195108413696289, 7.04743766784668, 7.89976692199707, 8.752096176147461, 9.604425430297852, 10.456753730773926, 11.309082984924316, 12.161412239074707, 13.013740539550781, 13.866069793701172, 14.718399047851562, 15.570728302001953, 16.423057556152344, 17.275386810302734, 18.127716064453125, 18.980045318603516, 19.832372665405273, 20.684703826904297, 21.537033081054688, 22.389362335205078, 23.24169158935547, 24.09402084350586, 24.94635009765625, 25.79867935180664, 26.6510066986084, 27.50333595275879, 28.35566520690918, 29.20799446105957, 30.06032371520996, 30.91265296936035, 31.76498031616211, 32.6173095703125, 33.46963882446289, 34.32196807861328]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 4.0, 9.0, 11.0, 15.0, 15.0, 15.0, 34.0, 25.0, 27.0, 41.0, 43.0, 39.0, 61.0, 68.0, 52.0, 64.0, 55.0, 65.0, 58.0, 51.0, 49.0, 41.0, 31.0, 25.0, 16.0, 17.0, 8.0, 12.0, 7.0, 6.0, 2.0, 9.0, 2.0, 7.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.83814811706543, -9.524201393127441, -9.21025562286377, -8.896308898925781, -8.582362174987793, -8.268416404724121, -7.954469680786133, -7.640523433685303, -7.326577186584473, -7.012630939483643, -6.698684215545654, -6.384737968444824, -6.070791721343994, -5.756845474243164, -5.442898750305176, -5.128952503204346, -4.815005779266357, -4.501059532165527, -4.187112808227539, -3.873166561126709, -3.559220314025879, -3.2452738285064697, -2.9313273429870605, -2.6173810958862305, -2.3034346103668213, -1.9894882440567017, -1.675541877746582, -1.3615953922271729, -1.0476490259170532, -0.7337026596069336, -0.4197561740875244, -0.10580992698669434, 0.20813655853271484, 0.5220829248428345, 0.8360293507575989, 1.1499757766723633, 1.463922142982483, 1.7778685092926025, 2.0918149948120117, 2.405761241912842, 2.719707727432251, 3.03365421295166, 3.3476004600524902, 3.6615469455718994, 3.9754934310913086, 4.289439678192139, 4.603385925292969, 4.917332649230957, 5.231278896331787, 5.545225143432617, 5.8591718673706055, 6.1731181144714355, 6.487064361572266, 6.801011085510254, 7.114957332611084, 7.428903579711914, 7.742850303649902, 8.05679702758789, 8.370742797851562, 8.68468952178955, 8.998636245727539, 9.312582015991211, 9.6265287399292, 9.940475463867188, 10.25442123413086]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 20.0, 21.0, 28.0, 57.0, 83.0, 123.0, 196.0, 311.0, 584.0, 1013.0, 1812.0, 3544.0, 7524.0, 18272.0, 47809.0, 148651.0, 419944.0, 267618.0, 80221.0, 28388.0, 11654.0, 5076.0, 2501.0, 1322.0, 698.0, 444.0, 212.0, 144.0, 95.0, 59.0, 48.0, 21.0, 19.0, 11.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.185546875, -1.1428070068359375, -1.100067138671875, -1.0573272705078125, -1.01458740234375, -0.9718475341796875, -0.929107666015625, -0.8863677978515625, -0.8436279296875, -0.8008880615234375, -0.758148193359375, -0.7154083251953125, -0.67266845703125, -0.6299285888671875, -0.587188720703125, -0.5444488525390625, -0.501708984375, -0.4589691162109375, -0.416229248046875, -0.3734893798828125, -0.33074951171875, -0.2880096435546875, -0.245269775390625, -0.2025299072265625, -0.1597900390625, -0.1170501708984375, -0.074310302734375, -0.0315704345703125, 0.01116943359375, 0.0539093017578125, 0.096649169921875, 0.1393890380859375, 0.18212890625, 0.2248687744140625, 0.267608642578125, 0.3103485107421875, 0.35308837890625, 0.3958282470703125, 0.438568115234375, 0.4813079833984375, 0.5240478515625, 0.5667877197265625, 0.609527587890625, 0.6522674560546875, 0.69500732421875, 0.7377471923828125, 0.780487060546875, 0.8232269287109375, 0.865966796875, 0.9087066650390625, 0.951446533203125, 0.9941864013671875, 1.03692626953125, 1.0796661376953125, 1.122406005859375, 1.1651458740234375, 1.2078857421875, 1.2506256103515625, 1.293365478515625, 1.3361053466796875, 1.37884521484375, 1.4215850830078125, 1.464324951171875, 1.5070648193359375, 1.5498046875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 12.0, 17.0, 15.0, 16.0, 28.0, 33.0, 30.0, 40.0, 70.0, 47.0, 74.0, 51.0, 84.0, 52.0, 60.0, 64.0, 59.0, 43.0, 49.0, 38.0, 31.0, 22.0, 18.0, 13.0, 17.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.4638671875, -1.4288406372070312, -1.3938140869140625, -1.3587875366210938, -1.323760986328125, -1.2887344360351562, -1.2537078857421875, -1.2186813354492188, -1.18365478515625, -1.1486282348632812, -1.1136016845703125, -1.0785751342773438, -1.043548583984375, -1.0085220336914062, -0.9734954833984375, -0.9384689331054688, -0.9034423828125, -0.8684158325195312, -0.8333892822265625, -0.7983627319335938, -0.763336181640625, -0.7283096313476562, -0.6932830810546875, -0.6582565307617188, -0.62322998046875, -0.5882034301757812, -0.5531768798828125, -0.5181503295898438, -0.483123779296875, -0.44809722900390625, -0.4130706787109375, -0.37804412841796875, -0.343017578125, -0.30799102783203125, -0.2729644775390625, -0.23793792724609375, -0.202911376953125, -0.16788482666015625, -0.1328582763671875, -0.09783172607421875, -0.06280517578125, -0.02777862548828125, 0.0072479248046875, 0.04227447509765625, 0.077301025390625, 0.11232757568359375, 0.1473541259765625, 0.18238067626953125, 0.2174072265625, 0.25243377685546875, 0.2874603271484375, 0.32248687744140625, 0.357513427734375, 0.39253997802734375, 0.4275665283203125, 0.46259307861328125, 0.49761962890625, 0.5326461791992188, 0.5676727294921875, 0.6026992797851562, 0.637725830078125, 0.6727523803710938, 0.7077789306640625, 0.7428054809570312, 0.77783203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 5.0, 13.0, 14.0, 29.0, 36.0, 75.0, 168.0, 321.0, 855.0, 2867.0, 16658.0, 289174.0, 701762.0, 30620.0, 3983.0, 1089.0, 409.0, 211.0, 109.0, 60.0, 37.0, 13.0, 10.0, 9.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.767578125, -3.64654541015625, -3.5255126953125, -3.40447998046875, -3.283447265625, -3.16241455078125, -3.0413818359375, -2.92034912109375, -2.79931640625, -2.67828369140625, -2.5572509765625, -2.43621826171875, -2.315185546875, -2.19415283203125, -2.0731201171875, -1.95208740234375, -1.8310546875, -1.71002197265625, -1.5889892578125, -1.46795654296875, -1.346923828125, -1.22589111328125, -1.1048583984375, -0.98382568359375, -0.86279296875, -0.74176025390625, -0.6207275390625, -0.49969482421875, -0.378662109375, -0.25762939453125, -0.1365966796875, -0.01556396484375, 0.10546875, 0.22650146484375, 0.3475341796875, 0.46856689453125, 0.589599609375, 0.71063232421875, 0.8316650390625, 0.95269775390625, 1.07373046875, 1.19476318359375, 1.3157958984375, 1.43682861328125, 1.557861328125, 1.67889404296875, 1.7999267578125, 1.92095947265625, 2.0419921875, 2.16302490234375, 2.2840576171875, 2.40509033203125, 2.526123046875, 2.64715576171875, 2.7681884765625, 2.88922119140625, 3.01025390625, 3.13128662109375, 3.2523193359375, 3.37335205078125, 3.494384765625, 3.61541748046875, 3.7364501953125, 3.85748291015625, 3.978515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 6.0, 8.0, 11.0, 12.0, 18.0, 23.0, 28.0, 23.0, 24.0, 30.0, 40.0, 40.0, 36.0, 34.0, 52.0, 51.0, 58.0, 49.0, 57.0, 49.0, 43.0, 38.0, 36.0, 33.0, 28.0, 28.0, 26.0, 25.0, 18.0, 20.0, 7.0, 10.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.310546875, -3.21258544921875, -3.1146240234375, -3.01666259765625, -2.918701171875, -2.82073974609375, -2.7227783203125, -2.62481689453125, -2.52685546875, -2.42889404296875, -2.3309326171875, -2.23297119140625, -2.135009765625, -2.03704833984375, -1.9390869140625, -1.84112548828125, -1.7431640625, -1.64520263671875, -1.5472412109375, -1.44927978515625, -1.351318359375, -1.25335693359375, -1.1553955078125, -1.05743408203125, -0.95947265625, -0.86151123046875, -0.7635498046875, -0.66558837890625, -0.567626953125, -0.46966552734375, -0.3717041015625, -0.27374267578125, -0.17578125, -0.07781982421875, 0.0201416015625, 0.11810302734375, 0.216064453125, 0.31402587890625, 0.4119873046875, 0.50994873046875, 0.60791015625, 0.70587158203125, 0.8038330078125, 0.90179443359375, 0.999755859375, 1.09771728515625, 1.1956787109375, 1.29364013671875, 1.3916015625, 1.48956298828125, 1.5875244140625, 1.68548583984375, 1.783447265625, 1.88140869140625, 1.9793701171875, 2.07733154296875, 2.17529296875, 2.27325439453125, 2.3712158203125, 2.46917724609375, 2.567138671875, 2.66510009765625, 2.7630615234375, 2.86102294921875, 2.958984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 15.0, 16.0, 19.0, 24.0, 61.0, 141.0, 327.0, 1058.0, 5047.0, 46027.0, 868950.0, 115541.0, 8896.0, 1573.0, 481.0, 171.0, 67.0, 42.0, 24.0, 21.0, 10.0, 4.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6728515625, -1.6144561767578125, -1.556060791015625, -1.4976654052734375, -1.43927001953125, -1.3808746337890625, -1.322479248046875, -1.2640838623046875, -1.2056884765625, -1.1472930908203125, -1.088897705078125, -1.0305023193359375, -0.97210693359375, -0.9137115478515625, -0.855316162109375, -0.7969207763671875, -0.738525390625, -0.6801300048828125, -0.621734619140625, -0.5633392333984375, -0.50494384765625, -0.4465484619140625, -0.388153076171875, -0.3297576904296875, -0.2713623046875, -0.2129669189453125, -0.154571533203125, -0.0961761474609375, -0.03778076171875, 0.0206146240234375, 0.079010009765625, 0.1374053955078125, 0.19580078125, 0.2541961669921875, 0.312591552734375, 0.3709869384765625, 0.42938232421875, 0.4877777099609375, 0.546173095703125, 0.6045684814453125, 0.6629638671875, 0.7213592529296875, 0.779754638671875, 0.8381500244140625, 0.89654541015625, 0.9549407958984375, 1.013336181640625, 1.0717315673828125, 1.130126953125, 1.1885223388671875, 1.246917724609375, 1.3053131103515625, 1.36370849609375, 1.4221038818359375, 1.480499267578125, 1.5388946533203125, 1.5972900390625, 1.6556854248046875, 1.714080810546875, 1.7724761962890625, 1.83087158203125, 1.8892669677734375, 1.947662353515625, 2.0060577392578125, 2.064453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 8.0, 10.0, 13.0, 11.0, 10.0, 25.0, 32.0, 32.0, 39.0, 56.0, 80.0, 122.0, 150.0, 101.0, 69.0, 59.0, 32.0, 39.0, 18.0, 18.0, 17.0, 13.0, 7.0, 6.0, 12.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020575523376464844, -0.00019957497715950012, -0.0001933947205543518, -0.0001872144639492035, -0.00018103420734405518, -0.00017485395073890686, -0.00016867369413375854, -0.00016249343752861023, -0.00015631318092346191, -0.0001501329243183136, -0.00014395266771316528, -0.00013777241110801697, -0.00013159215450286865, -0.00012541189789772034, -0.00011923164129257202, -0.0001130513846874237, -0.00010687112808227539, -0.00010069087147712708, -9.451061487197876e-05, -8.833035826683044e-05, -8.215010166168213e-05, -7.596984505653381e-05, -6.97895884513855e-05, -6.360933184623718e-05, -5.742907524108887e-05, -5.124881863594055e-05, -4.5068562030792236e-05, -3.888830542564392e-05, -3.2708048820495605e-05, -2.652779221534729e-05, -2.0347535610198975e-05, -1.416727900505066e-05, -7.987022399902344e-06, -1.8067657947540283e-06, 4.373490810394287e-06, 1.0553747415542603e-05, 1.6734004020690918e-05, 2.2914260625839233e-05, 2.909451723098755e-05, 3.5274773836135864e-05, 4.145503044128418e-05, 4.7635287046432495e-05, 5.381554365158081e-05, 5.9995800256729126e-05, 6.617605686187744e-05, 7.235631346702576e-05, 7.853657007217407e-05, 8.471682667732239e-05, 9.08970832824707e-05, 9.707733988761902e-05, 0.00010325759649276733, 0.00010943785309791565, 0.00011561810970306396, 0.00012179836630821228, 0.0001279786229133606, 0.0001341588795185089, 0.00014033913612365723, 0.00014651939272880554, 0.00015269964933395386, 0.00015887990593910217, 0.0001650601625442505, 0.0001712404191493988, 0.00017742067575454712, 0.00018360093235969543, 0.00018978118896484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 15.0, 19.0, 29.0, 60.0, 76.0, 158.0, 259.0, 456.0, 1124.0, 2649.0, 8192.0, 33662.0, 291614.0, 632155.0, 59470.0, 12132.0, 3720.0, 1347.0, 590.0, 328.0, 176.0, 113.0, 68.0, 40.0, 18.0, 24.0, 13.0, 6.0, 5.0, 3.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87744140625, -0.8438949584960938, -0.8103485107421875, -0.7768020629882812, -0.743255615234375, -0.7097091674804688, -0.6761627197265625, -0.6426162719726562, -0.60906982421875, -0.5755233764648438, -0.5419769287109375, -0.5084304809570312, -0.474884033203125, -0.44133758544921875, -0.4077911376953125, -0.37424468994140625, -0.3406982421875, -0.30715179443359375, -0.2736053466796875, -0.24005889892578125, -0.206512451171875, -0.17296600341796875, -0.1394195556640625, -0.10587310791015625, -0.07232666015625, -0.03878021240234375, -0.0052337646484375, 0.02831268310546875, 0.061859130859375, 0.09540557861328125, 0.1289520263671875, 0.16249847412109375, 0.196044921875, 0.22959136962890625, 0.2631378173828125, 0.29668426513671875, 0.330230712890625, 0.36377716064453125, 0.3973236083984375, 0.43087005615234375, 0.46441650390625, 0.49796295166015625, 0.5315093994140625, 0.5650558471679688, 0.598602294921875, 0.6321487426757812, 0.6656951904296875, 0.6992416381835938, 0.7327880859375, 0.7663345336914062, 0.7998809814453125, 0.8334274291992188, 0.866973876953125, 0.9005203247070312, 0.9340667724609375, 0.9676132202148438, 1.00115966796875, 1.0347061157226562, 1.0682525634765625, 1.1017990112304688, 1.135345458984375, 1.1688919067382812, 1.2024383544921875, 1.2359848022460938, 1.26953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 3.0, 8.0, 13.0, 9.0, 15.0, 18.0, 30.0, 37.0, 51.0, 82.0, 110.0, 113.0, 120.0, 111.0, 71.0, 64.0, 40.0, 35.0, 22.0, 10.0, 8.0, 8.0, 5.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1015625, -1.066131591796875, -1.03070068359375, -0.995269775390625, -0.9598388671875, -0.924407958984375, -0.88897705078125, -0.853546142578125, -0.818115234375, -0.782684326171875, -0.74725341796875, -0.711822509765625, -0.6763916015625, -0.640960693359375, -0.60552978515625, -0.570098876953125, -0.53466796875, -0.499237060546875, -0.46380615234375, -0.428375244140625, -0.3929443359375, -0.357513427734375, -0.32208251953125, -0.286651611328125, -0.251220703125, -0.215789794921875, -0.18035888671875, -0.144927978515625, -0.1094970703125, -0.074066162109375, -0.03863525390625, -0.003204345703125, 0.0322265625, 0.067657470703125, 0.10308837890625, 0.138519287109375, 0.1739501953125, 0.209381103515625, 0.24481201171875, 0.280242919921875, 0.315673828125, 0.351104736328125, 0.38653564453125, 0.421966552734375, 0.4573974609375, 0.492828369140625, 0.52825927734375, 0.563690185546875, 0.59912109375, 0.634552001953125, 0.66998291015625, 0.705413818359375, 0.7408447265625, 0.776275634765625, 0.81170654296875, 0.847137451171875, 0.882568359375, 0.917999267578125, 0.95343017578125, 0.988861083984375, 1.0242919921875, 1.059722900390625, 1.09515380859375, 1.130584716796875, 1.166015625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 11.0, 22.0, 59.0, 127.0, 232.0, 240.0, 148.0, 75.0, 29.0, 23.0, 13.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.455961227416992, -20.742238998413086, -20.02851676940918, -19.314794540405273, -18.60107421875, -17.887351989746094, -17.173629760742188, -16.45990753173828, -15.746185302734375, -15.032463073730469, -14.318740844726562, -13.605019569396973, -12.891297340393066, -12.17757511138916, -11.46385383605957, -10.750131607055664, -10.036409378051758, -9.322687149047852, -8.608964920043945, -7.8952436447143555, -7.181521415710449, -6.467799186706543, -5.754077434539795, -5.040355682373047, -4.326633453369141, -3.6129114627838135, -2.8991894721984863, -2.185467481613159, -1.471745491027832, -0.7580235004425049, -0.044301509857177734, 0.6694202423095703, 1.3831405639648438, 2.096862554550171, 2.810584545135498, 3.524306535720825, 4.238028526306152, 4.951750755310059, 5.665472507476807, 6.379194259643555, 7.092916488647461, 7.806638717651367, 8.520360946655273, 9.234082221984863, 9.94780445098877, 10.661526679992676, 11.375247955322266, 12.088970184326172, 12.802692413330078, 13.516414642333984, 14.23013687133789, 14.94385814666748, 15.657580375671387, 16.371301651000977, 17.085023880004883, 17.79874610900879, 18.512468338012695, 19.2261905670166, 19.939912796020508, 20.653635025024414, 21.367355346679688, 22.081077575683594, 22.7947998046875, 23.508522033691406, 24.222244262695312]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 10.0, 6.0, 13.0, 25.0, 26.0, 29.0, 33.0, 37.0, 40.0, 43.0, 66.0, 46.0, 76.0, 70.0, 64.0, 60.0, 51.0, 56.0, 39.0, 35.0, 36.0, 28.0, 25.0, 18.0, 10.0, 16.0, 6.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.629232406616211, -13.146507263183594, -12.66378116607666, -12.181056022644043, -11.69832992553711, -11.215604782104492, -10.732879638671875, -10.250153541564941, -9.767427444458008, -9.28470230102539, -8.801976203918457, -8.31925106048584, -7.836524963378906, -7.353799819946289, -6.871074199676514, -6.388348579406738, -5.905623435974121, -5.422897815704346, -4.94017219543457, -4.457447052001953, -3.9747211933135986, -3.4919955730438232, -3.009270191192627, -2.5265445709228516, -2.043818950653076, -1.5610933303833008, -1.078367829322815, -0.5956423282623291, -0.11291670799255371, 0.3698089122772217, 0.852534294128418, 1.3352599143981934, 1.8179855346679688, 2.300711154937744, 2.7834367752075195, 3.266162157058716, 3.748887777328491, 4.2316131591796875, 4.714338779449463, 5.197064399719238, 5.679790019989014, 6.162515640258789, 6.6452412605285645, 7.12796688079834, 7.610692024230957, 8.09341812133789, 8.576143264770508, 9.058868408203125, 9.541594505310059, 10.024319648742676, 10.50704574584961, 10.989770889282227, 11.47249698638916, 11.955222129821777, 12.437948226928711, 12.920673370361328, 13.403398513793945, 13.886123657226562, 14.368849754333496, 14.851574897766113, 15.334300994873047, 15.817026138305664, 16.29975128173828, 16.78247833251953, 17.26520347595215]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 5.0, 13.0, 11.0, 28.0, 32.0, 58.0, 83.0, 131.0, 230.0, 371.0, 701.0, 1360.0, 2886.0, 6960.0, 18547.0, 60222.0, 259549.0, 1296833.0, 1907211.0, 488573.0, 103688.0, 28854.0, 10054.0, 3998.0, 1850.0, 875.0, 463.0, 254.0, 157.0, 100.0, 64.0, 38.0, 27.0, 11.0, 10.0, 10.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.013671875, -0.9871292114257812, -0.9605865478515625, -0.9340438842773438, -0.907501220703125, -0.8809585571289062, -0.8544158935546875, -0.8278732299804688, -0.80133056640625, -0.7747879028320312, -0.7482452392578125, -0.7217025756835938, -0.695159912109375, -0.6686172485351562, -0.6420745849609375, -0.6155319213867188, -0.5889892578125, -0.5624465942382812, -0.5359039306640625, -0.5093612670898438, -0.482818603515625, -0.45627593994140625, -0.4297332763671875, -0.40319061279296875, -0.37664794921875, -0.35010528564453125, -0.3235626220703125, -0.29701995849609375, -0.270477294921875, -0.24393463134765625, -0.2173919677734375, -0.19084930419921875, -0.164306640625, -0.13776397705078125, -0.1112213134765625, -0.08467864990234375, -0.058135986328125, -0.03159332275390625, -0.0050506591796875, 0.02149200439453125, 0.04803466796875, 0.07457733154296875, 0.1011199951171875, 0.12766265869140625, 0.154205322265625, 0.18074798583984375, 0.2072906494140625, 0.23383331298828125, 0.2603759765625, 0.28691864013671875, 0.3134613037109375, 0.34000396728515625, 0.366546630859375, 0.39308929443359375, 0.4196319580078125, 0.44617462158203125, 0.47271728515625, 0.49925994873046875, 0.5258026123046875, 0.5523452758789062, 0.578887939453125, 0.6054306030273438, 0.6319732666015625, 0.6585159301757812, 0.68505859375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 5.0, 9.0, 17.0, 18.0, 20.0, 21.0, 29.0, 35.0, 39.0, 46.0, 42.0, 55.0, 54.0, 50.0, 51.0, 62.0, 59.0, 56.0, 47.0, 58.0, 40.0, 37.0, 32.0, 25.0, 25.0, 17.0, 16.0, 7.0, 4.0, 3.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.96044921875, -0.93353271484375, -0.9066162109375, -0.87969970703125, -0.852783203125, -0.82586669921875, -0.7989501953125, -0.77203369140625, -0.7451171875, -0.71820068359375, -0.6912841796875, -0.66436767578125, -0.637451171875, -0.61053466796875, -0.5836181640625, -0.55670166015625, -0.52978515625, -0.50286865234375, -0.4759521484375, -0.44903564453125, -0.422119140625, -0.39520263671875, -0.3682861328125, -0.34136962890625, -0.314453125, -0.28753662109375, -0.2606201171875, -0.23370361328125, -0.206787109375, -0.17987060546875, -0.1529541015625, -0.12603759765625, -0.09912109375, -0.07220458984375, -0.0452880859375, -0.01837158203125, 0.008544921875, 0.03546142578125, 0.0623779296875, 0.08929443359375, 0.1162109375, 0.14312744140625, 0.1700439453125, 0.19696044921875, 0.223876953125, 0.25079345703125, 0.2777099609375, 0.30462646484375, 0.33154296875, 0.35845947265625, 0.3853759765625, 0.41229248046875, 0.439208984375, 0.46612548828125, 0.4930419921875, 0.51995849609375, 0.546875, 0.57379150390625, 0.6007080078125, 0.62762451171875, 0.654541015625, 0.68145751953125, 0.7083740234375, 0.73529052734375, 0.76220703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 7.0, 4.0, 6.0, 16.0, 21.0, 25.0, 42.0, 59.0, 83.0, 187.0, 400.0, 931.0, 2837.0, 10128.0, 51308.0, 451882.0, 3053525.0, 543012.0, 60722.0, 12738.0, 3747.0, 1378.0, 560.0, 274.0, 136.0, 90.0, 55.0, 34.0, 18.0, 15.0, 15.0, 10.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.5428619384765625, -1.493927001953125, -1.4449920654296875, -1.39605712890625, -1.3471221923828125, -1.298187255859375, -1.2492523193359375, -1.2003173828125, -1.1513824462890625, -1.102447509765625, -1.0535125732421875, -1.00457763671875, -0.9556427001953125, -0.906707763671875, -0.8577728271484375, -0.808837890625, -0.7599029541015625, -0.710968017578125, -0.6620330810546875, -0.61309814453125, -0.5641632080078125, -0.515228271484375, -0.4662933349609375, -0.4173583984375, -0.3684234619140625, -0.319488525390625, -0.2705535888671875, -0.22161865234375, -0.1726837158203125, -0.123748779296875, -0.0748138427734375, -0.02587890625, 0.0230560302734375, 0.071990966796875, 0.1209259033203125, 0.16986083984375, 0.2187957763671875, 0.267730712890625, 0.3166656494140625, 0.3656005859375, 0.4145355224609375, 0.463470458984375, 0.5124053955078125, 0.56134033203125, 0.6102752685546875, 0.659210205078125, 0.7081451416015625, 0.757080078125, 0.8060150146484375, 0.854949951171875, 0.9038848876953125, 0.95281982421875, 1.0017547607421875, 1.050689697265625, 1.0996246337890625, 1.1485595703125, 1.1974945068359375, 1.246429443359375, 1.2953643798828125, 1.34429931640625, 1.3932342529296875, 1.442169189453125, 1.4911041259765625, 1.5400390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 7.0, 5.0, 5.0, 8.0, 17.0, 17.0, 24.0, 24.0, 38.0, 50.0, 79.0, 115.0, 208.0, 324.0, 450.0, 565.0, 573.0, 479.0, 320.0, 240.0, 149.0, 118.0, 75.0, 50.0, 35.0, 23.0, 23.0, 10.0, 13.0, 6.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.462890625, -1.410888671875, -1.35888671875, -1.306884765625, -1.2548828125, -1.202880859375, -1.15087890625, -1.098876953125, -1.046875, -0.994873046875, -0.94287109375, -0.890869140625, -0.8388671875, -0.786865234375, -0.73486328125, -0.682861328125, -0.630859375, -0.578857421875, -0.52685546875, -0.474853515625, -0.4228515625, -0.370849609375, -0.31884765625, -0.266845703125, -0.21484375, -0.162841796875, -0.11083984375, -0.058837890625, -0.0068359375, 0.045166015625, 0.09716796875, 0.149169921875, 0.201171875, 0.253173828125, 0.30517578125, 0.357177734375, 0.4091796875, 0.461181640625, 0.51318359375, 0.565185546875, 0.6171875, 0.669189453125, 0.72119140625, 0.773193359375, 0.8251953125, 0.877197265625, 0.92919921875, 0.981201171875, 1.033203125, 1.085205078125, 1.13720703125, 1.189208984375, 1.2412109375, 1.293212890625, 1.34521484375, 1.397216796875, 1.44921875, 1.501220703125, 1.55322265625, 1.605224609375, 1.6572265625, 1.709228515625, 1.76123046875, 1.813232421875, 1.865234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 12.0, 23.0, 69.0, 209.0, 298.0, 220.0, 83.0, 39.0, 15.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.281211853027344, -31.395849227905273, -30.51048469543457, -29.6251220703125, -28.739757537841797, -27.854394912719727, -26.969032287597656, -26.083667755126953, -25.198305130004883, -24.312942504882812, -23.42757797241211, -22.54221534729004, -21.65685272216797, -20.771488189697266, -19.886125564575195, -19.000762939453125, -18.115398406982422, -17.23003578186035, -16.34467124938965, -15.459308624267578, -14.573945045471191, -13.688581466674805, -12.803218841552734, -11.917855262756348, -11.032491683959961, -10.147128105163574, -9.261764526367188, -8.376401901245117, -7.4910383224487305, -6.605674743652344, -5.720311641693115, -4.834948539733887, -3.9495849609375, -3.0642216205596924, -2.1788582801818848, -1.2934949398040771, -0.40813159942626953, 0.4772319793701172, 1.3625950813293457, 2.247958183288574, 3.133321762084961, 4.018685340881348, 4.904048442840576, 5.789411544799805, 6.674775123596191, 7.560138702392578, 8.445501327514648, 9.330864906311035, 10.216228485107422, 11.101592063903809, 11.986955642700195, 12.872318267822266, 13.757681846618652, 14.643045425415039, 15.52840805053711, 16.413772583007812, 17.299135208129883, 18.184497833251953, 19.069862365722656, 19.955224990844727, 20.840587615966797, 21.7259521484375, 22.61131477355957, 23.49667739868164, 24.382041931152344]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 8.0, 8.0, 9.0, 16.0, 7.0, 23.0, 19.0, 23.0, 30.0, 33.0, 34.0, 35.0, 50.0, 42.0, 42.0, 56.0, 60.0, 50.0, 46.0, 53.0, 53.0, 53.0, 44.0, 35.0, 35.0, 27.0, 18.0, 16.0, 13.0, 15.0, 9.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.833175659179688, -8.531219482421875, -8.229263305664062, -7.927306652069092, -7.625350475311279, -7.323394298553467, -7.021437644958496, -6.719481468200684, -6.417525291442871, -6.115569114685059, -5.813612937927246, -5.511656284332275, -5.209700107574463, -4.90774393081665, -4.60578727722168, -4.303831100463867, -4.001874923706055, -3.699918746948242, -3.3979623317718506, -3.096005916595459, -2.7940497398376465, -2.492093563079834, -2.1901371479034424, -1.8881807327270508, -1.5862245559692383, -1.2842682600021362, -0.9823119640350342, -0.6803556680679321, -0.3783993721008301, -0.07644307613372803, 0.22551321983337402, 0.5274696350097656, 0.8294258117675781, 1.1313821077346802, 1.4333384037017822, 1.7352946996688843, 2.0372509956359863, 2.339207172393799, 2.6411635875701904, 2.943120002746582, 3.2450761795043945, 3.547032356262207, 3.8489887714385986, 4.15094518661499, 4.452901363372803, 4.754857540130615, 5.056814193725586, 5.358770370483398, 5.660726547241211, 5.962682723999023, 6.264638900756836, 6.566595554351807, 6.868551731109619, 7.170507907867432, 7.472464561462402, 7.774420738220215, 8.076376914978027, 8.37833309173584, 8.680289268493652, 8.982245445251465, 9.284202575683594, 9.586158752441406, 9.888114929199219, 10.190071105957031, 10.492027282714844]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 0.0, 10.0, 25.0, 27.0, 33.0, 44.0, 68.0, 136.0, 233.0, 341.0, 658.0, 1265.0, 2522.0, 5386.0, 12528.0, 29819.0, 75083.0, 194226.0, 362971.0, 219210.0, 84617.0, 33675.0, 13829.0, 5993.0, 2766.0, 1364.0, 705.0, 392.0, 237.0, 127.0, 85.0, 59.0, 33.0, 20.0, 23.0, 9.0, 7.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.359375, -1.3211517333984375, -1.282928466796875, -1.2447052001953125, -1.20648193359375, -1.1682586669921875, -1.130035400390625, -1.0918121337890625, -1.0535888671875, -1.0153656005859375, -0.977142333984375, -0.9389190673828125, -0.90069580078125, -0.8624725341796875, -0.824249267578125, -0.7860260009765625, -0.747802734375, -0.7095794677734375, -0.671356201171875, -0.6331329345703125, -0.59490966796875, -0.5566864013671875, -0.518463134765625, -0.4802398681640625, -0.4420166015625, -0.4037933349609375, -0.365570068359375, -0.3273468017578125, -0.28912353515625, -0.2509002685546875, -0.212677001953125, -0.1744537353515625, -0.13623046875, -0.0980072021484375, -0.059783935546875, -0.0215606689453125, 0.01666259765625, 0.0548858642578125, 0.093109130859375, 0.1313323974609375, 0.1695556640625, 0.2077789306640625, 0.246002197265625, 0.2842254638671875, 0.32244873046875, 0.3606719970703125, 0.398895263671875, 0.4371185302734375, 0.475341796875, 0.5135650634765625, 0.551788330078125, 0.5900115966796875, 0.62823486328125, 0.6664581298828125, 0.704681396484375, 0.7429046630859375, 0.7811279296875, 0.8193511962890625, 0.857574462890625, 0.8957977294921875, 0.93402099609375, 0.9722442626953125, 1.010467529296875, 1.0486907958984375, 1.0869140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 9.0, 14.0, 18.0, 20.0, 21.0, 27.0, 31.0, 44.0, 44.0, 53.0, 37.0, 53.0, 48.0, 62.0, 58.0, 54.0, 58.0, 59.0, 43.0, 41.0, 47.0, 27.0, 35.0, 17.0, 20.0, 15.0, 9.0, 9.0, 5.0, 2.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.9501953125, -0.9230270385742188, -0.8958587646484375, -0.8686904907226562, -0.841522216796875, -0.8143539428710938, -0.7871856689453125, -0.7600173950195312, -0.73284912109375, -0.7056808471679688, -0.6785125732421875, -0.6513442993164062, -0.624176025390625, -0.5970077514648438, -0.5698394775390625, -0.5426712036132812, -0.5155029296875, -0.48833465576171875, -0.4611663818359375, -0.43399810791015625, -0.406829833984375, -0.37966156005859375, -0.3524932861328125, -0.32532501220703125, -0.29815673828125, -0.27098846435546875, -0.2438201904296875, -0.21665191650390625, -0.189483642578125, -0.16231536865234375, -0.1351470947265625, -0.10797882080078125, -0.080810546875, -0.05364227294921875, -0.0264739990234375, 0.00069427490234375, 0.027862548828125, 0.05503082275390625, 0.0821990966796875, 0.10936737060546875, 0.13653564453125, 0.16370391845703125, 0.1908721923828125, 0.21804046630859375, 0.245208740234375, 0.27237701416015625, 0.2995452880859375, 0.32671356201171875, 0.3538818359375, 0.38105010986328125, 0.4082183837890625, 0.43538665771484375, 0.462554931640625, 0.48972320556640625, 0.5168914794921875, 0.5440597534179688, 0.57122802734375, 0.5983963012695312, 0.6255645751953125, 0.6527328491210938, 0.679901123046875, 0.7070693969726562, 0.7342376708984375, 0.7614059448242188, 0.78857421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 5.0, 13.0, 17.0, 14.0, 32.0, 27.0, 36.0, 53.0, 75.0, 117.0, 128.0, 218.0, 284.0, 444.0, 636.0, 1078.0, 1917.0, 3590.0, 8751.0, 31760.0, 187643.0, 666144.0, 110262.0, 21434.0, 6647.0, 2777.0, 1583.0, 954.0, 607.0, 402.0, 240.0, 192.0, 107.0, 91.0, 77.0, 50.0, 37.0, 27.0, 17.0, 11.0, 7.0, 11.0, 8.0, 5.0, 6.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.271484375, -2.203399658203125, -2.13531494140625, -2.067230224609375, -1.9991455078125, -1.931060791015625, -1.86297607421875, -1.794891357421875, -1.726806640625, -1.658721923828125, -1.59063720703125, -1.522552490234375, -1.4544677734375, -1.386383056640625, -1.31829833984375, -1.250213623046875, -1.18212890625, -1.114044189453125, -1.04595947265625, -0.977874755859375, -0.9097900390625, -0.841705322265625, -0.77362060546875, -0.705535888671875, -0.637451171875, -0.569366455078125, -0.50128173828125, -0.433197021484375, -0.3651123046875, -0.297027587890625, -0.22894287109375, -0.160858154296875, -0.0927734375, -0.024688720703125, 0.04339599609375, 0.111480712890625, 0.1795654296875, 0.247650146484375, 0.31573486328125, 0.383819580078125, 0.451904296875, 0.519989013671875, 0.58807373046875, 0.656158447265625, 0.7242431640625, 0.792327880859375, 0.86041259765625, 0.928497314453125, 0.99658203125, 1.064666748046875, 1.13275146484375, 1.200836181640625, 1.2689208984375, 1.337005615234375, 1.40509033203125, 1.473175048828125, 1.541259765625, 1.609344482421875, 1.67742919921875, 1.745513916015625, 1.8135986328125, 1.881683349609375, 1.94976806640625, 2.017852783203125, 2.0859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 7.0, 3.0, 5.0, 9.0, 7.0, 11.0, 7.0, 6.0, 18.0, 23.0, 18.0, 26.0, 28.0, 23.0, 35.0, 36.0, 27.0, 31.0, 34.0, 35.0, 41.0, 48.0, 57.0, 30.0, 33.0, 49.0, 36.0, 40.0, 36.0, 39.0, 29.0, 22.0, 13.0, 22.0, 16.0, 19.0, 16.0, 13.0, 7.0, 9.0, 13.0, 7.0, 5.0, 5.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.828125, -2.743011474609375, -2.65789794921875, -2.572784423828125, -2.4876708984375, -2.402557373046875, -2.31744384765625, -2.232330322265625, -2.147216796875, -2.062103271484375, -1.97698974609375, -1.891876220703125, -1.8067626953125, -1.721649169921875, -1.63653564453125, -1.551422119140625, -1.46630859375, -1.381195068359375, -1.29608154296875, -1.210968017578125, -1.1258544921875, -1.040740966796875, -0.95562744140625, -0.870513916015625, -0.785400390625, -0.700286865234375, -0.61517333984375, -0.530059814453125, -0.4449462890625, -0.359832763671875, -0.27471923828125, -0.189605712890625, -0.1044921875, -0.019378662109375, 0.06573486328125, 0.150848388671875, 0.2359619140625, 0.321075439453125, 0.40618896484375, 0.491302490234375, 0.576416015625, 0.661529541015625, 0.74664306640625, 0.831756591796875, 0.9168701171875, 1.001983642578125, 1.08709716796875, 1.172210693359375, 1.25732421875, 1.342437744140625, 1.42755126953125, 1.512664794921875, 1.5977783203125, 1.682891845703125, 1.76800537109375, 1.853118896484375, 1.938232421875, 2.023345947265625, 2.10845947265625, 2.193572998046875, 2.2786865234375, 2.363800048828125, 2.44891357421875, 2.534027099609375, 2.619140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 12.0, 15.0, 15.0, 11.0, 33.0, 42.0, 64.0, 113.0, 218.0, 356.0, 654.0, 1446.0, 3952.0, 14695.0, 78065.0, 705767.0, 200654.0, 30915.0, 7026.0, 2363.0, 981.0, 470.0, 248.0, 167.0, 74.0, 54.0, 40.0, 25.0, 16.0, 15.0, 11.0, 10.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908203125, -1.05413818359375, -1.0174560546875, -0.98077392578125, -0.944091796875, -0.90740966796875, -0.8707275390625, -0.83404541015625, -0.79736328125, -0.76068115234375, -0.7239990234375, -0.68731689453125, -0.650634765625, -0.61395263671875, -0.5772705078125, -0.54058837890625, -0.50390625, -0.46722412109375, -0.4305419921875, -0.39385986328125, -0.357177734375, -0.32049560546875, -0.2838134765625, -0.24713134765625, -0.21044921875, -0.17376708984375, -0.1370849609375, -0.10040283203125, -0.063720703125, -0.02703857421875, 0.0096435546875, 0.04632568359375, 0.0830078125, 0.11968994140625, 0.1563720703125, 0.19305419921875, 0.229736328125, 0.26641845703125, 0.3031005859375, 0.33978271484375, 0.37646484375, 0.41314697265625, 0.4498291015625, 0.48651123046875, 0.523193359375, 0.55987548828125, 0.5965576171875, 0.63323974609375, 0.669921875, 0.70660400390625, 0.7432861328125, 0.77996826171875, 0.816650390625, 0.85333251953125, 0.8900146484375, 0.92669677734375, 0.96337890625, 1.00006103515625, 1.0367431640625, 1.07342529296875, 1.110107421875, 1.14678955078125, 1.1834716796875, 1.22015380859375, 1.2568359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 3.0, 7.0, 7.0, 14.0, 17.0, 23.0, 31.0, 26.0, 43.0, 55.0, 101.0, 193.0, 142.0, 95.0, 51.0, 42.0, 33.0, 22.0, 18.0, 19.0, 10.0, 12.0, 4.0, 8.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00037741661071777344, -0.0003662519156932831, -0.0003550872206687927, -0.00034392252564430237, -0.000332757830619812, -0.00032159313559532166, -0.0003104284405708313, -0.00029926374554634094, -0.0002880990505218506, -0.00027693435549736023, -0.0002657696604728699, -0.0002546049654483795, -0.00024344027042388916, -0.0002322755753993988, -0.00022111088037490845, -0.0002099461853504181, -0.00019878149032592773, -0.00018761679530143738, -0.00017645210027694702, -0.00016528740525245667, -0.0001541227102279663, -0.00014295801520347595, -0.0001317933201789856, -0.00012062862515449524, -0.00010946393013000488, -9.829923510551453e-05, -8.713454008102417e-05, -7.596984505653381e-05, -6.480515003204346e-05, -5.36404550075531e-05, -4.2475759983062744e-05, -3.131106495857239e-05, -2.014636993408203e-05, -8.981674909591675e-06, 2.1830201148986816e-06, 1.3347715139389038e-05, 2.4512410163879395e-05, 3.567710518836975e-05, 4.684180021286011e-05, 5.8006495237350464e-05, 6.917119026184082e-05, 8.033588528633118e-05, 9.150058031082153e-05, 0.00010266527533531189, 0.00011382997035980225, 0.0001249946653842926, 0.00013615936040878296, 0.00014732405543327332, 0.00015848875045776367, 0.00016965344548225403, 0.00018081814050674438, 0.00019198283553123474, 0.0002031475305557251, 0.00021431222558021545, 0.0002254769206047058, 0.00023664161562919617, 0.0002478063106536865, 0.0002589710056781769, 0.00027013570070266724, 0.0002813003957271576, 0.00029246509075164795, 0.0003036297857761383, 0.00031479448080062866, 0.000325959175825119, 0.0003371238708496094]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 6.0, 7.0, 17.0, 25.0, 34.0, 41.0, 48.0, 73.0, 95.0, 187.0, 290.0, 491.0, 848.0, 1777.0, 4029.0, 11381.0, 42186.0, 293290.0, 609434.0, 60026.0, 14699.0, 4884.0, 2110.0, 1058.0, 548.0, 358.0, 191.0, 145.0, 79.0, 47.0, 40.0, 33.0, 29.0, 9.0, 10.0, 10.0, 8.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94580078125, -0.9109115600585938, -0.8760223388671875, -0.8411331176757812, -0.806243896484375, -0.7713546752929688, -0.7364654541015625, -0.7015762329101562, -0.66668701171875, -0.6317977905273438, -0.5969085693359375, -0.5620193481445312, -0.527130126953125, -0.49224090576171875, -0.4573516845703125, -0.42246246337890625, -0.3875732421875, -0.35268402099609375, -0.3177947998046875, -0.28290557861328125, -0.248016357421875, -0.21312713623046875, -0.1782379150390625, -0.14334869384765625, -0.10845947265625, -0.07357025146484375, -0.0386810302734375, -0.00379180908203125, 0.031097412109375, 0.06598663330078125, 0.1008758544921875, 0.13576507568359375, 0.170654296875, 0.20554351806640625, 0.2404327392578125, 0.27532196044921875, 0.310211181640625, 0.34510040283203125, 0.3799896240234375, 0.41487884521484375, 0.44976806640625, 0.48465728759765625, 0.5195465087890625, 0.5544357299804688, 0.589324951171875, 0.6242141723632812, 0.6591033935546875, 0.6939926147460938, 0.7288818359375, 0.7637710571289062, 0.7986602783203125, 0.8335494995117188, 0.868438720703125, 0.9033279418945312, 0.9382171630859375, 0.9731063842773438, 1.00799560546875, 1.0428848266601562, 1.0777740478515625, 1.1126632690429688, 1.147552490234375, 1.1824417114257812, 1.2173309326171875, 1.2522201538085938, 1.287109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 0.0, 5.0, 8.0, 6.0, 17.0, 21.0, 18.0, 23.0, 38.0, 38.0, 38.0, 54.0, 76.0, 85.0, 98.0, 102.0, 79.0, 49.0, 43.0, 32.0, 36.0, 33.0, 14.0, 13.0, 14.0, 6.0, 7.0, 5.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8857421875, -0.8575668334960938, -0.8293914794921875, -0.8012161254882812, -0.773040771484375, -0.7448654174804688, -0.7166900634765625, -0.6885147094726562, -0.66033935546875, -0.6321640014648438, -0.6039886474609375, -0.5758132934570312, -0.547637939453125, -0.5194625854492188, -0.4912872314453125, -0.46311187744140625, -0.4349365234375, -0.40676116943359375, -0.3785858154296875, -0.35041046142578125, -0.322235107421875, -0.29405975341796875, -0.2658843994140625, -0.23770904541015625, -0.20953369140625, -0.18135833740234375, -0.1531829833984375, -0.12500762939453125, -0.096832275390625, -0.06865692138671875, -0.0404815673828125, -0.01230621337890625, 0.015869140625, 0.04404449462890625, 0.0722198486328125, 0.10039520263671875, 0.128570556640625, 0.15674591064453125, 0.1849212646484375, 0.21309661865234375, 0.24127197265625, 0.26944732666015625, 0.2976226806640625, 0.32579803466796875, 0.353973388671875, 0.38214874267578125, 0.4103240966796875, 0.43849945068359375, 0.4666748046875, 0.49485015869140625, 0.5230255126953125, 0.5512008666992188, 0.579376220703125, 0.6075515747070312, 0.6357269287109375, 0.6639022827148438, 0.69207763671875, 0.7202529907226562, 0.7484283447265625, 0.7766036987304688, 0.804779052734375, 0.8329544067382812, 0.8611297607421875, 0.8893051147460938, 0.91748046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 9.0, 16.0, 36.0, 142.0, 314.0, 271.0, 120.0, 49.0, 23.0, 9.0, 6.0, 3.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.53903579711914, -35.59982681274414, -34.66061782836914, -33.72140884399414, -32.782203674316406, -31.842992782592773, -30.903785705566406, -29.964576721191406, -29.025367736816406, -28.086158752441406, -27.146949768066406, -26.20774269104004, -25.26853370666504, -24.32932472229004, -23.390117645263672, -22.450908660888672, -21.511699676513672, -20.572490692138672, -19.633281707763672, -18.694074630737305, -17.754865646362305, -16.815656661987305, -15.876448631286621, -14.937240600585938, -13.998031616210938, -13.058822631835938, -12.119614601135254, -11.18040657043457, -10.24119758605957, -9.30198860168457, -8.362780570983887, -7.423572063446045, -6.484363555908203, -5.545155048370361, -4.6059465408325195, -3.6667380332946777, -2.727529525756836, -1.7883210182189941, -0.8491125106811523, 0.09009599685668945, 1.0293045043945312, 1.968513011932373, 2.907721519470215, 3.8469300270080566, 4.786138534545898, 5.72534704208374, 6.664555549621582, 7.603764057159424, 8.542972564697266, 9.482181549072266, 10.42138957977295, 11.360597610473633, 12.299806594848633, 13.239015579223633, 14.178223609924316, 15.117431640625, 16.056640625, 16.995849609375, 17.93505859375, 18.874265670776367, 19.813474655151367, 20.752683639526367, 21.691890716552734, 22.631099700927734, 23.570308685302734]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 3.0, 5.0, 7.0, 10.0, 3.0, 13.0, 16.0, 14.0, 20.0, 21.0, 28.0, 25.0, 22.0, 39.0, 37.0, 30.0, 46.0, 49.0, 79.0, 80.0, 65.0, 54.0, 46.0, 35.0, 37.0, 33.0, 24.0, 22.0, 30.0, 20.0, 15.0, 11.0, 11.0, 12.0, 10.0, 11.0, 5.0, 5.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.537027359008789, -12.151224136352539, -11.765420913696289, -11.379617691040039, -10.993815422058105, -10.608012199401855, -10.222208976745605, -9.836405754089355, -9.450602531433105, -9.064799308776855, -8.678996086120605, -8.293193817138672, -7.907390117645264, -7.521587371826172, -7.135784149169922, -6.749980926513672, -6.36417818069458, -5.97837495803833, -5.592572212219238, -5.206768989562988, -4.820965766906738, -4.435162544250488, -4.0493597984313965, -3.6635565757751465, -3.2777535915374756, -2.8919506072998047, -2.5061473846435547, -2.120344400405884, -1.7345412969589233, -1.348738193511963, -0.962935209274292, -0.577131986618042, -0.1913290023803711, 0.19447407126426697, 0.580277144908905, 0.9660801887512207, 1.3518832921981812, 1.7376863956451416, 2.1234893798828125, 2.5092926025390625, 2.8950955867767334, 3.2808985710144043, 3.6667017936706543, 4.052504539489746, 4.438307762145996, 4.824110984802246, 5.209914207458496, 5.595717430114746, 5.981520175933838, 6.367323398590088, 6.75312614440918, 7.13892936706543, 7.52473258972168, 7.91053581237793, 8.29633903503418, 8.68214225769043, 9.067944526672363, 9.453747749328613, 9.839550971984863, 10.225353240966797, 10.611156463623047, 10.996959686279297, 11.382762908935547, 11.768566131591797, 12.154369354248047]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 7.0, 7.0, 11.0, 22.0, 20.0, 28.0, 47.0, 67.0, 93.0, 140.0, 184.0, 397.0, 712.0, 1597.0, 3592.0, 10027.0, 35971.0, 197270.0, 1450445.0, 2084265.0, 330582.0, 54914.0, 14643.0, 4921.0, 2084.0, 976.0, 481.0, 268.0, 183.0, 97.0, 69.0, 41.0, 38.0, 19.0, 23.0, 10.0, 3.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95947265625, -0.9296112060546875, -0.899749755859375, -0.8698883056640625, -0.84002685546875, -0.8101654052734375, -0.780303955078125, -0.7504425048828125, -0.7205810546875, -0.6907196044921875, -0.660858154296875, -0.6309967041015625, -0.60113525390625, -0.5712738037109375, -0.541412353515625, -0.5115509033203125, -0.481689453125, -0.4518280029296875, -0.421966552734375, -0.3921051025390625, -0.36224365234375, -0.3323822021484375, -0.302520751953125, -0.2726593017578125, -0.2427978515625, -0.2129364013671875, -0.183074951171875, -0.1532135009765625, -0.12335205078125, -0.0934906005859375, -0.063629150390625, -0.0337677001953125, -0.00390625, 0.0259552001953125, 0.055816650390625, 0.0856781005859375, 0.11553955078125, 0.1454010009765625, 0.175262451171875, 0.2051239013671875, 0.2349853515625, 0.2648468017578125, 0.294708251953125, 0.3245697021484375, 0.35443115234375, 0.3842926025390625, 0.414154052734375, 0.4440155029296875, 0.473876953125, 0.5037384033203125, 0.533599853515625, 0.5634613037109375, 0.59332275390625, 0.6231842041015625, 0.653045654296875, 0.6829071044921875, 0.7127685546875, 0.7426300048828125, 0.772491455078125, 0.8023529052734375, 0.83221435546875, 0.8620758056640625, 0.891937255859375, 0.9217987060546875, 0.95166015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 14.0, 21.0, 28.0, 28.0, 20.0, 33.0, 44.0, 42.0, 55.0, 49.0, 40.0, 53.0, 58.0, 53.0, 68.0, 66.0, 54.0, 45.0, 30.0, 43.0, 32.0, 18.0, 17.0, 24.0, 12.0, 5.0, 9.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.947265625, -0.9198455810546875, -0.892425537109375, -0.8650054931640625, -0.83758544921875, -0.8101654052734375, -0.782745361328125, -0.7553253173828125, -0.7279052734375, -0.7004852294921875, -0.673065185546875, -0.6456451416015625, -0.61822509765625, -0.5908050537109375, -0.563385009765625, -0.5359649658203125, -0.508544921875, -0.4811248779296875, -0.453704833984375, -0.4262847900390625, -0.39886474609375, -0.3714447021484375, -0.344024658203125, -0.3166046142578125, -0.2891845703125, -0.2617645263671875, -0.234344482421875, -0.2069244384765625, -0.17950439453125, -0.1520843505859375, -0.124664306640625, -0.0972442626953125, -0.06982421875, -0.0424041748046875, -0.014984130859375, 0.0124359130859375, 0.03985595703125, 0.0672760009765625, 0.094696044921875, 0.1221160888671875, 0.1495361328125, 0.1769561767578125, 0.204376220703125, 0.2317962646484375, 0.25921630859375, 0.2866363525390625, 0.314056396484375, 0.3414764404296875, 0.368896484375, 0.3963165283203125, 0.423736572265625, 0.4511566162109375, 0.47857666015625, 0.5059967041015625, 0.533416748046875, 0.5608367919921875, 0.5882568359375, 0.6156768798828125, 0.643096923828125, 0.6705169677734375, 0.69793701171875, 0.7253570556640625, 0.752777099609375, 0.7801971435546875, 0.8076171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 9.0, 8.0, 9.0, 31.0, 44.0, 92.0, 123.0, 242.0, 486.0, 1198.0, 3921.0, 20735.0, 278408.0, 3557938.0, 303488.0, 20687.0, 3989.0, 1383.0, 665.0, 309.0, 195.0, 111.0, 70.0, 41.0, 27.0, 9.0, 15.0, 17.0, 6.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.134765625, -2.071075439453125, -2.00738525390625, -1.943695068359375, -1.8800048828125, -1.816314697265625, -1.75262451171875, -1.688934326171875, -1.625244140625, -1.561553955078125, -1.49786376953125, -1.434173583984375, -1.3704833984375, -1.306793212890625, -1.24310302734375, -1.179412841796875, -1.11572265625, -1.052032470703125, -0.98834228515625, -0.924652099609375, -0.8609619140625, -0.797271728515625, -0.73358154296875, -0.669891357421875, -0.606201171875, -0.542510986328125, -0.47882080078125, -0.415130615234375, -0.3514404296875, -0.287750244140625, -0.22406005859375, -0.160369873046875, -0.0966796875, -0.032989501953125, 0.03070068359375, 0.094390869140625, 0.1580810546875, 0.221771240234375, 0.28546142578125, 0.349151611328125, 0.412841796875, 0.476531982421875, 0.54022216796875, 0.603912353515625, 0.6676025390625, 0.731292724609375, 0.79498291015625, 0.858673095703125, 0.92236328125, 0.986053466796875, 1.04974365234375, 1.113433837890625, 1.1771240234375, 1.240814208984375, 1.30450439453125, 1.368194580078125, 1.431884765625, 1.495574951171875, 1.55926513671875, 1.622955322265625, 1.6866455078125, 1.750335693359375, 1.81402587890625, 1.877716064453125, 1.94140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 14.0, 18.0, 15.0, 33.0, 69.0, 98.0, 157.0, 343.0, 567.0, 780.0, 840.0, 483.0, 283.0, 150.0, 86.0, 50.0, 34.0, 17.0, 5.0, 12.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.43359375, -1.3682861328125, -1.302978515625, -1.2376708984375, -1.17236328125, -1.1070556640625, -1.041748046875, -0.9764404296875, -0.9111328125, -0.8458251953125, -0.780517578125, -0.7152099609375, -0.64990234375, -0.5845947265625, -0.519287109375, -0.4539794921875, -0.388671875, -0.3233642578125, -0.258056640625, -0.1927490234375, -0.12744140625, -0.0621337890625, 0.003173828125, 0.0684814453125, 0.1337890625, 0.1990966796875, 0.264404296875, 0.3297119140625, 0.39501953125, 0.4603271484375, 0.525634765625, 0.5909423828125, 0.65625, 0.7215576171875, 0.786865234375, 0.8521728515625, 0.91748046875, 0.9827880859375, 1.048095703125, 1.1134033203125, 1.1787109375, 1.2440185546875, 1.309326171875, 1.3746337890625, 1.43994140625, 1.5052490234375, 1.570556640625, 1.6358642578125, 1.701171875, 1.7664794921875, 1.831787109375, 1.8970947265625, 1.96240234375, 2.0277099609375, 2.093017578125, 2.1583251953125, 2.2236328125, 2.2889404296875, 2.354248046875, 2.4195556640625, 2.48486328125, 2.5501708984375, 2.615478515625, 2.6807861328125, 2.74609375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 11.0, 20.0, 38.0, 111.0, 216.0, 249.0, 215.0, 78.0, 30.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.156108856201172, -22.466157913208008, -21.776208877563477, -21.086257934570312, -20.39630699157715, -19.706356048583984, -19.016407012939453, -18.32645606994629, -17.636505126953125, -16.94655418395996, -16.25660514831543, -15.566654205322266, -14.876703262329102, -14.186753273010254, -13.496803283691406, -12.806852340698242, -12.116902351379395, -11.426952362060547, -10.737001419067383, -10.047051429748535, -9.357100486755371, -8.667150497436523, -7.977200031280518, -7.287249565124512, -6.597299098968506, -5.9073486328125, -5.217398166656494, -4.527447700500488, -3.8374974727630615, -3.1475470066070557, -2.457596778869629, -1.767646312713623, -1.0776958465576172, -0.3877454400062561, 0.302204966545105, 0.9921553134918213, 1.6821057796478271, 2.372056245803833, 3.0620064735412598, 3.7519569396972656, 4.4419074058532715, 5.131857872009277, 5.821808338165283, 6.511758804321289, 7.201708793640137, 7.891659736633301, 8.581609725952148, 9.271560668945312, 9.96151065826416, 10.651460647583008, 11.341411590576172, 12.03136157989502, 12.721312522888184, 13.411262512207031, 14.101213455200195, 14.791163444519043, 15.48111343383789, 16.171064376831055, 16.861013412475586, 17.55096435546875, 18.240915298461914, 18.930866241455078, 19.62081527709961, 20.310766220092773, 21.000717163085938]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 14.0, 15.0, 5.0, 19.0, 23.0, 17.0, 22.0, 20.0, 32.0, 27.0, 27.0, 29.0, 36.0, 36.0, 38.0, 42.0, 39.0, 42.0, 41.0, 53.0, 54.0, 43.0, 32.0, 30.0, 36.0, 30.0, 31.0, 27.0, 30.0, 13.0, 21.0, 14.0, 4.0, 7.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-6.1588826179504395, -5.958489894866943, -5.758097171783447, -5.557704448699951, -5.357311725616455, -5.156919002532959, -4.956525802612305, -4.756133079528809, -4.5557403564453125, -4.355347633361816, -4.15495491027832, -3.954562187194824, -3.754169464111328, -3.553776741027832, -3.353383779525757, -3.1529910564422607, -2.9525985717773438, -2.7522058486938477, -2.5518131256103516, -2.3514204025268555, -2.1510276794433594, -1.9506348371505737, -1.750241994857788, -1.549849271774292, -1.349456548690796, -1.1490638256072998, -0.9486710429191589, -0.7482782602310181, -0.547885537147522, -0.3474928140640259, -0.14709997177124023, 0.05329275131225586, 0.25368499755859375, 0.45407775044441223, 0.6544705033302307, 0.8548632860183716, 1.0552560091018677, 1.2556487321853638, 1.4560415744781494, 1.6564342975616455, 1.8568270206451416, 2.0572197437286377, 2.257612466812134, 2.458005428314209, 2.658398151397705, 2.858790874481201, 3.0591835975646973, 3.2595763206481934, 3.4599690437316895, 3.6603617668151855, 3.8607544898986816, 4.061147212982178, 4.261539936065674, 4.46193265914917, 4.662325859069824, 4.86271858215332, 5.063111305236816, 5.2635040283203125, 5.463896751403809, 5.664289474487305, 5.864682197570801, 6.065074920654297, 6.265467643737793, 6.465860366821289, 6.666253089904785]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 9.0, 6.0, 18.0, 16.0, 27.0, 38.0, 53.0, 114.0, 228.0, 432.0, 840.0, 2016.0, 5069.0, 16077.0, 61631.0, 279425.0, 500777.0, 135018.0, 31884.0, 9094.0, 3199.0, 1329.0, 555.0, 293.0, 152.0, 88.0, 53.0, 35.0, 24.0, 15.0, 20.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7001953125, -1.64581298828125, -1.5914306640625, -1.53704833984375, -1.482666015625, -1.42828369140625, -1.3739013671875, -1.31951904296875, -1.26513671875, -1.21075439453125, -1.1563720703125, -1.10198974609375, -1.047607421875, -0.99322509765625, -0.9388427734375, -0.88446044921875, -0.830078125, -0.77569580078125, -0.7213134765625, -0.66693115234375, -0.612548828125, -0.55816650390625, -0.5037841796875, -0.44940185546875, -0.39501953125, -0.34063720703125, -0.2862548828125, -0.23187255859375, -0.177490234375, -0.12310791015625, -0.0687255859375, -0.01434326171875, 0.0400390625, 0.09442138671875, 0.1488037109375, 0.20318603515625, 0.257568359375, 0.31195068359375, 0.3663330078125, 0.42071533203125, 0.47509765625, 0.52947998046875, 0.5838623046875, 0.63824462890625, 0.692626953125, 0.74700927734375, 0.8013916015625, 0.85577392578125, 0.91015625, 0.96453857421875, 1.0189208984375, 1.07330322265625, 1.127685546875, 1.18206787109375, 1.2364501953125, 1.29083251953125, 1.34521484375, 1.39959716796875, 1.4539794921875, 1.50836181640625, 1.562744140625, 1.61712646484375, 1.6715087890625, 1.72589111328125, 1.7802734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 9.0, 19.0, 16.0, 22.0, 21.0, 33.0, 34.0, 39.0, 46.0, 46.0, 55.0, 59.0, 51.0, 62.0, 62.0, 53.0, 59.0, 44.0, 46.0, 42.0, 25.0, 25.0, 26.0, 22.0, 23.0, 19.0, 13.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.990234375, -0.9630355834960938, -0.9358367919921875, -0.9086380004882812, -0.881439208984375, -0.8542404174804688, -0.8270416259765625, -0.7998428344726562, -0.77264404296875, -0.7454452514648438, -0.7182464599609375, -0.6910476684570312, -0.663848876953125, -0.6366500854492188, -0.6094512939453125, -0.5822525024414062, -0.5550537109375, -0.5278549194335938, -0.5006561279296875, -0.47345733642578125, -0.446258544921875, -0.41905975341796875, -0.3918609619140625, -0.36466217041015625, -0.33746337890625, -0.31026458740234375, -0.2830657958984375, -0.25586700439453125, -0.228668212890625, -0.20146942138671875, -0.1742706298828125, -0.14707183837890625, -0.119873046875, -0.09267425537109375, -0.0654754638671875, -0.03827667236328125, -0.011077880859375, 0.01612091064453125, 0.0433197021484375, 0.07051849365234375, 0.09771728515625, 0.12491607666015625, 0.1521148681640625, 0.17931365966796875, 0.206512451171875, 0.23371124267578125, 0.2609100341796875, 0.28810882568359375, 0.3153076171875, 0.34250640869140625, 0.3697052001953125, 0.39690399169921875, 0.424102783203125, 0.45130157470703125, 0.4785003662109375, 0.5056991577148438, 0.53289794921875, 0.5600967407226562, 0.5872955322265625, 0.6144943237304688, 0.641693115234375, 0.6688919067382812, 0.6960906982421875, 0.7232894897460938, 0.75048828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 14.0, 14.0, 20.0, 34.0, 68.0, 97.0, 176.0, 279.0, 524.0, 1347.0, 4301.0, 24695.0, 649822.0, 342295.0, 18818.0, 3593.0, 1205.0, 574.0, 266.0, 158.0, 88.0, 47.0, 33.0, 27.0, 14.0, 10.0, 11.0, 4.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.3671875, -3.2421875, -3.1171875, -2.9921875, -2.8671875, -2.7421875, -2.6171875, -2.4921875, -2.3671875, -2.2421875, -2.1171875, -1.9921875, -1.8671875, -1.7421875, -1.6171875, -1.4921875, -1.3671875, -1.2421875, -1.1171875, -0.9921875, -0.8671875, -0.7421875, -0.6171875, -0.4921875, -0.3671875, -0.2421875, -0.1171875, 0.0078125, 0.1328125, 0.2578125, 0.3828125, 0.5078125, 0.6328125, 0.7578125, 0.8828125, 1.0078125, 1.1328125, 1.2578125, 1.3828125, 1.5078125, 1.6328125, 1.7578125, 1.8828125, 2.0078125, 2.1328125, 2.2578125, 2.3828125, 2.5078125, 2.6328125, 2.7578125, 2.8828125, 3.0078125, 3.1328125, 3.2578125, 3.3828125, 3.5078125, 3.6328125, 3.7578125, 3.8828125, 4.0078125, 4.1328125, 4.2578125, 4.3828125, 4.5078125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 7.0, 11.0, 10.0, 18.0, 18.0, 17.0, 14.0, 25.0, 32.0, 41.0, 47.0, 38.0, 50.0, 49.0, 44.0, 58.0, 39.0, 48.0, 53.0, 40.0, 37.0, 35.0, 39.0, 27.0, 34.0, 26.0, 28.0, 28.0, 12.0, 13.0, 8.0, 6.0, 6.0, 8.0, 4.0, 8.0, 6.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.9375, -2.85009765625, -2.7626953125, -2.67529296875, -2.587890625, -2.50048828125, -2.4130859375, -2.32568359375, -2.23828125, -2.15087890625, -2.0634765625, -1.97607421875, -1.888671875, -1.80126953125, -1.7138671875, -1.62646484375, -1.5390625, -1.45166015625, -1.3642578125, -1.27685546875, -1.189453125, -1.10205078125, -1.0146484375, -0.92724609375, -0.83984375, -0.75244140625, -0.6650390625, -0.57763671875, -0.490234375, -0.40283203125, -0.3154296875, -0.22802734375, -0.140625, -0.05322265625, 0.0341796875, 0.12158203125, 0.208984375, 0.29638671875, 0.3837890625, 0.47119140625, 0.55859375, 0.64599609375, 0.7333984375, 0.82080078125, 0.908203125, 0.99560546875, 1.0830078125, 1.17041015625, 1.2578125, 1.34521484375, 1.4326171875, 1.52001953125, 1.607421875, 1.69482421875, 1.7822265625, 1.86962890625, 1.95703125, 2.04443359375, 2.1318359375, 2.21923828125, 2.306640625, 2.39404296875, 2.4814453125, 2.56884765625, 2.65625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 9.0, 4.0, 13.0, 13.0, 17.0, 39.0, 60.0, 84.0, 145.0, 328.0, 786.0, 2462.0, 14478.0, 291575.0, 713430.0, 20392.0, 3113.0, 854.0, 359.0, 154.0, 92.0, 38.0, 31.0, 27.0, 14.0, 10.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.892578125, -1.825164794921875, -1.75775146484375, -1.690338134765625, -1.6229248046875, -1.555511474609375, -1.48809814453125, -1.420684814453125, -1.353271484375, -1.285858154296875, -1.21844482421875, -1.151031494140625, -1.0836181640625, -1.016204833984375, -0.94879150390625, -0.881378173828125, -0.81396484375, -0.746551513671875, -0.67913818359375, -0.611724853515625, -0.5443115234375, -0.476898193359375, -0.40948486328125, -0.342071533203125, -0.274658203125, -0.207244873046875, -0.13983154296875, -0.072418212890625, -0.0050048828125, 0.062408447265625, 0.12982177734375, 0.197235107421875, 0.2646484375, 0.332061767578125, 0.39947509765625, 0.466888427734375, 0.5343017578125, 0.601715087890625, 0.66912841796875, 0.736541748046875, 0.803955078125, 0.871368408203125, 0.93878173828125, 1.006195068359375, 1.0736083984375, 1.141021728515625, 1.20843505859375, 1.275848388671875, 1.34326171875, 1.410675048828125, 1.47808837890625, 1.545501708984375, 1.6129150390625, 1.680328369140625, 1.74774169921875, 1.815155029296875, 1.882568359375, 1.949981689453125, 2.01739501953125, 2.084808349609375, 2.1522216796875, 2.219635009765625, 2.28704833984375, 2.354461669921875, 2.421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 7.0, 4.0, 5.0, 10.0, 9.0, 2.0, 10.0, 9.0, 21.0, 27.0, 23.0, 26.0, 39.0, 48.0, 72.0, 131.0, 143.0, 136.0, 61.0, 50.0, 36.0, 20.0, 19.0, 13.0, 11.0, 12.0, 8.0, 5.0, 9.0, 4.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0002741813659667969, -0.00026664137840270996, -0.00025910139083862305, -0.00025156140327453613, -0.00024402141571044922, -0.0002364814281463623, -0.0002289414405822754, -0.00022140145301818848, -0.00021386146545410156, -0.00020632147789001465, -0.00019878149032592773, -0.00019124150276184082, -0.0001837015151977539, -0.000176161527633667, -0.00016862154006958008, -0.00016108155250549316, -0.00015354156494140625, -0.00014600157737731934, -0.00013846158981323242, -0.0001309216022491455, -0.0001233816146850586, -0.00011584162712097168, -0.00010830163955688477, -0.00010076165199279785, -9.322166442871094e-05, -8.568167686462402e-05, -7.814168930053711e-05, -7.06017017364502e-05, -6.306171417236328e-05, -5.552172660827637e-05, -4.798173904418945e-05, -4.044175148010254e-05, -3.2901763916015625e-05, -2.536177635192871e-05, -1.7821788787841797e-05, -1.0281801223754883e-05, -2.7418136596679688e-06, 4.798173904418945e-06, 1.233816146850586e-05, 1.9878149032592773e-05, 2.7418136596679688e-05, 3.49581241607666e-05, 4.2498111724853516e-05, 5.003809928894043e-05, 5.7578086853027344e-05, 6.511807441711426e-05, 7.265806198120117e-05, 8.019804954528809e-05, 8.7738037109375e-05, 9.527802467346191e-05, 0.00010281801223754883, 0.00011035799980163574, 0.00011789798736572266, 0.00012543797492980957, 0.00013297796249389648, 0.0001405179500579834, 0.0001480579376220703, 0.00015559792518615723, 0.00016313791275024414, 0.00017067790031433105, 0.00017821788787841797, 0.00018575787544250488, 0.0001932978630065918, 0.0002008378505706787, 0.00020837783813476562]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 13.0, 14.0, 24.0, 35.0, 48.0, 82.0, 167.0, 261.0, 456.0, 918.0, 2515.0, 8317.0, 40286.0, 741063.0, 222647.0, 22709.0, 5557.0, 1753.0, 756.0, 386.0, 212.0, 128.0, 64.0, 44.0, 22.0, 24.0, 16.0, 10.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.47747802734375, -1.4295654296875, -1.38165283203125, -1.333740234375, -1.28582763671875, -1.2379150390625, -1.19000244140625, -1.14208984375, -1.09417724609375, -1.0462646484375, -0.99835205078125, -0.950439453125, -0.90252685546875, -0.8546142578125, -0.80670166015625, -0.7587890625, -0.71087646484375, -0.6629638671875, -0.61505126953125, -0.567138671875, -0.51922607421875, -0.4713134765625, -0.42340087890625, -0.37548828125, -0.32757568359375, -0.2796630859375, -0.23175048828125, -0.183837890625, -0.13592529296875, -0.0880126953125, -0.04010009765625, 0.0078125, 0.05572509765625, 0.1036376953125, 0.15155029296875, 0.199462890625, 0.24737548828125, 0.2952880859375, 0.34320068359375, 0.39111328125, 0.43902587890625, 0.4869384765625, 0.53485107421875, 0.582763671875, 0.63067626953125, 0.6785888671875, 0.72650146484375, 0.7744140625, 0.82232666015625, 0.8702392578125, 0.91815185546875, 0.966064453125, 1.01397705078125, 1.0618896484375, 1.10980224609375, 1.15771484375, 1.20562744140625, 1.2535400390625, 1.30145263671875, 1.349365234375, 1.39727783203125, 1.4451904296875, 1.49310302734375, 1.541015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 4.0, 4.0, 10.0, 5.0, 10.0, 10.0, 10.0, 12.0, 22.0, 23.0, 25.0, 47.0, 65.0, 95.0, 115.0, 114.0, 99.0, 72.0, 59.0, 40.0, 30.0, 20.0, 18.0, 7.0, 10.0, 5.0, 12.0, 7.0, 5.0, 8.0, 8.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.955078125, -0.92559814453125, -0.8961181640625, -0.86663818359375, -0.837158203125, -0.80767822265625, -0.7781982421875, -0.74871826171875, -0.71923828125, -0.68975830078125, -0.6602783203125, -0.63079833984375, -0.601318359375, -0.57183837890625, -0.5423583984375, -0.51287841796875, -0.4833984375, -0.45391845703125, -0.4244384765625, -0.39495849609375, -0.365478515625, -0.33599853515625, -0.3065185546875, -0.27703857421875, -0.24755859375, -0.21807861328125, -0.1885986328125, -0.15911865234375, -0.129638671875, -0.10015869140625, -0.0706787109375, -0.04119873046875, -0.01171875, 0.01776123046875, 0.0472412109375, 0.07672119140625, 0.106201171875, 0.13568115234375, 0.1651611328125, 0.19464111328125, 0.22412109375, 0.25360107421875, 0.2830810546875, 0.31256103515625, 0.342041015625, 0.37152099609375, 0.4010009765625, 0.43048095703125, 0.4599609375, 0.48944091796875, 0.5189208984375, 0.54840087890625, 0.577880859375, 0.60736083984375, 0.6368408203125, 0.66632080078125, 0.69580078125, 0.72528076171875, 0.7547607421875, 0.78424072265625, 0.813720703125, 0.84320068359375, 0.8726806640625, 0.90216064453125, 0.931640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 5.0, 7.0, 12.0, 36.0, 62.0, 99.0, 232.0, 257.0, 142.0, 84.0, 21.0, 11.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.733699798583984, -21.057241439819336, -20.380783081054688, -19.704322814941406, -19.027864456176758, -18.35140609741211, -17.674945831298828, -16.99848747253418, -16.32202911376953, -15.645570755004883, -14.969111442565918, -14.292652130126953, -13.616193771362305, -12.939735412597656, -12.263276100158691, -11.586816787719727, -10.910358428955078, -10.23390007019043, -9.557440757751465, -8.8809814453125, -8.204523086547852, -7.528064250946045, -6.851605415344238, -6.175146579742432, -5.498687744140625, -4.822228908538818, -4.145770072937012, -3.469311237335205, -2.7928524017333984, -2.116393566131592, -1.4399347305297852, -0.7634758949279785, -0.08701896667480469, 0.589439868927002, 1.2658987045288086, 1.9423575401306152, 2.618816375732422, 3.2952752113342285, 3.971734046936035, 4.648192882537842, 5.324651718139648, 6.001110553741455, 6.677569389343262, 7.354028224945068, 8.030487060546875, 8.706945419311523, 9.383404731750488, 10.059864044189453, 10.736322402954102, 11.41278076171875, 12.089240074157715, 12.76569938659668, 13.442157745361328, 14.118616104125977, 14.795075416564941, 15.471534729003906, 16.147993087768555, 16.824451446533203, 17.500911712646484, 18.177370071411133, 18.85382843017578, 19.53028678894043, 20.206745147705078, 20.88320541381836, 21.559663772583008]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 5.0, 5.0, 11.0, 4.0, 10.0, 13.0, 12.0, 19.0, 18.0, 22.0, 24.0, 33.0, 31.0, 41.0, 34.0, 33.0, 37.0, 55.0, 61.0, 80.0, 49.0, 70.0, 46.0, 44.0, 37.0, 31.0, 31.0, 23.0, 26.0, 21.0, 16.0, 15.0, 13.0, 5.0, 4.0, 4.0, 2.0, 1.0, 7.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.778682708740234, -9.441977500915527, -9.10527229309082, -8.768567085266113, -8.431861877441406, -8.0951566696167, -7.758450984954834, -7.421745777130127, -7.08504056930542, -6.748335361480713, -6.411630153656006, -6.074924468994141, -5.738219261169434, -5.401514053344727, -5.0648088455200195, -4.7281036376953125, -4.3913984298706055, -4.054693222045898, -3.7179880142211914, -3.3812825679779053, -3.0445773601531982, -2.707872152328491, -2.371166706085205, -2.034461498260498, -1.697756290435791, -1.361051082611084, -1.0243457555770874, -0.6876404285430908, -0.3509352207183838, -0.014230012893676758, 0.3224754333496094, 0.6591806411743164, 0.9958858489990234, 1.3325910568237305, 1.669296383857727, 2.0060017108917236, 2.3427069187164307, 2.6794121265411377, 3.016117572784424, 3.352822780609131, 3.689527988433838, 4.026233196258545, 4.362938404083252, 4.699644088745117, 5.036349296569824, 5.373054504394531, 5.709759712219238, 6.046464920043945, 6.383170127868652, 6.719875335693359, 7.056580543518066, 7.393285751342773, 7.7299909591674805, 8.066696166992188, 8.403402328491211, 8.740106582641602, 9.076812744140625, 9.413517951965332, 9.750223159790039, 10.086928367614746, 10.423633575439453, 10.76033878326416, 11.097043991088867, 11.43375015258789, 11.770454406738281]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 8.0, 17.0, 23.0, 36.0, 75.0, 137.0, 317.0, 910.0, 3450.0, 30779.0, 2940929.0, 1195763.0, 18118.0, 2531.0, 634.0, 254.0, 116.0, 63.0, 44.0, 23.0, 14.0, 7.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.859375, -2.777435302734375, -2.69549560546875, -2.613555908203125, -2.5316162109375, -2.449676513671875, -2.36773681640625, -2.285797119140625, -2.203857421875, -2.121917724609375, -2.03997802734375, -1.958038330078125, -1.8760986328125, -1.794158935546875, -1.71221923828125, -1.630279541015625, -1.54833984375, -1.466400146484375, -1.38446044921875, -1.302520751953125, -1.2205810546875, -1.138641357421875, -1.05670166015625, -0.974761962890625, -0.892822265625, -0.810882568359375, -0.72894287109375, -0.647003173828125, -0.5650634765625, -0.483123779296875, -0.40118408203125, -0.319244384765625, -0.2373046875, -0.155364990234375, -0.07342529296875, 0.008514404296875, 0.0904541015625, 0.172393798828125, 0.25433349609375, 0.336273193359375, 0.418212890625, 0.500152587890625, 0.58209228515625, 0.664031982421875, 0.7459716796875, 0.827911376953125, 0.90985107421875, 0.991790771484375, 1.07373046875, 1.155670166015625, 1.23760986328125, 1.319549560546875, 1.4014892578125, 1.483428955078125, 1.56536865234375, 1.647308349609375, 1.729248046875, 1.811187744140625, 1.89312744140625, 1.975067138671875, 2.0570068359375, 2.138946533203125, 2.22088623046875, 2.302825927734375, 2.384765625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 8.0, 7.0, 4.0, 11.0, 16.0, 28.0, 31.0, 35.0, 33.0, 45.0, 74.0, 66.0, 62.0, 63.0, 63.0, 74.0, 63.0, 69.0, 44.0, 56.0, 34.0, 33.0, 25.0, 12.0, 14.0, 10.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96435546875, -0.9333114624023438, -0.9022674560546875, -0.8712234497070312, -0.840179443359375, -0.8091354370117188, -0.7780914306640625, -0.7470474243164062, -0.71600341796875, -0.6849594116210938, -0.6539154052734375, -0.6228713989257812, -0.591827392578125, -0.5607833862304688, -0.5297393798828125, -0.49869537353515625, -0.4676513671875, -0.43660736083984375, -0.4055633544921875, -0.37451934814453125, -0.343475341796875, -0.31243133544921875, -0.2813873291015625, -0.25034332275390625, -0.21929931640625, -0.18825531005859375, -0.1572113037109375, -0.12616729736328125, -0.095123291015625, -0.06407928466796875, -0.0330352783203125, -0.00199127197265625, 0.029052734375, 0.06009674072265625, 0.0911407470703125, 0.12218475341796875, 0.153228759765625, 0.18427276611328125, 0.2153167724609375, 0.24636077880859375, 0.27740478515625, 0.30844879150390625, 0.3394927978515625, 0.37053680419921875, 0.401580810546875, 0.43262481689453125, 0.4636688232421875, 0.49471282958984375, 0.5257568359375, 0.5568008422851562, 0.5878448486328125, 0.6188888549804688, 0.649932861328125, 0.6809768676757812, 0.7120208740234375, 0.7430648803710938, 0.77410888671875, 0.8051528930664062, 0.8361968994140625, 0.8672409057617188, 0.898284912109375, 0.9293289184570312, 0.9603729248046875, 0.9914169311523438, 1.0224609375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 3.0, 11.0, 12.0, 16.0, 27.0, 44.0, 87.0, 161.0, 266.0, 542.0, 1257.0, 3380.0, 14056.0, 195188.0, 3791946.0, 168080.0, 13275.0, 3320.0, 1279.0, 593.0, 315.0, 156.0, 99.0, 64.0, 47.0, 20.0, 9.0, 11.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.604156494140625, -2.52862548828125, -2.453094482421875, -2.3775634765625, -2.302032470703125, -2.22650146484375, -2.150970458984375, -2.075439453125, -1.999908447265625, -1.92437744140625, -1.848846435546875, -1.7733154296875, -1.697784423828125, -1.62225341796875, -1.546722412109375, -1.47119140625, -1.395660400390625, -1.32012939453125, -1.244598388671875, -1.1690673828125, -1.093536376953125, -1.01800537109375, -0.942474365234375, -0.866943359375, -0.791412353515625, -0.71588134765625, -0.640350341796875, -0.5648193359375, -0.489288330078125, -0.41375732421875, -0.338226318359375, -0.2626953125, -0.187164306640625, -0.11163330078125, -0.036102294921875, 0.0394287109375, 0.114959716796875, 0.19049072265625, 0.266021728515625, 0.341552734375, 0.417083740234375, 0.49261474609375, 0.568145751953125, 0.6436767578125, 0.719207763671875, 0.79473876953125, 0.870269775390625, 0.94580078125, 1.021331787109375, 1.09686279296875, 1.172393798828125, 1.2479248046875, 1.323455810546875, 1.39898681640625, 1.474517822265625, 1.550048828125, 1.625579833984375, 1.70111083984375, 1.776641845703125, 1.8521728515625, 1.927703857421875, 2.00323486328125, 2.078765869140625, 2.154296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 3.0, 9.0, 18.0, 31.0, 32.0, 54.0, 116.0, 203.0, 355.0, 649.0, 837.0, 718.0, 447.0, 247.0, 120.0, 77.0, 51.0, 24.0, 14.0, 10.0, 8.0, 12.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1559295654296875, -1.099945068359375, -1.0439605712890625, -0.98797607421875, -0.9319915771484375, -0.876007080078125, -0.8200225830078125, -0.7640380859375, -0.7080535888671875, -0.652069091796875, -0.5960845947265625, -0.54010009765625, -0.4841156005859375, -0.428131103515625, -0.3721466064453125, -0.316162109375, -0.2601776123046875, -0.204193115234375, -0.1482086181640625, -0.09222412109375, -0.0362396240234375, 0.019744873046875, 0.0757293701171875, 0.1317138671875, 0.1876983642578125, 0.243682861328125, 0.2996673583984375, 0.35565185546875, 0.4116363525390625, 0.467620849609375, 0.5236053466796875, 0.57958984375, 0.6355743408203125, 0.691558837890625, 0.7475433349609375, 0.80352783203125, 0.8595123291015625, 0.915496826171875, 0.9714813232421875, 1.0274658203125, 1.0834503173828125, 1.139434814453125, 1.1954193115234375, 1.25140380859375, 1.3073883056640625, 1.363372802734375, 1.4193572998046875, 1.475341796875, 1.5313262939453125, 1.587310791015625, 1.6432952880859375, 1.69927978515625, 1.7552642822265625, 1.811248779296875, 1.8672332763671875, 1.9232177734375, 1.9792022705078125, 2.035186767578125, 2.0911712646484375, 2.14715576171875, 2.2031402587890625, 2.259124755859375, 2.3151092529296875, 2.37109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 8.0, 9.0, 14.0, 48.0, 153.0, 256.0, 287.0, 117.0, 57.0, 26.0, 7.0, 3.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.355823516845703, -21.633390426635742, -20.910959243774414, -20.188526153564453, -19.466094970703125, -18.743661880493164, -18.021228790283203, -17.298797607421875, -16.576364517211914, -15.85393238067627, -15.131500244140625, -14.409067153930664, -13.68663501739502, -12.964202880859375, -12.241769790649414, -11.51933765411377, -10.796905517578125, -10.07447338104248, -9.352041244506836, -8.629608154296875, -7.9071760177612305, -7.184743881225586, -6.462311267852783, -5.7398786544799805, -5.017446517944336, -4.295014381408691, -3.5725817680358887, -2.850149393081665, -2.1277170181274414, -1.4052846431732178, -0.6828522682189941, 0.039580345153808594, 0.7620105743408203, 1.484442949295044, 2.2068753242492676, 2.929307699203491, 3.651740074157715, 4.374172210693359, 5.096604824066162, 5.819037437438965, 6.541469573974609, 7.263901710510254, 7.986334323883057, 8.70876693725586, 9.431199073791504, 10.153631210327148, 10.87606430053711, 11.598496437072754, 12.320928573608398, 13.043360710144043, 13.765792846679688, 14.488225936889648, 15.210658073425293, 15.933090209960938, 16.6555233001709, 17.37795639038086, 18.100387573242188, 18.82282066345215, 19.545251846313477, 20.267684936523438, 20.990116119384766, 21.712549209594727, 22.434982299804688, 23.157413482666016, 23.879846572875977]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 7.0, 14.0, 21.0, 13.0, 37.0, 49.0, 49.0, 57.0, 70.0, 66.0, 73.0, 73.0, 65.0, 61.0, 69.0, 63.0, 43.0, 36.0, 34.0, 30.0, 14.0, 17.0, 8.0, 6.0, 6.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.74617862701416, -10.46107292175293, -10.175966262817383, -9.890859603881836, -9.605753898620605, -9.320648193359375, -9.035541534423828, -8.750434875488281, -8.46532917022705, -8.18022346496582, -7.895116806030273, -7.610010623931885, -7.324904441833496, -7.039798259735107, -6.754692077636719, -6.46958589553833, -6.184479713439941, -5.899373531341553, -5.614267349243164, -5.329161167144775, -5.044054985046387, -4.758948802947998, -4.473842620849609, -4.188736438751221, -3.903630256652832, -3.6185240745544434, -3.3334178924560547, -3.048311710357666, -2.7632055282592773, -2.4780993461608887, -2.1929931640625, -1.9078869819641113, -1.6227798461914062, -1.3376736640930176, -1.052567481994629, -0.7674612998962402, -0.48235511779785156, -0.1972489356994629, 0.08785724639892578, 0.37296342849731445, 0.6580696105957031, 0.9431757926940918, 1.2282819747924805, 1.5133881568908691, 1.7984943389892578, 2.0836005210876465, 2.368706703186035, 2.653812885284424, 2.9389190673828125, 3.224025249481201, 3.50913143157959, 3.7942376136779785, 4.079343795776367, 4.364449977874756, 4.6495561599731445, 4.934662342071533, 5.219768524169922, 5.5048747062683105, 5.789980888366699, 6.075087070465088, 6.360193252563477, 6.645299434661865, 6.930405616760254, 7.215511798858643, 7.500617980957031]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 7.0, 15.0, 15.0, 20.0, 27.0, 65.0, 67.0, 160.0, 252.0, 569.0, 1412.0, 3972.0, 14068.0, 74480.0, 436222.0, 425471.0, 71758.0, 13706.0, 3777.0, 1317.0, 561.0, 257.0, 129.0, 79.0, 48.0, 28.0, 19.0, 12.0, 16.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.001953125, -1.9478302001953125, -1.893707275390625, -1.8395843505859375, -1.78546142578125, -1.7313385009765625, -1.677215576171875, -1.6230926513671875, -1.5689697265625, -1.5148468017578125, -1.460723876953125, -1.4066009521484375, -1.35247802734375, -1.2983551025390625, -1.244232177734375, -1.1901092529296875, -1.135986328125, -1.0818634033203125, -1.027740478515625, -0.9736175537109375, -0.91949462890625, -0.8653717041015625, -0.811248779296875, -0.7571258544921875, -0.7030029296875, -0.6488800048828125, -0.594757080078125, -0.5406341552734375, -0.48651123046875, -0.4323883056640625, -0.378265380859375, -0.3241424560546875, -0.27001953125, -0.2158966064453125, -0.161773681640625, -0.1076507568359375, -0.05352783203125, 0.0005950927734375, 0.054718017578125, 0.1088409423828125, 0.1629638671875, 0.2170867919921875, 0.271209716796875, 0.3253326416015625, 0.37945556640625, 0.4335784912109375, 0.487701416015625, 0.5418243408203125, 0.595947265625, 0.6500701904296875, 0.704193115234375, 0.7583160400390625, 0.81243896484375, 0.8665618896484375, 0.920684814453125, 0.9748077392578125, 1.0289306640625, 1.0830535888671875, 1.137176513671875, 1.1912994384765625, 1.24542236328125, 1.2995452880859375, 1.353668212890625, 1.4077911376953125, 1.4619140625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 5.0, 5.0, 5.0, 6.0, 11.0, 19.0, 21.0, 27.0, 38.0, 42.0, 38.0, 43.0, 59.0, 65.0, 71.0, 55.0, 65.0, 48.0, 58.0, 61.0, 49.0, 51.0, 46.0, 19.0, 24.0, 13.0, 16.0, 9.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.005859375, -0.97674560546875, -0.9476318359375, -0.91851806640625, -0.889404296875, -0.86029052734375, -0.8311767578125, -0.80206298828125, -0.77294921875, -0.74383544921875, -0.7147216796875, -0.68560791015625, -0.656494140625, -0.62738037109375, -0.5982666015625, -0.56915283203125, -0.5400390625, -0.51092529296875, -0.4818115234375, -0.45269775390625, -0.423583984375, -0.39447021484375, -0.3653564453125, -0.33624267578125, -0.30712890625, -0.27801513671875, -0.2489013671875, -0.21978759765625, -0.190673828125, -0.16156005859375, -0.1324462890625, -0.10333251953125, -0.07421875, -0.04510498046875, -0.0159912109375, 0.01312255859375, 0.042236328125, 0.07135009765625, 0.1004638671875, 0.12957763671875, 0.15869140625, 0.18780517578125, 0.2169189453125, 0.24603271484375, 0.275146484375, 0.30426025390625, 0.3333740234375, 0.36248779296875, 0.3916015625, 0.42071533203125, 0.4498291015625, 0.47894287109375, 0.508056640625, 0.53717041015625, 0.5662841796875, 0.59539794921875, 0.62451171875, 0.65362548828125, 0.6827392578125, 0.71185302734375, 0.740966796875, 0.77008056640625, 0.7991943359375, 0.82830810546875, 0.857421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 8.0, 6.0, 11.0, 14.0, 28.0, 27.0, 30.0, 55.0, 85.0, 130.0, 239.0, 399.0, 846.0, 2275.0, 7063.0, 31986.0, 211679.0, 658017.0, 109722.0, 18111.0, 4715.0, 1580.0, 674.0, 305.0, 177.0, 134.0, 74.0, 46.0, 26.0, 22.0, 17.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.451171875, -1.3980712890625, -1.344970703125, -1.2918701171875, -1.23876953125, -1.1856689453125, -1.132568359375, -1.0794677734375, -1.0263671875, -0.9732666015625, -0.920166015625, -0.8670654296875, -0.81396484375, -0.7608642578125, -0.707763671875, -0.6546630859375, -0.6015625, -0.5484619140625, -0.495361328125, -0.4422607421875, -0.38916015625, -0.3360595703125, -0.282958984375, -0.2298583984375, -0.1767578125, -0.1236572265625, -0.070556640625, -0.0174560546875, 0.03564453125, 0.0887451171875, 0.141845703125, 0.1949462890625, 0.248046875, 0.3011474609375, 0.354248046875, 0.4073486328125, 0.46044921875, 0.5135498046875, 0.566650390625, 0.6197509765625, 0.6728515625, 0.7259521484375, 0.779052734375, 0.8321533203125, 0.88525390625, 0.9383544921875, 0.991455078125, 1.0445556640625, 1.09765625, 1.1507568359375, 1.203857421875, 1.2569580078125, 1.31005859375, 1.3631591796875, 1.416259765625, 1.4693603515625, 1.5224609375, 1.5755615234375, 1.628662109375, 1.6817626953125, 1.73486328125, 1.7879638671875, 1.841064453125, 1.8941650390625, 1.947265625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 8.0, 6.0, 8.0, 9.0, 18.0, 16.0, 19.0, 26.0, 25.0, 36.0, 34.0, 61.0, 39.0, 55.0, 51.0, 69.0, 48.0, 53.0, 58.0, 49.0, 46.0, 42.0, 48.0, 34.0, 32.0, 25.0, 17.0, 10.0, 8.0, 9.0, 4.0, 13.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.807403564453125, -2.72027587890625, -2.633148193359375, -2.5460205078125, -2.458892822265625, -2.37176513671875, -2.284637451171875, -2.197509765625, -2.110382080078125, -2.02325439453125, -1.936126708984375, -1.8489990234375, -1.761871337890625, -1.67474365234375, -1.587615966796875, -1.50048828125, -1.413360595703125, -1.32623291015625, -1.239105224609375, -1.1519775390625, -1.064849853515625, -0.97772216796875, -0.890594482421875, -0.803466796875, -0.716339111328125, -0.62921142578125, -0.542083740234375, -0.4549560546875, -0.367828369140625, -0.28070068359375, -0.193572998046875, -0.1064453125, -0.019317626953125, 0.06781005859375, 0.154937744140625, 0.2420654296875, 0.329193115234375, 0.41632080078125, 0.503448486328125, 0.590576171875, 0.677703857421875, 0.76483154296875, 0.851959228515625, 0.9390869140625, 1.026214599609375, 1.11334228515625, 1.200469970703125, 1.28759765625, 1.374725341796875, 1.46185302734375, 1.548980712890625, 1.6361083984375, 1.723236083984375, 1.81036376953125, 1.897491455078125, 1.984619140625, 2.071746826171875, 2.15887451171875, 2.246002197265625, 2.3331298828125, 2.420257568359375, 2.50738525390625, 2.594512939453125, 2.681640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 13.0, 10.0, 25.0, 35.0, 67.0, 132.0, 205.0, 493.0, 1460.0, 4494.0, 15956.0, 74206.0, 604667.0, 283230.0, 47264.0, 11130.0, 3232.0, 1091.0, 386.0, 186.0, 102.0, 62.0, 26.0, 20.0, 10.0, 5.0, 9.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6923828125, -0.6725234985351562, -0.6526641845703125, -0.6328048706054688, -0.612945556640625, -0.5930862426757812, -0.5732269287109375, -0.5533676147460938, -0.53350830078125, -0.5136489868164062, -0.4937896728515625, -0.47393035888671875, -0.454071044921875, -0.43421173095703125, -0.4143524169921875, -0.39449310302734375, -0.3746337890625, -0.35477447509765625, -0.3349151611328125, -0.31505584716796875, -0.295196533203125, -0.27533721923828125, -0.2554779052734375, -0.23561859130859375, -0.21575927734375, -0.19589996337890625, -0.1760406494140625, -0.15618133544921875, -0.136322021484375, -0.11646270751953125, -0.0966033935546875, -0.07674407958984375, -0.056884765625, -0.03702545166015625, -0.0171661376953125, 0.00269317626953125, 0.022552490234375, 0.04241180419921875, 0.0622711181640625, 0.08213043212890625, 0.10198974609375, 0.12184906005859375, 0.1417083740234375, 0.16156768798828125, 0.181427001953125, 0.20128631591796875, 0.2211456298828125, 0.24100494384765625, 0.2608642578125, 0.28072357177734375, 0.3005828857421875, 0.32044219970703125, 0.340301513671875, 0.36016082763671875, 0.3800201416015625, 0.39987945556640625, 0.41973876953125, 0.43959808349609375, 0.4594573974609375, 0.47931671142578125, 0.499176025390625, 0.5190353393554688, 0.5388946533203125, 0.5587539672851562, 0.57861328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 7.0, 5.0, 13.0, 14.0, 15.0, 10.0, 24.0, 44.0, 47.0, 74.0, 93.0, 111.0, 113.0, 118.0, 88.0, 63.0, 41.0, 38.0, 16.0, 10.0, 9.0, 7.0, 7.0, 7.0, 6.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014507770538330078, -0.00014009512960910797, -0.00013511255383491516, -0.00013012997806072235, -0.00012514740228652954, -0.00012016482651233673, -0.00011518225073814392, -0.00011019967496395111, -0.0001052170991897583, -0.00010023452341556549, -9.525194764137268e-05, -9.026937186717987e-05, -8.528679609298706e-05, -8.030422031879425e-05, -7.532164454460144e-05, -7.033906877040863e-05, -6.535649299621582e-05, -6.037391722202301e-05, -5.53913414478302e-05, -5.040876567363739e-05, -4.542618989944458e-05, -4.044361412525177e-05, -3.546103835105896e-05, -3.047846257686615e-05, -2.549588680267334e-05, -2.051331102848053e-05, -1.553073525428772e-05, -1.054815948009491e-05, -5.5655837059021e-06, -5.830079317092896e-07, 4.3995678424835205e-06, 9.38214361667633e-06, 1.436471939086914e-05, 1.934729516506195e-05, 2.432987093925476e-05, 2.931244671344757e-05, 3.429502248764038e-05, 3.927759826183319e-05, 4.4260174036026e-05, 4.924274981021881e-05, 5.422532558441162e-05, 5.920790135860443e-05, 6.419047713279724e-05, 6.917305290699005e-05, 7.415562868118286e-05, 7.913820445537567e-05, 8.412078022956848e-05, 8.910335600376129e-05, 9.40859317779541e-05, 9.906850755214691e-05, 0.00010405108332633972, 0.00010903365910053253, 0.00011401623487472534, 0.00011899881064891815, 0.00012398138642311096, 0.00012896396219730377, 0.00013394653797149658, 0.0001389291137456894, 0.0001439116895198822, 0.000148894265294075, 0.00015387684106826782, 0.00015885941684246063, 0.00016384199261665344, 0.00016882456839084625, 0.00017380714416503906]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 12.0, 7.0, 17.0, 17.0, 31.0, 62.0, 100.0, 211.0, 449.0, 1176.0, 3694.0, 15536.0, 93056.0, 697737.0, 199323.0, 28158.0, 6073.0, 1762.0, 609.0, 234.0, 126.0, 71.0, 47.0, 22.0, 13.0, 5.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.85498046875, -0.8316726684570312, -0.8083648681640625, -0.7850570678710938, -0.761749267578125, -0.7384414672851562, -0.7151336669921875, -0.6918258666992188, -0.66851806640625, -0.6452102661132812, -0.6219024658203125, -0.5985946655273438, -0.575286865234375, -0.5519790649414062, -0.5286712646484375, -0.5053634643554688, -0.4820556640625, -0.45874786376953125, -0.4354400634765625, -0.41213226318359375, -0.388824462890625, -0.36551666259765625, -0.3422088623046875, -0.31890106201171875, -0.29559326171875, -0.27228546142578125, -0.2489776611328125, -0.22566986083984375, -0.202362060546875, -0.17905426025390625, -0.1557464599609375, -0.13243865966796875, -0.109130859375, -0.08582305908203125, -0.0625152587890625, -0.03920745849609375, -0.015899658203125, 0.00740814208984375, 0.0307159423828125, 0.05402374267578125, 0.07733154296875, 0.10063934326171875, 0.1239471435546875, 0.14725494384765625, 0.170562744140625, 0.19387054443359375, 0.2171783447265625, 0.24048614501953125, 0.2637939453125, 0.28710174560546875, 0.3104095458984375, 0.33371734619140625, 0.357025146484375, 0.38033294677734375, 0.4036407470703125, 0.42694854736328125, 0.45025634765625, 0.47356414794921875, 0.4968719482421875, 0.5201797485351562, 0.543487548828125, 0.5667953491210938, 0.5901031494140625, 0.6134109497070312, 0.63671875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 11.0, 13.0, 26.0, 23.0, 26.0, 25.0, 59.0, 55.0, 57.0, 78.0, 86.0, 93.0, 64.0, 77.0, 47.0, 56.0, 39.0, 42.0, 21.0, 19.0, 15.0, 9.0, 5.0, 12.0, 8.0, 3.0, 2.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.72705078125, -0.7090568542480469, -0.6910629272460938, -0.6730690002441406, -0.6550750732421875, -0.6370811462402344, -0.6190872192382812, -0.6010932922363281, -0.583099365234375, -0.5651054382324219, -0.5471115112304688, -0.5291175842285156, -0.5111236572265625, -0.4931297302246094, -0.47513580322265625, -0.4571418762207031, -0.43914794921875, -0.4211540222167969, -0.40316009521484375, -0.3851661682128906, -0.3671722412109375, -0.3491783142089844, -0.33118438720703125, -0.3131904602050781, -0.295196533203125, -0.2772026062011719, -0.25920867919921875, -0.24121475219726562, -0.2232208251953125, -0.20522689819335938, -0.18723297119140625, -0.16923904418945312, -0.1512451171875, -0.13325119018554688, -0.11525726318359375, -0.09726333618164062, -0.0792694091796875, -0.061275482177734375, -0.04328155517578125, -0.025287628173828125, -0.007293701171875, 0.010700225830078125, 0.02869415283203125, 0.046688079833984375, 0.0646820068359375, 0.08267593383789062, 0.10066986083984375, 0.11866378784179688, 0.13665771484375, 0.15465164184570312, 0.17264556884765625, 0.19063949584960938, 0.2086334228515625, 0.22662734985351562, 0.24462127685546875, 0.2626152038574219, 0.280609130859375, 0.2986030578613281, 0.31659698486328125, 0.3345909118652344, 0.3525848388671875, 0.3705787658691406, 0.38857269287109375, 0.4065666198730469, 0.424560546875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 28.0, 47.0, 78.0, 141.0, 296.0, 145.0, 99.0, 57.0, 35.0, 17.0, 13.0, 7.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.53817081451416, -7.108944892883301, -6.679718494415283, -6.250492572784424, -5.821266174316406, -5.392040252685547, -4.9628143310546875, -4.533588409423828, -4.1043620109558105, -3.675135850906372, -3.2459096908569336, -2.816683769226074, -2.3874576091766357, -1.9582314491271973, -1.529005527496338, -1.0997793674468994, -0.6705532073974609, -0.24132710695266724, 0.18789899349212646, 0.6171250343322754, 1.0463511943817139, 1.4755773544311523, 1.9048032760620117, 2.33402943611145, 2.7632555961608887, 3.192481756210327, 3.6217079162597656, 4.050933837890625, 4.480159759521484, 4.909386157989502, 5.338612079620361, 5.767838478088379, 6.197063446044922, 6.626289367675781, 7.055515766143799, 7.484741687774658, 7.913968086242676, 8.343194007873535, 8.772419929504395, 9.201645851135254, 9.63087272644043, 10.060098648071289, 10.489324569702148, 10.918550491333008, 11.347777366638184, 11.777003288269043, 12.206229209899902, 12.635455131530762, 13.064681053161621, 13.49390697479248, 13.92313289642334, 14.352359771728516, 14.781585693359375, 15.210811614990234, 15.640037536621094, 16.069263458251953, 16.498489379882812, 16.927715301513672, 17.35694122314453, 17.78616714477539, 18.21539306640625, 18.64461898803711, 19.07384490966797, 19.50307273864746, 19.93229866027832]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 8.0, 13.0, 15.0, 15.0, 24.0, 25.0, 28.0, 34.0, 39.0, 38.0, 44.0, 51.0, 78.0, 108.0, 88.0, 64.0, 51.0, 37.0, 40.0, 17.0, 31.0, 39.0, 24.0, 20.0, 19.0, 12.0, 12.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.512866020202637, -9.144973754882812, -8.777080535888672, -8.409188270568848, -8.041296005249023, -7.673402786254883, -7.305510520935059, -6.937617778778076, -6.569725036621094, -6.201832294464111, -5.833939552307129, -5.466047286987305, -5.098154544830322, -4.73026180267334, -4.362369537353516, -3.994476795196533, -3.626584053039551, -3.2586913108825684, -2.890798807144165, -2.5229063034057617, -2.1550135612487793, -1.7871209383010864, -1.4192283153533936, -1.0513358116149902, -0.6834430694580078, -0.31555044651031494, 0.05234217643737793, 0.4202347993850708, 0.7881274223327637, 1.1560200452804565, 1.5239126682281494, 1.8918051719665527, 2.259697914123535, 2.6275906562805176, 2.995483160018921, 3.363375663757324, 3.7312684059143066, 4.099161148071289, 4.467053413391113, 4.834946155548096, 5.202838897705078, 5.5707316398620605, 5.938624382019043, 6.306516647338867, 6.67440938949585, 7.042302131652832, 7.410194396972656, 7.778087139129639, 8.145979881286621, 8.513872146606445, 8.881765365600586, 9.24965763092041, 9.617549896240234, 9.985443115234375, 10.3533353805542, 10.721227645874023, 11.089120864868164, 11.457013130187988, 11.824906349182129, 12.192798614501953, 12.560691833496094, 12.928584098815918, 13.296476364135742, 13.664369583129883, 14.032261848449707]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 10.0, 11.0, 11.0, 21.0, 35.0, 47.0, 76.0, 150.0, 271.0, 600.0, 1585.0, 6046.0, 39335.0, 824614.0, 3123143.0, 177145.0, 15842.0, 3445.0, 1048.0, 409.0, 172.0, 105.0, 66.0, 33.0, 26.0, 12.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.16748046875, -1.123046875, -1.07861328125, -1.0341796875, -0.98974609375, -0.9453125, -0.90087890625, -0.8564453125, -0.81201171875, -0.767578125, -0.72314453125, -0.6787109375, -0.63427734375, -0.58984375, -0.54541015625, -0.5009765625, -0.45654296875, -0.412109375, -0.36767578125, -0.3232421875, -0.27880859375, -0.234375, -0.18994140625, -0.1455078125, -0.10107421875, -0.056640625, -0.01220703125, 0.0322265625, 0.07666015625, 0.12109375, 0.16552734375, 0.2099609375, 0.25439453125, 0.298828125, 0.34326171875, 0.3876953125, 0.43212890625, 0.4765625, 0.52099609375, 0.5654296875, 0.60986328125, 0.654296875, 0.69873046875, 0.7431640625, 0.78759765625, 0.83203125, 0.87646484375, 0.9208984375, 0.96533203125, 1.009765625, 1.05419921875, 1.0986328125, 1.14306640625, 1.1875, 1.23193359375, 1.2763671875, 1.32080078125, 1.365234375, 1.40966796875, 1.4541015625, 1.49853515625, 1.54296875, 1.58740234375, 1.6318359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 9.0, 19.0, 10.0, 21.0, 24.0, 24.0, 28.0, 34.0, 40.0, 56.0, 54.0, 51.0, 77.0, 53.0, 51.0, 55.0, 59.0, 55.0, 52.0, 40.0, 33.0, 28.0, 27.0, 20.0, 15.0, 10.0, 10.0, 7.0, 5.0, 3.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8359375, -0.8117523193359375, -0.787567138671875, -0.7633819580078125, -0.73919677734375, -0.7150115966796875, -0.690826416015625, -0.6666412353515625, -0.6424560546875, -0.6182708740234375, -0.594085693359375, -0.5699005126953125, -0.54571533203125, -0.5215301513671875, -0.497344970703125, -0.4731597900390625, -0.448974609375, -0.4247894287109375, -0.400604248046875, -0.3764190673828125, -0.35223388671875, -0.3280487060546875, -0.303863525390625, -0.2796783447265625, -0.2554931640625, -0.2313079833984375, -0.207122802734375, -0.1829376220703125, -0.15875244140625, -0.1345672607421875, -0.110382080078125, -0.0861968994140625, -0.06201171875, -0.0378265380859375, -0.013641357421875, 0.0105438232421875, 0.03472900390625, 0.0589141845703125, 0.083099365234375, 0.1072845458984375, 0.1314697265625, 0.1556549072265625, 0.179840087890625, 0.2040252685546875, 0.22821044921875, 0.2523956298828125, 0.276580810546875, 0.3007659912109375, 0.324951171875, 0.3491363525390625, 0.373321533203125, 0.3975067138671875, 0.42169189453125, 0.4458770751953125, 0.470062255859375, 0.4942474365234375, 0.5184326171875, 0.5426177978515625, 0.566802978515625, 0.5909881591796875, 0.61517333984375, 0.6393585205078125, 0.663543701171875, 0.6877288818359375, 0.7119140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 22.0, 18.0, 28.0, 54.0, 69.0, 127.0, 294.0, 624.0, 1910.0, 16646.0, 1889330.0, 2263792.0, 18267.0, 1932.0, 566.0, 275.0, 132.0, 64.0, 48.0, 30.0, 11.0, 19.0, 6.0, 4.0, 1.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.421875, -2.338409423828125, -2.25494384765625, -2.171478271484375, -2.0880126953125, -2.004547119140625, -1.92108154296875, -1.837615966796875, -1.754150390625, -1.670684814453125, -1.58721923828125, -1.503753662109375, -1.4202880859375, -1.336822509765625, -1.25335693359375, -1.169891357421875, -1.08642578125, -1.002960205078125, -0.91949462890625, -0.836029052734375, -0.7525634765625, -0.669097900390625, -0.58563232421875, -0.502166748046875, -0.418701171875, -0.335235595703125, -0.25177001953125, -0.168304443359375, -0.0848388671875, -0.001373291015625, 0.08209228515625, 0.165557861328125, 0.2490234375, 0.332489013671875, 0.41595458984375, 0.499420166015625, 0.5828857421875, 0.666351318359375, 0.74981689453125, 0.833282470703125, 0.916748046875, 1.000213623046875, 1.08367919921875, 1.167144775390625, 1.2506103515625, 1.334075927734375, 1.41754150390625, 1.501007080078125, 1.58447265625, 1.667938232421875, 1.75140380859375, 1.834869384765625, 1.9183349609375, 2.001800537109375, 2.08526611328125, 2.168731689453125, 2.252197265625, 2.335662841796875, 2.41912841796875, 2.502593994140625, 2.5860595703125, 2.669525146484375, 2.75299072265625, 2.836456298828125, 2.919921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 9.0, 10.0, 21.0, 32.0, 69.0, 157.0, 315.0, 652.0, 1136.0, 856.0, 455.0, 177.0, 94.0, 35.0, 23.0, 14.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.203125, -2.137664794921875, -2.07220458984375, -2.006744384765625, -1.9412841796875, -1.875823974609375, -1.81036376953125, -1.744903564453125, -1.679443359375, -1.613983154296875, -1.54852294921875, -1.483062744140625, -1.4176025390625, -1.352142333984375, -1.28668212890625, -1.221221923828125, -1.15576171875, -1.090301513671875, -1.02484130859375, -0.959381103515625, -0.8939208984375, -0.828460693359375, -0.76300048828125, -0.697540283203125, -0.632080078125, -0.566619873046875, -0.50115966796875, -0.435699462890625, -0.3702392578125, -0.304779052734375, -0.23931884765625, -0.173858642578125, -0.1083984375, -0.042938232421875, 0.02252197265625, 0.087982177734375, 0.1534423828125, 0.218902587890625, 0.28436279296875, 0.349822998046875, 0.415283203125, 0.480743408203125, 0.54620361328125, 0.611663818359375, 0.6771240234375, 0.742584228515625, 0.80804443359375, 0.873504638671875, 0.93896484375, 1.004425048828125, 1.06988525390625, 1.135345458984375, 1.2008056640625, 1.266265869140625, 1.33172607421875, 1.397186279296875, 1.462646484375, 1.528106689453125, 1.59356689453125, 1.659027099609375, 1.7244873046875, 1.789947509765625, 1.85540771484375, 1.920867919921875, 1.986328125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 13.0, 16.0, 19.0, 40.0, 55.0, 86.0, 109.0, 126.0, 118.0, 93.0, 103.0, 67.0, 45.0, 37.0, 17.0, 13.0, 13.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.485197067260742, -11.214035987854004, -10.942874908447266, -10.671712875366211, -10.400551795959473, -10.129390716552734, -9.858229637145996, -9.587068557739258, -9.315906524658203, -9.044745445251465, -8.773584365844727, -8.502422332763672, -8.231261253356934, -7.960100173950195, -7.688939094543457, -7.417778015136719, -7.1466169357299805, -6.875455856323242, -6.604294300079346, -6.333133220672607, -6.061971664428711, -5.790810585021973, -5.519649505615234, -5.248488426208496, -4.9773268699646, -4.706165790557861, -4.435004234313965, -4.163843154907227, -3.892681837081909, -3.621520519256592, -3.3503594398498535, -3.079198122024536, -2.8080368041992188, -2.5368754863739014, -2.265714168548584, -1.9945530891418457, -1.7233917713165283, -1.452230453491211, -1.181069254875183, -0.9099080562591553, -0.6387467384338379, -0.3675854802131653, -0.09642422199249268, 0.17473703622817993, 0.44589829444885254, 0.7170596122741699, 0.9882208108901978, 1.2593820095062256, 1.530543327331543, 1.8017046451568604, 2.0728659629821777, 2.344027042388916, 2.6151883602142334, 2.886349678039551, 3.157510757446289, 3.4286720752716064, 3.699833393096924, 3.970994710922241, 4.242156028747559, 4.513317108154297, 4.784478187561035, 5.055639743804932, 5.32680082321167, 5.597962379455566, 5.869123458862305]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 3.0, 9.0, 7.0, 13.0, 10.0, 14.0, 10.0, 22.0, 27.0, 33.0, 23.0, 47.0, 35.0, 40.0, 40.0, 52.0, 64.0, 36.0, 59.0, 50.0, 57.0, 43.0, 35.0, 37.0, 29.0, 28.0, 27.0, 21.0, 18.0, 19.0, 16.0, 17.0, 10.0, 6.0, 14.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.218724250793457, -5.0508575439453125, -4.882990837097168, -4.715124607086182, -4.547257900238037, -4.379391193389893, -4.211524963378906, -4.043658256530762, -3.875791549682617, -3.7079248428344727, -3.5400583744049072, -3.372191905975342, -3.2043251991271973, -3.0364584922790527, -2.8685920238494873, -2.700725555419922, -2.5328588485717773, -2.364992141723633, -2.1971256732940674, -2.029259204864502, -1.8613924980163574, -1.6935259103775024, -1.5256593227386475, -1.3577927350997925, -1.1899261474609375, -1.0220595598220825, -0.8541929721832275, -0.6863263845443726, -0.5184597969055176, -0.3505932092666626, -0.18272662162780762, -0.014860033988952637, 0.15300655364990234, 0.3208731412887573, 0.4887397289276123, 0.6566063165664673, 0.8244729042053223, 0.9923394918441772, 1.1602060794830322, 1.3280726671218872, 1.4959392547607422, 1.6638058423995972, 1.8316724300384521, 1.9995390176773071, 2.167405605316162, 2.3352723121643066, 2.503138780593872, 2.6710052490234375, 2.838871955871582, 3.0067386627197266, 3.174605131149292, 3.3424715995788574, 3.510338306427002, 3.6782050132751465, 3.846071481704712, 4.013937950134277, 4.181804656982422, 4.349671363830566, 4.517538070678711, 4.685404300689697, 4.853271007537842, 5.021137714385986, 5.189003944396973, 5.356870651245117, 5.524737358093262]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 2.0, 2.0, 9.0, 6.0, 19.0, 24.0, 35.0, 50.0, 74.0, 118.0, 203.0, 305.0, 574.0, 1163.0, 2735.0, 7263.0, 22875.0, 86802.0, 359510.0, 417519.0, 107202.0, 27712.0, 8467.0, 3055.0, 1296.0, 627.0, 339.0, 195.0, 114.0, 78.0, 52.0, 40.0, 28.0, 20.0, 10.0, 7.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.0928497314453125, -1.050933837890625, -1.0090179443359375, -0.96710205078125, -0.9251861572265625, -0.883270263671875, -0.8413543701171875, -0.7994384765625, -0.7575225830078125, -0.715606689453125, -0.6736907958984375, -0.63177490234375, -0.5898590087890625, -0.547943115234375, -0.5060272216796875, -0.464111328125, -0.4221954345703125, -0.380279541015625, -0.3383636474609375, -0.29644775390625, -0.2545318603515625, -0.212615966796875, -0.1707000732421875, -0.1287841796875, -0.0868682861328125, -0.044952392578125, -0.0030364990234375, 0.03887939453125, 0.0807952880859375, 0.122711181640625, 0.1646270751953125, 0.20654296875, 0.2484588623046875, 0.290374755859375, 0.3322906494140625, 0.37420654296875, 0.4161224365234375, 0.458038330078125, 0.4999542236328125, 0.5418701171875, 0.5837860107421875, 0.625701904296875, 0.6676177978515625, 0.70953369140625, 0.7514495849609375, 0.793365478515625, 0.8352813720703125, 0.877197265625, 0.9191131591796875, 0.961029052734375, 1.0029449462890625, 1.04486083984375, 1.0867767333984375, 1.128692626953125, 1.1706085205078125, 1.2125244140625, 1.2544403076171875, 1.296356201171875, 1.3382720947265625, 1.38018798828125, 1.4221038818359375, 1.464019775390625, 1.5059356689453125, 1.5478515625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 15.0, 18.0, 17.0, 26.0, 31.0, 56.0, 50.0, 56.0, 50.0, 88.0, 79.0, 73.0, 100.0, 79.0, 62.0, 46.0, 46.0, 32.0, 19.0, 16.0, 13.0, 5.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341796875, -1.3072052001953125, -1.272613525390625, -1.2380218505859375, -1.20343017578125, -1.1688385009765625, -1.134246826171875, -1.0996551513671875, -1.0650634765625, -1.0304718017578125, -0.995880126953125, -0.9612884521484375, -0.92669677734375, -0.8921051025390625, -0.857513427734375, -0.8229217529296875, -0.788330078125, -0.7537384033203125, -0.719146728515625, -0.6845550537109375, -0.64996337890625, -0.6153717041015625, -0.580780029296875, -0.5461883544921875, -0.5115966796875, -0.4770050048828125, -0.442413330078125, -0.4078216552734375, -0.37322998046875, -0.3386383056640625, -0.304046630859375, -0.2694549560546875, -0.23486328125, -0.2002716064453125, -0.165679931640625, -0.1310882568359375, -0.09649658203125, -0.0619049072265625, -0.027313232421875, 0.0072784423828125, 0.0418701171875, 0.0764617919921875, 0.111053466796875, 0.1456451416015625, 0.18023681640625, 0.2148284912109375, 0.249420166015625, 0.2840118408203125, 0.318603515625, 0.3531951904296875, 0.387786865234375, 0.4223785400390625, 0.45697021484375, 0.4915618896484375, 0.526153564453125, 0.5607452392578125, 0.5953369140625, 0.6299285888671875, 0.664520263671875, 0.6991119384765625, 0.73370361328125, 0.7682952880859375, 0.802886962890625, 0.8374786376953125, 0.8720703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 11.0, 10.0, 20.0, 20.0, 32.0, 40.0, 56.0, 84.0, 144.0, 187.0, 358.0, 581.0, 1184.0, 3075.0, 10008.0, 51974.0, 617406.0, 311857.0, 38109.0, 8098.0, 2659.0, 1175.0, 557.0, 305.0, 195.0, 129.0, 68.0, 54.0, 39.0, 28.0, 23.0, 14.0, 10.0, 4.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.890625, -1.83319091796875, -1.7757568359375, -1.71832275390625, -1.660888671875, -1.60345458984375, -1.5460205078125, -1.48858642578125, -1.43115234375, -1.37371826171875, -1.3162841796875, -1.25885009765625, -1.201416015625, -1.14398193359375, -1.0865478515625, -1.02911376953125, -0.9716796875, -0.91424560546875, -0.8568115234375, -0.79937744140625, -0.741943359375, -0.68450927734375, -0.6270751953125, -0.56964111328125, -0.51220703125, -0.45477294921875, -0.3973388671875, -0.33990478515625, -0.282470703125, -0.22503662109375, -0.1676025390625, -0.11016845703125, -0.052734375, 0.00469970703125, 0.0621337890625, 0.11956787109375, 0.177001953125, 0.23443603515625, 0.2918701171875, 0.34930419921875, 0.40673828125, 0.46417236328125, 0.5216064453125, 0.57904052734375, 0.636474609375, 0.69390869140625, 0.7513427734375, 0.80877685546875, 0.8662109375, 0.92364501953125, 0.9810791015625, 1.03851318359375, 1.095947265625, 1.15338134765625, 1.2108154296875, 1.26824951171875, 1.32568359375, 1.38311767578125, 1.4405517578125, 1.49798583984375, 1.555419921875, 1.61285400390625, 1.6702880859375, 1.72772216796875, 1.78515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 14.0, 4.0, 13.0, 18.0, 14.0, 22.0, 27.0, 40.0, 31.0, 47.0, 44.0, 64.0, 38.0, 54.0, 72.0, 52.0, 53.0, 52.0, 60.0, 53.0, 45.0, 27.0, 24.0, 25.0, 23.0, 24.0, 10.0, 12.0, 8.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.470794677734375, -2.37908935546875, -2.287384033203125, -2.1956787109375, -2.103973388671875, -2.01226806640625, -1.920562744140625, -1.828857421875, -1.737152099609375, -1.64544677734375, -1.553741455078125, -1.4620361328125, -1.370330810546875, -1.27862548828125, -1.186920166015625, -1.09521484375, -1.003509521484375, -0.91180419921875, -0.820098876953125, -0.7283935546875, -0.636688232421875, -0.54498291015625, -0.453277587890625, -0.361572265625, -0.269866943359375, -0.17816162109375, -0.086456298828125, 0.0052490234375, 0.096954345703125, 0.18865966796875, 0.280364990234375, 0.3720703125, 0.463775634765625, 0.55548095703125, 0.647186279296875, 0.7388916015625, 0.830596923828125, 0.92230224609375, 1.014007568359375, 1.105712890625, 1.197418212890625, 1.28912353515625, 1.380828857421875, 1.4725341796875, 1.564239501953125, 1.65594482421875, 1.747650146484375, 1.83935546875, 1.931060791015625, 2.02276611328125, 2.114471435546875, 2.2061767578125, 2.297882080078125, 2.38958740234375, 2.481292724609375, 2.572998046875, 2.664703369140625, 2.75640869140625, 2.848114013671875, 2.9398193359375, 3.031524658203125, 3.12322998046875, 3.214935302734375, 3.306640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 5.0, 3.0, 4.0, 12.0, 19.0, 24.0, 23.0, 31.0, 53.0, 74.0, 101.0, 183.0, 269.0, 440.0, 805.0, 1419.0, 2752.0, 5668.0, 13046.0, 34464.0, 121880.0, 644041.0, 153750.0, 41097.0, 15001.0, 6446.0, 3151.0, 1582.0, 853.0, 479.0, 307.0, 186.0, 111.0, 73.0, 62.0, 37.0, 33.0, 11.0, 18.0, 9.0, 9.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4560546875, -0.44161224365234375, -0.4271697998046875, -0.41272735595703125, -0.398284912109375, -0.38384246826171875, -0.3694000244140625, -0.35495758056640625, -0.34051513671875, -0.32607269287109375, -0.3116302490234375, -0.29718780517578125, -0.282745361328125, -0.26830291748046875, -0.2538604736328125, -0.23941802978515625, -0.2249755859375, -0.21053314208984375, -0.1960906982421875, -0.18164825439453125, -0.167205810546875, -0.15276336669921875, -0.1383209228515625, -0.12387847900390625, -0.10943603515625, -0.09499359130859375, -0.0805511474609375, -0.06610870361328125, -0.051666259765625, -0.03722381591796875, -0.0227813720703125, -0.00833892822265625, 0.006103515625, 0.02054595947265625, 0.0349884033203125, 0.04943084716796875, 0.063873291015625, 0.07831573486328125, 0.0927581787109375, 0.10720062255859375, 0.12164306640625, 0.13608551025390625, 0.1505279541015625, 0.16497039794921875, 0.179412841796875, 0.19385528564453125, 0.2082977294921875, 0.22274017333984375, 0.2371826171875, 0.25162506103515625, 0.2660675048828125, 0.28050994873046875, 0.294952392578125, 0.30939483642578125, 0.3238372802734375, 0.33827972412109375, 0.35272216796875, 0.36716461181640625, 0.3816070556640625, 0.39604949951171875, 0.410491943359375, 0.42493438720703125, 0.4393768310546875, 0.45381927490234375, 0.46826171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 7.0, 3.0, 11.0, 17.0, 24.0, 34.0, 46.0, 71.0, 115.0, 132.0, 137.0, 98.0, 84.0, 64.0, 36.0, 19.0, 22.0, 10.0, 10.0, 7.0, 3.0, 10.0, 3.0, 5.0, 7.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012624263763427734, -0.00012120045721530914, -0.00011615827679634094, -0.00011111609637737274, -0.00010607391595840454, -0.00010103173553943634, -9.598955512046814e-05, -9.094737470149994e-05, -8.590519428253174e-05, -8.086301386356354e-05, -7.582083344459534e-05, -7.077865302562714e-05, -6.573647260665894e-05, -6.0694292187690735e-05, -5.5652111768722534e-05, -5.0609931349754333e-05, -4.556775093078613e-05, -4.052557051181793e-05, -3.548339009284973e-05, -3.044120967388153e-05, -2.539902925491333e-05, -2.035684883594513e-05, -1.531466841697693e-05, -1.0272487998008728e-05, -5.230307579040527e-06, -1.8812716007232666e-07, 4.854053258895874e-06, 9.896233677864075e-06, 1.4938414096832275e-05, 1.9980594515800476e-05, 2.5022774934768677e-05, 3.0064955353736877e-05, 3.510713577270508e-05, 4.014931619167328e-05, 4.519149661064148e-05, 5.023367702960968e-05, 5.527585744857788e-05, 6.031803786754608e-05, 6.536021828651428e-05, 7.040239870548248e-05, 7.544457912445068e-05, 8.048675954341888e-05, 8.552893996238708e-05, 9.057112038135529e-05, 9.561330080032349e-05, 0.00010065548121929169, 0.00010569766163825989, 0.00011073984205722809, 0.00011578202247619629, 0.00012082420289516449, 0.0001258663833141327, 0.0001309085637331009, 0.0001359507441520691, 0.0001409929245710373, 0.0001460351049900055, 0.0001510772854089737, 0.0001561194658279419, 0.0001611616462469101, 0.0001662038266658783, 0.0001712460070848465, 0.0001762881875038147, 0.0001813303679227829, 0.0001863725483417511, 0.0001914147287607193, 0.0001964569091796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 9.0, 8.0, 14.0, 13.0, 23.0, 34.0, 36.0, 59.0, 74.0, 109.0, 179.0, 283.0, 478.0, 802.0, 1621.0, 3228.0, 7173.0, 17485.0, 50019.0, 205874.0, 615105.0, 96203.0, 28638.0, 11206.0, 4770.0, 2230.0, 1200.0, 640.0, 342.0, 207.0, 139.0, 106.0, 55.0, 46.0, 50.0, 20.0, 19.0, 9.0, 17.0, 14.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.46484375, -0.4499702453613281, -0.43509674072265625, -0.4202232360839844, -0.4053497314453125, -0.3904762268066406, -0.37560272216796875, -0.3607292175292969, -0.345855712890625, -0.3309822082519531, -0.31610870361328125, -0.3012351989746094, -0.2863616943359375, -0.2714881896972656, -0.25661468505859375, -0.24174118041992188, -0.22686767578125, -0.21199417114257812, -0.19712066650390625, -0.18224716186523438, -0.1673736572265625, -0.15250015258789062, -0.13762664794921875, -0.12275314331054688, -0.107879638671875, -0.09300613403320312, -0.07813262939453125, -0.06325912475585938, -0.0483856201171875, -0.033512115478515625, -0.01863861083984375, -0.003765106201171875, 0.0111083984375, 0.025981903076171875, 0.04085540771484375, 0.055728912353515625, 0.0706024169921875, 0.08547592163085938, 0.10034942626953125, 0.11522293090820312, 0.130096435546875, 0.14496994018554688, 0.15984344482421875, 0.17471694946289062, 0.1895904541015625, 0.20446395874023438, 0.21933746337890625, 0.23421096801757812, 0.24908447265625, 0.2639579772949219, 0.27883148193359375, 0.2937049865722656, 0.3085784912109375, 0.3234519958496094, 0.33832550048828125, 0.3531990051269531, 0.368072509765625, 0.3829460144042969, 0.39781951904296875, 0.4126930236816406, 0.4275665283203125, 0.4424400329589844, 0.45731353759765625, 0.4721870422363281, 0.487060546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0, 6.0, 7.0, 14.0, 12.0, 22.0, 25.0, 34.0, 43.0, 70.0, 86.0, 114.0, 100.0, 101.0, 84.0, 45.0, 57.0, 39.0, 31.0, 20.0, 18.0, 15.0, 11.0, 6.0, 7.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.52362060546875, -0.5057373046875, -0.48785400390625, -0.469970703125, -0.45208740234375, -0.4342041015625, -0.41632080078125, -0.3984375, -0.38055419921875, -0.3626708984375, -0.34478759765625, -0.326904296875, -0.30902099609375, -0.2911376953125, -0.27325439453125, -0.25537109375, -0.23748779296875, -0.2196044921875, -0.20172119140625, -0.183837890625, -0.16595458984375, -0.1480712890625, -0.13018798828125, -0.1123046875, -0.09442138671875, -0.0765380859375, -0.05865478515625, -0.040771484375, -0.02288818359375, -0.0050048828125, 0.01287841796875, 0.03076171875, 0.04864501953125, 0.0665283203125, 0.08441162109375, 0.102294921875, 0.12017822265625, 0.1380615234375, 0.15594482421875, 0.173828125, 0.19171142578125, 0.2095947265625, 0.22747802734375, 0.245361328125, 0.26324462890625, 0.2811279296875, 0.29901123046875, 0.31689453125, 0.33477783203125, 0.3526611328125, 0.37054443359375, 0.388427734375, 0.40631103515625, 0.4241943359375, 0.44207763671875, 0.4599609375, 0.47784423828125, 0.4957275390625, 0.51361083984375, 0.531494140625, 0.54937744140625, 0.5672607421875, 0.58514404296875, 0.60302734375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 16.0, 20.0, 126.0, 451.0, 274.0, 78.0, 19.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.717517852783203, -27.786540985107422, -26.85556411743164, -25.92458724975586, -24.993610382080078, -24.062633514404297, -23.131656646728516, -22.200679779052734, -21.269702911376953, -20.338726043701172, -19.40774917602539, -18.47677230834961, -17.545795440673828, -16.614818572998047, -15.683842658996582, -14.7528657913208, -13.821889877319336, -12.890913009643555, -11.959936141967773, -11.028959274291992, -10.097982406616211, -9.16700553894043, -8.236029624938965, -7.305052757263184, -6.374075889587402, -5.443099021911621, -4.51212215423584, -3.581145763397217, -2.6501688957214355, -1.7191920280456543, -0.7882156372070312, 0.14276123046875, 1.0737361907958984, 2.0047130584716797, 2.935689687728882, 3.866666316986084, 4.797643184661865, 5.7286200523376465, 6.6595964431762695, 7.590573310852051, 8.521550178527832, 9.452527046203613, 10.383503913879395, 11.31447982788086, 12.24545669555664, 13.176433563232422, 14.107410430908203, 15.038387298583984, 15.969364166259766, 16.900341033935547, 17.831317901611328, 18.76229476928711, 19.69327163696289, 20.624248504638672, 21.555225372314453, 22.486202239990234, 23.417179107666016, 24.348155975341797, 25.279132843017578, 26.21010971069336, 27.14108657836914, 28.072063446044922, 29.003040313720703, 29.934017181396484, 30.864992141723633]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 8.0, 5.0, 14.0, 16.0, 18.0, 21.0, 22.0, 19.0, 23.0, 27.0, 36.0, 29.0, 28.0, 35.0, 76.0, 70.0, 108.0, 70.0, 56.0, 47.0, 40.0, 34.0, 31.0, 19.0, 26.0, 16.0, 22.0, 9.0, 14.0, 10.0, 5.0, 8.0, 8.0, 8.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.930009841918945, -8.614164352416992, -8.298317909240723, -7.982471942901611, -7.6666259765625, -7.350780010223389, -7.034934043884277, -6.719088077545166, -6.403242111206055, -6.087396144866943, -5.771550178527832, -5.455704212188721, -5.139858245849609, -4.824012279510498, -4.508166313171387, -4.192320346832275, -3.876474380493164, -3.5606284141540527, -3.2447824478149414, -2.92893648147583, -2.6130905151367188, -2.2972445487976074, -1.981398582458496, -1.6655526161193848, -1.3497066497802734, -1.033860683441162, -0.7180147171020508, -0.40216875076293945, -0.08632278442382812, 0.2295231819152832, 0.5453691482543945, 0.8612151145935059, 1.1770620346069336, 1.492908000946045, 1.8087539672851562, 2.1245999336242676, 2.440445899963379, 2.7562918663024902, 3.0721378326416016, 3.387983798980713, 3.703829765319824, 4.0196757316589355, 4.335521697998047, 4.651367664337158, 4.9672136306762695, 5.283059597015381, 5.598905563354492, 5.9147515296936035, 6.230597496032715, 6.546443462371826, 6.8622894287109375, 7.178135395050049, 7.49398136138916, 7.8098273277282715, 8.125673294067383, 8.441518783569336, 8.757365226745605, 9.073211669921875, 9.389057159423828, 9.704902648925781, 10.02074909210205, 10.33659553527832, 10.652441024780273, 10.968286514282227, 11.284132957458496]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 14.0, 18.0, 25.0, 53.0, 78.0, 118.0, 232.0, 514.0, 1336.0, 5089.0, 70699.0, 3665392.0, 436202.0, 11195.0, 1976.0, 655.0, 286.0, 155.0, 92.0, 59.0, 36.0, 21.0, 8.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.887481689453125, -2.80426025390625, -2.721038818359375, -2.6378173828125, -2.554595947265625, -2.47137451171875, -2.388153076171875, -2.304931640625, -2.221710205078125, -2.13848876953125, -2.055267333984375, -1.9720458984375, -1.888824462890625, -1.80560302734375, -1.722381591796875, -1.63916015625, -1.555938720703125, -1.47271728515625, -1.389495849609375, -1.3062744140625, -1.223052978515625, -1.13983154296875, -1.056610107421875, -0.973388671875, -0.890167236328125, -0.80694580078125, -0.723724365234375, -0.6405029296875, -0.557281494140625, -0.47406005859375, -0.390838623046875, -0.3076171875, -0.224395751953125, -0.14117431640625, -0.057952880859375, 0.0252685546875, 0.108489990234375, 0.19171142578125, 0.274932861328125, 0.358154296875, 0.441375732421875, 0.52459716796875, 0.607818603515625, 0.6910400390625, 0.774261474609375, 0.85748291015625, 0.940704345703125, 1.02392578125, 1.107147216796875, 1.19036865234375, 1.273590087890625, 1.3568115234375, 1.440032958984375, 1.52325439453125, 1.606475830078125, 1.689697265625, 1.772918701171875, 1.85614013671875, 1.939361572265625, 2.0225830078125, 2.105804443359375, 2.18902587890625, 2.272247314453125, 2.35546875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 8.0, 6.0, 13.0, 8.0, 18.0, 22.0, 27.0, 18.0, 37.0, 38.0, 45.0, 44.0, 40.0, 64.0, 68.0, 62.0, 50.0, 46.0, 49.0, 59.0, 56.0, 41.0, 41.0, 28.0, 26.0, 18.0, 21.0, 10.0, 6.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7412109375, -0.7153549194335938, -0.6894989013671875, -0.6636428833007812, -0.637786865234375, -0.6119308471679688, -0.5860748291015625, -0.5602188110351562, -0.53436279296875, -0.5085067749023438, -0.4826507568359375, -0.45679473876953125, -0.430938720703125, -0.40508270263671875, -0.3792266845703125, -0.35337066650390625, -0.3275146484375, -0.30165863037109375, -0.2758026123046875, -0.24994659423828125, -0.224090576171875, -0.19823455810546875, -0.1723785400390625, -0.14652252197265625, -0.12066650390625, -0.09481048583984375, -0.0689544677734375, -0.04309844970703125, -0.017242431640625, 0.00861358642578125, 0.0344696044921875, 0.06032562255859375, 0.086181640625, 0.11203765869140625, 0.1378936767578125, 0.16374969482421875, 0.189605712890625, 0.21546173095703125, 0.2413177490234375, 0.26717376708984375, 0.29302978515625, 0.31888580322265625, 0.3447418212890625, 0.37059783935546875, 0.396453857421875, 0.42230987548828125, 0.4481658935546875, 0.47402191162109375, 0.4998779296875, 0.5257339477539062, 0.5515899658203125, 0.5774459838867188, 0.603302001953125, 0.6291580200195312, 0.6550140380859375, 0.6808700561523438, 0.70672607421875, 0.7325820922851562, 0.7584381103515625, 0.7842941284179688, 0.810150146484375, 0.8360061645507812, 0.8618621826171875, 0.8877182006835938, 0.91357421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 12.0, 13.0, 35.0, 58.0, 139.0, 390.0, 1339.0, 8853.0, 3650223.0, 527479.0, 4380.0, 909.0, 269.0, 91.0, 36.0, 32.0, 9.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.333984375, -3.194244384765625, -3.05450439453125, -2.914764404296875, -2.7750244140625, -2.635284423828125, -2.49554443359375, -2.355804443359375, -2.216064453125, -2.076324462890625, -1.93658447265625, -1.796844482421875, -1.6571044921875, -1.517364501953125, -1.37762451171875, -1.237884521484375, -1.09814453125, -0.958404541015625, -0.81866455078125, -0.678924560546875, -0.5391845703125, -0.399444580078125, -0.25970458984375, -0.119964599609375, 0.019775390625, 0.159515380859375, 0.29925537109375, 0.438995361328125, 0.5787353515625, 0.718475341796875, 0.85821533203125, 0.997955322265625, 1.1376953125, 1.277435302734375, 1.41717529296875, 1.556915283203125, 1.6966552734375, 1.836395263671875, 1.97613525390625, 2.115875244140625, 2.255615234375, 2.395355224609375, 2.53509521484375, 2.674835205078125, 2.8145751953125, 2.954315185546875, 3.09405517578125, 3.233795166015625, 3.37353515625, 3.513275146484375, 3.65301513671875, 3.792755126953125, 3.9324951171875, 4.072235107421875, 4.21197509765625, 4.351715087890625, 4.491455078125, 4.631195068359375, 4.77093505859375, 4.910675048828125, 5.0504150390625, 5.190155029296875, 5.32989501953125, 5.469635009765625, 5.609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 15.0, 44.0, 64.0, 132.0, 233.0, 450.0, 827.0, 901.0, 661.0, 321.0, 187.0, 76.0, 56.0, 39.0, 21.0, 10.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.25, -2.184234619140625, -2.11846923828125, -2.052703857421875, -1.9869384765625, -1.921173095703125, -1.85540771484375, -1.789642333984375, -1.723876953125, -1.658111572265625, -1.59234619140625, -1.526580810546875, -1.4608154296875, -1.395050048828125, -1.32928466796875, -1.263519287109375, -1.19775390625, -1.131988525390625, -1.06622314453125, -1.000457763671875, -0.9346923828125, -0.868927001953125, -0.80316162109375, -0.737396240234375, -0.671630859375, -0.605865478515625, -0.54010009765625, -0.474334716796875, -0.4085693359375, -0.342803955078125, -0.27703857421875, -0.211273193359375, -0.1455078125, -0.079742431640625, -0.01397705078125, 0.051788330078125, 0.1175537109375, 0.183319091796875, 0.24908447265625, 0.314849853515625, 0.380615234375, 0.446380615234375, 0.51214599609375, 0.577911376953125, 0.6436767578125, 0.709442138671875, 0.77520751953125, 0.840972900390625, 0.90673828125, 0.972503662109375, 1.03826904296875, 1.104034423828125, 1.1697998046875, 1.235565185546875, 1.30133056640625, 1.367095947265625, 1.432861328125, 1.498626708984375, 1.56439208984375, 1.630157470703125, 1.6959228515625, 1.761688232421875, 1.82745361328125, 1.893218994140625, 1.958984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 12.0, 11.0, 33.0, 80.0, 134.0, 206.0, 215.0, 152.0, 74.0, 36.0, 18.0, 11.0, 4.0, 2.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.01462173461914, -21.450361251831055, -20.88610076904297, -20.32183837890625, -19.757577896118164, -19.193317413330078, -18.629056930541992, -18.064796447753906, -17.500534057617188, -16.9362735748291, -16.372013092041016, -15.807751655578613, -15.243490219116211, -14.679229736328125, -14.114969253540039, -13.550707817077637, -12.98644733428955, -12.422186851501465, -11.857925415039062, -11.293664932250977, -10.729403495788574, -10.165143013000488, -9.600881576538086, -9.03662109375, -8.472360610961914, -7.90809965133667, -7.343838691711426, -6.77957820892334, -6.2153167724609375, -5.651056289672852, -5.086795330047607, -4.522534370422363, -3.958272933959961, -3.394011974334717, -2.8297510147094727, -2.2654902935028076, -1.7012293338775635, -1.1369683742523193, -0.5727076530456543, -0.008446693420410156, 0.555814266204834, 1.1200752258300781, 1.6843360662460327, 2.2485969066619873, 2.8128578662872314, 3.3771188259124756, 3.9413795471191406, 4.505640506744385, 5.069901466369629, 5.634162425994873, 6.198423385620117, 6.762683868408203, 7.3269453048706055, 7.891205787658691, 8.455467224121094, 9.01972770690918, 9.583988189697266, 10.148248672485352, 10.712510108947754, 11.27677059173584, 11.841032028198242, 12.405292510986328, 12.969552993774414, 13.533814430236816, 14.098075866699219]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 9.0, 15.0, 8.0, 22.0, 23.0, 20.0, 24.0, 28.0, 39.0, 31.0, 48.0, 40.0, 39.0, 41.0, 38.0, 71.0, 57.0, 50.0, 59.0, 44.0, 49.0, 39.0, 42.0, 29.0, 22.0, 16.0, 17.0, 21.0, 8.0, 13.0, 5.0, 10.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.788386344909668, -6.557389736175537, -6.326393127441406, -6.095396518707275, -5.8643999099731445, -5.633403301239014, -5.402406692504883, -5.171409606933594, -4.940413475036621, -4.70941686630249, -4.478420257568359, -4.2474236488342285, -4.016427040100098, -3.785430431365967, -3.554433584213257, -3.323436975479126, -3.092440128326416, -2.861443519592285, -2.6304469108581543, -2.3994503021240234, -2.1684536933898926, -1.9374569654464722, -1.7064602375030518, -1.475463628768921, -1.24446702003479, -1.0134704113006592, -0.7824737429618835, -0.5514770746231079, -0.32048046588897705, -0.08948385715484619, 0.14151287078857422, 0.3725094795227051, 0.6035056114196777, 0.8345022201538086, 1.0654988288879395, 1.2964955568313599, 1.5274921655654907, 1.7584887742996216, 1.989485502243042, 2.220482110977173, 2.4514787197113037, 2.6824753284454346, 2.9134719371795654, 3.1444687843322754, 3.3754653930664062, 3.606462001800537, 3.837458610534668, 4.068455219268799, 4.29945182800293, 4.5304484367370605, 4.761445045471191, 4.992441654205322, 5.223438262939453, 5.454434871673584, 5.685431480407715, 5.916428565979004, 6.147424697875977, 6.378421306610107, 6.609417915344238, 6.840414524078369, 7.0714111328125, 7.302407741546631, 7.533404350280762, 7.764401435852051, 7.995398044586182]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 9.0, 5.0, 18.0, 28.0, 33.0, 82.0, 122.0, 301.0, 734.0, 2165.0, 7351.0, 31649.0, 172544.0, 602127.0, 186697.0, 33207.0, 7787.0, 2224.0, 763.0, 376.0, 154.0, 73.0, 38.0, 29.0, 18.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5869140625, -1.5292510986328125, -1.471588134765625, -1.4139251708984375, -1.35626220703125, -1.2985992431640625, -1.240936279296875, -1.1832733154296875, -1.1256103515625, -1.0679473876953125, -1.010284423828125, -0.9526214599609375, -0.89495849609375, -0.8372955322265625, -0.779632568359375, -0.7219696044921875, -0.664306640625, -0.6066436767578125, -0.548980712890625, -0.4913177490234375, -0.43365478515625, -0.3759918212890625, -0.318328857421875, -0.2606658935546875, -0.2030029296875, -0.1453399658203125, -0.087677001953125, -0.0300140380859375, 0.02764892578125, 0.0853118896484375, 0.142974853515625, 0.2006378173828125, 0.25830078125, 0.3159637451171875, 0.373626708984375, 0.4312896728515625, 0.48895263671875, 0.5466156005859375, 0.604278564453125, 0.6619415283203125, 0.7196044921875, 0.7772674560546875, 0.834930419921875, 0.8925933837890625, 0.95025634765625, 1.0079193115234375, 1.065582275390625, 1.1232452392578125, 1.180908203125, 1.2385711669921875, 1.296234130859375, 1.3538970947265625, 1.41156005859375, 1.4692230224609375, 1.526885986328125, 1.5845489501953125, 1.6422119140625, 1.6998748779296875, 1.757537841796875, 1.8152008056640625, 1.87286376953125, 1.9305267333984375, 1.988189697265625, 2.0458526611328125, 2.103515625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 9.0, 15.0, 21.0, 20.0, 21.0, 19.0, 37.0, 30.0, 40.0, 46.0, 42.0, 58.0, 63.0, 60.0, 52.0, 43.0, 50.0, 58.0, 52.0, 50.0, 41.0, 37.0, 20.0, 22.0, 28.0, 13.0, 8.0, 7.0, 2.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.728515625, -0.7017288208007812, -0.6749420166015625, -0.6481552124023438, -0.621368408203125, -0.5945816040039062, -0.5677947998046875, -0.5410079956054688, -0.51422119140625, -0.48743438720703125, -0.4606475830078125, -0.43386077880859375, -0.407073974609375, -0.38028717041015625, -0.3535003662109375, -0.32671356201171875, -0.2999267578125, -0.27313995361328125, -0.2463531494140625, -0.21956634521484375, -0.192779541015625, -0.16599273681640625, -0.1392059326171875, -0.11241912841796875, -0.08563232421875, -0.05884552001953125, -0.0320587158203125, -0.00527191162109375, 0.021514892578125, 0.04830169677734375, 0.0750885009765625, 0.10187530517578125, 0.128662109375, 0.15544891357421875, 0.1822357177734375, 0.20902252197265625, 0.235809326171875, 0.26259613037109375, 0.2893829345703125, 0.31616973876953125, 0.34295654296875, 0.36974334716796875, 0.3965301513671875, 0.42331695556640625, 0.450103759765625, 0.47689056396484375, 0.5036773681640625, 0.5304641723632812, 0.5572509765625, 0.5840377807617188, 0.6108245849609375, 0.6376113891601562, 0.664398193359375, 0.6911849975585938, 0.7179718017578125, 0.7447586059570312, 0.77154541015625, 0.7983322143554688, 0.8251190185546875, 0.8519058227539062, 0.878692626953125, 0.9054794311523438, 0.9322662353515625, 0.9590530395507812, 0.98583984375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 5.0, 10.0, 6.0, 10.0, 11.0, 26.0, 28.0, 36.0, 65.0, 97.0, 122.0, 196.0, 300.0, 467.0, 885.0, 2063.0, 6208.0, 28342.0, 209422.0, 715745.0, 66684.0, 11524.0, 3292.0, 1273.0, 621.0, 361.0, 221.0, 145.0, 102.0, 73.0, 56.0, 36.0, 26.0, 21.0, 17.0, 12.0, 15.0, 5.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.87359619140625, -1.8135986328125, -1.75360107421875, -1.693603515625, -1.63360595703125, -1.5736083984375, -1.51361083984375, -1.45361328125, -1.39361572265625, -1.3336181640625, -1.27362060546875, -1.213623046875, -1.15362548828125, -1.0936279296875, -1.03363037109375, -0.9736328125, -0.91363525390625, -0.8536376953125, -0.79364013671875, -0.733642578125, -0.67364501953125, -0.6136474609375, -0.55364990234375, -0.49365234375, -0.43365478515625, -0.3736572265625, -0.31365966796875, -0.253662109375, -0.19366455078125, -0.1336669921875, -0.07366943359375, -0.013671875, 0.04632568359375, 0.1063232421875, 0.16632080078125, 0.226318359375, 0.28631591796875, 0.3463134765625, 0.40631103515625, 0.46630859375, 0.52630615234375, 0.5863037109375, 0.64630126953125, 0.706298828125, 0.76629638671875, 0.8262939453125, 0.88629150390625, 0.9462890625, 1.00628662109375, 1.0662841796875, 1.12628173828125, 1.186279296875, 1.24627685546875, 1.3062744140625, 1.36627197265625, 1.42626953125, 1.48626708984375, 1.5462646484375, 1.60626220703125, 1.666259765625, 1.72625732421875, 1.7862548828125, 1.84625244140625, 1.90625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 10.0, 6.0, 10.0, 12.0, 17.0, 15.0, 20.0, 22.0, 36.0, 43.0, 46.0, 66.0, 85.0, 69.0, 84.0, 66.0, 68.0, 64.0, 50.0, 39.0, 26.0, 36.0, 23.0, 20.0, 20.0, 17.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.39453125, -4.274261474609375, -4.15399169921875, -4.033721923828125, -3.9134521484375, -3.793182373046875, -3.67291259765625, -3.552642822265625, -3.432373046875, -3.312103271484375, -3.19183349609375, -3.071563720703125, -2.9512939453125, -2.831024169921875, -2.71075439453125, -2.590484619140625, -2.47021484375, -2.349945068359375, -2.22967529296875, -2.109405517578125, -1.9891357421875, -1.868865966796875, -1.74859619140625, -1.628326416015625, -1.508056640625, -1.387786865234375, -1.26751708984375, -1.147247314453125, -1.0269775390625, -0.906707763671875, -0.78643798828125, -0.666168212890625, -0.5458984375, -0.425628662109375, -0.30535888671875, -0.185089111328125, -0.0648193359375, 0.055450439453125, 0.17572021484375, 0.295989990234375, 0.416259765625, 0.536529541015625, 0.65679931640625, 0.777069091796875, 0.8973388671875, 1.017608642578125, 1.13787841796875, 1.258148193359375, 1.37841796875, 1.498687744140625, 1.61895751953125, 1.739227294921875, 1.8594970703125, 1.979766845703125, 2.10003662109375, 2.220306396484375, 2.340576171875, 2.460845947265625, 2.58111572265625, 2.701385498046875, 2.8216552734375, 2.941925048828125, 3.06219482421875, 3.182464599609375, 3.302734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 2.0, 8.0, 9.0, 10.0, 19.0, 35.0, 39.0, 79.0, 122.0, 208.0, 441.0, 1157.0, 3674.0, 15864.0, 107756.0, 820034.0, 81040.0, 13014.0, 3110.0, 1041.0, 405.0, 176.0, 100.0, 69.0, 43.0, 22.0, 21.0, 14.0, 8.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7928924560546875, -0.769866943359375, -0.7468414306640625, -0.72381591796875, -0.7007904052734375, -0.677764892578125, -0.6547393798828125, -0.6317138671875, -0.6086883544921875, -0.585662841796875, -0.5626373291015625, -0.53961181640625, -0.5165863037109375, -0.493560791015625, -0.4705352783203125, -0.447509765625, -0.4244842529296875, -0.401458740234375, -0.3784332275390625, -0.35540771484375, -0.3323822021484375, -0.309356689453125, -0.2863311767578125, -0.2633056640625, -0.2402801513671875, -0.217254638671875, -0.1942291259765625, -0.17120361328125, -0.1481781005859375, -0.125152587890625, -0.1021270751953125, -0.0791015625, -0.0560760498046875, -0.033050537109375, -0.0100250244140625, 0.01300048828125, 0.0360260009765625, 0.059051513671875, 0.0820770263671875, 0.1051025390625, 0.1281280517578125, 0.151153564453125, 0.1741790771484375, 0.19720458984375, 0.2202301025390625, 0.243255615234375, 0.2662811279296875, 0.289306640625, 0.3123321533203125, 0.335357666015625, 0.3583831787109375, 0.38140869140625, 0.4044342041015625, 0.427459716796875, 0.4504852294921875, 0.4735107421875, 0.4965362548828125, 0.519561767578125, 0.5425872802734375, 0.56561279296875, 0.5886383056640625, 0.611663818359375, 0.6346893310546875, 0.65771484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 7.0, 10.0, 9.0, 20.0, 20.0, 23.0, 49.0, 46.0, 80.0, 121.0, 148.0, 137.0, 90.0, 54.0, 37.0, 27.0, 13.0, 21.0, 6.0, 15.0, 5.0, 9.0, 5.0, 2.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.00020766258239746094, -0.00020199082791805267, -0.0001963190734386444, -0.00019064731895923615, -0.00018497556447982788, -0.00017930381000041962, -0.00017363205552101135, -0.0001679603010416031, -0.00016228854656219482, -0.00015661679208278656, -0.0001509450376033783, -0.00014527328312397003, -0.00013960152864456177, -0.0001339297741651535, -0.00012825801968574524, -0.00012258626520633698, -0.00011691451072692871, -0.00011124275624752045, -0.00010557100176811218, -9.989924728870392e-05, -9.422749280929565e-05, -8.855573832988739e-05, -8.288398385047913e-05, -7.721222937107086e-05, -7.15404748916626e-05, -6.586872041225433e-05, -6.019696593284607e-05, -5.4525211453437805e-05, -4.885345697402954e-05, -4.318170249462128e-05, -3.750994801521301e-05, -3.183819353580475e-05, -2.6166439056396484e-05, -2.049468457698822e-05, -1.4822930097579956e-05, -9.151175618171692e-06, -3.4794211387634277e-06, 2.1923333406448364e-06, 7.8640878200531e-06, 1.3535842299461365e-05, 1.920759677886963e-05, 2.4879351258277893e-05, 3.055110573768616e-05, 3.622286021709442e-05, 4.1894614696502686e-05, 4.756636917591095e-05, 5.3238123655319214e-05, 5.890987813472748e-05, 6.458163261413574e-05, 7.0253387093544e-05, 7.592514157295227e-05, 8.159689605236053e-05, 8.72686505317688e-05, 9.294040501117706e-05, 9.861215949058533e-05, 0.00010428391396999359, 0.00010995566844940186, 0.00011562742292881012, 0.00012129917740821838, 0.00012697093188762665, 0.0001326426863670349, 0.00013831444084644318, 0.00014398619532585144, 0.0001496579498052597, 0.00015532970428466797]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 9.0, 18.0, 28.0, 57.0, 87.0, 138.0, 229.0, 397.0, 757.0, 1597.0, 3959.0, 11616.0, 45929.0, 303150.0, 606006.0, 53606.0, 13158.0, 4235.0, 1732.0, 796.0, 422.0, 259.0, 127.0, 88.0, 45.0, 27.0, 23.0, 8.0, 11.0, 6.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5263671875, -0.50885009765625, -0.4913330078125, -0.47381591796875, -0.456298828125, -0.43878173828125, -0.4212646484375, -0.40374755859375, -0.38623046875, -0.36871337890625, -0.3511962890625, -0.33367919921875, -0.316162109375, -0.29864501953125, -0.2811279296875, -0.26361083984375, -0.24609375, -0.22857666015625, -0.2110595703125, -0.19354248046875, -0.176025390625, -0.15850830078125, -0.1409912109375, -0.12347412109375, -0.10595703125, -0.08843994140625, -0.0709228515625, -0.05340576171875, -0.035888671875, -0.01837158203125, -0.0008544921875, 0.01666259765625, 0.0341796875, 0.05169677734375, 0.0692138671875, 0.08673095703125, 0.104248046875, 0.12176513671875, 0.1392822265625, 0.15679931640625, 0.17431640625, 0.19183349609375, 0.2093505859375, 0.22686767578125, 0.244384765625, 0.26190185546875, 0.2794189453125, 0.29693603515625, 0.314453125, 0.33197021484375, 0.3494873046875, 0.36700439453125, 0.384521484375, 0.40203857421875, 0.4195556640625, 0.43707275390625, 0.45458984375, 0.47210693359375, 0.4896240234375, 0.50714111328125, 0.524658203125, 0.54217529296875, 0.5596923828125, 0.57720947265625, 0.5947265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 8.0, 10.0, 7.0, 11.0, 17.0, 23.0, 38.0, 43.0, 85.0, 110.0, 156.0, 146.0, 109.0, 90.0, 50.0, 34.0, 27.0, 16.0, 10.0, 8.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8134765625, -0.787139892578125, -0.76080322265625, -0.734466552734375, -0.7081298828125, -0.681793212890625, -0.65545654296875, -0.629119873046875, -0.602783203125, -0.576446533203125, -0.55010986328125, -0.523773193359375, -0.4974365234375, -0.471099853515625, -0.44476318359375, -0.418426513671875, -0.39208984375, -0.365753173828125, -0.33941650390625, -0.313079833984375, -0.2867431640625, -0.260406494140625, -0.23406982421875, -0.207733154296875, -0.181396484375, -0.155059814453125, -0.12872314453125, -0.102386474609375, -0.0760498046875, -0.049713134765625, -0.02337646484375, 0.002960205078125, 0.029296875, 0.055633544921875, 0.08197021484375, 0.108306884765625, 0.1346435546875, 0.160980224609375, 0.18731689453125, 0.213653564453125, 0.239990234375, 0.266326904296875, 0.29266357421875, 0.319000244140625, 0.3453369140625, 0.371673583984375, 0.39801025390625, 0.424346923828125, 0.45068359375, 0.477020263671875, 0.50335693359375, 0.529693603515625, 0.5560302734375, 0.582366943359375, 0.60870361328125, 0.635040283203125, 0.661376953125, 0.687713623046875, 0.71405029296875, 0.740386962890625, 0.7667236328125, 0.793060302734375, 0.81939697265625, 0.845733642578125, 0.8720703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 12.0, 16.0, 46.0, 140.0, 421.0, 229.0, 74.0, 29.0, 11.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.44162940979004, -21.659757614135742, -20.877885818481445, -20.09601402282715, -19.31414222717285, -18.532270431518555, -17.750396728515625, -16.968524932861328, -16.18665313720703, -15.404781341552734, -14.622909545898438, -13.84103775024414, -13.059165954589844, -12.277294158935547, -11.495421409606934, -10.713549613952637, -9.931678771972656, -9.14980697631836, -8.367935180664062, -7.586062908172607, -6.8041911125183105, -6.022319316864014, -5.240447044372559, -4.458575248718262, -3.676703453063965, -2.894831657409668, -2.112959623336792, -1.331087589263916, -0.5492157936096191, 0.23265600204467773, 1.0145282745361328, 1.7964000701904297, 2.5782718658447266, 3.3601436614990234, 4.14201545715332, 4.923887729644775, 5.705759525299072, 6.487631320953369, 7.269503593444824, 8.051375389099121, 8.833247184753418, 9.615118980407715, 10.396990776062012, 11.178863525390625, 11.960735321044922, 12.742607116699219, 13.524478912353516, 14.306350708007812, 15.08822250366211, 15.870094299316406, 16.651966094970703, 17.433837890625, 18.215709686279297, 18.997581481933594, 19.77945327758789, 20.561325073242188, 21.343196868896484, 22.12506866455078, 22.906940460205078, 23.688812255859375, 24.470684051513672, 25.25255584716797, 26.034427642822266, 26.816299438476562, 27.598173141479492]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 3.0, 10.0, 8.0, 10.0, 6.0, 11.0, 7.0, 14.0, 13.0, 14.0, 13.0, 24.0, 27.0, 27.0, 27.0, 40.0, 35.0, 43.0, 67.0, 99.0, 88.0, 57.0, 42.0, 35.0, 40.0, 34.0, 30.0, 25.0, 22.0, 17.0, 17.0, 11.0, 14.0, 11.0, 7.0, 8.0, 7.0, 3.0, 7.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-11.67521858215332, -11.349438667297363, -11.023659706115723, -10.697879791259766, -10.372100830078125, -10.046320915222168, -9.720541000366211, -9.39476203918457, -9.068982124328613, -8.743202209472656, -8.417423248291016, -8.091643333435059, -7.76586389541626, -7.440084457397461, -7.114304542541504, -6.788525104522705, -6.462745666503906, -6.136966228485107, -5.811186790466309, -5.485406875610352, -5.159627437591553, -4.833847999572754, -4.508068084716797, -4.182288646697998, -3.856509208679199, -3.5307297706604004, -3.2049500942230225, -2.8791704177856445, -2.5533909797668457, -2.227611541748047, -1.901831865310669, -1.576052188873291, -1.2502727508544922, -0.9244931936264038, -0.5987136363983154, -0.27293407917022705, 0.05284547805786133, 0.3786250352859497, 0.7044045925140381, 1.030184268951416, 1.3559637069702148, 1.6817432641983032, 2.0075228214263916, 2.3333024978637695, 2.6590819358825684, 2.984861373901367, 3.310641050338745, 3.636420726776123, 3.962200164794922, 4.287979602813721, 4.6137590408325195, 4.939538955688477, 5.265318393707275, 5.591097831726074, 5.916877746582031, 6.24265718460083, 6.568436622619629, 6.894216060638428, 7.219995498657227, 7.545775413513184, 7.871554851531982, 8.197334289550781, 8.523114204406738, 8.848894119262695, 9.174673080444336]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 10.0, 18.0, 23.0, 41.0, 62.0, 98.0, 130.0, 219.0, 419.0, 832.0, 1746.0, 4370.0, 12953.0, 60378.0, 484431.0, 2372149.0, 1088483.0, 133194.0, 23093.0, 6645.0, 2550.0, 1106.0, 581.0, 298.0, 164.0, 109.0, 56.0, 31.0, 29.0, 11.0, 10.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.408203125, -1.35736083984375, -1.3065185546875, -1.25567626953125, -1.204833984375, -1.15399169921875, -1.1031494140625, -1.05230712890625, -1.00146484375, -0.95062255859375, -0.8997802734375, -0.84893798828125, -0.798095703125, -0.74725341796875, -0.6964111328125, -0.64556884765625, -0.5947265625, -0.54388427734375, -0.4930419921875, -0.44219970703125, -0.391357421875, -0.34051513671875, -0.2896728515625, -0.23883056640625, -0.18798828125, -0.13714599609375, -0.0863037109375, -0.03546142578125, 0.015380859375, 0.06622314453125, 0.1170654296875, 0.16790771484375, 0.21875, 0.26959228515625, 0.3204345703125, 0.37127685546875, 0.422119140625, 0.47296142578125, 0.5238037109375, 0.57464599609375, 0.62548828125, 0.67633056640625, 0.7271728515625, 0.77801513671875, 0.828857421875, 0.87969970703125, 0.9305419921875, 0.98138427734375, 1.0322265625, 1.08306884765625, 1.1339111328125, 1.18475341796875, 1.235595703125, 1.28643798828125, 1.3372802734375, 1.38812255859375, 1.43896484375, 1.48980712890625, 1.5406494140625, 1.59149169921875, 1.642333984375, 1.69317626953125, 1.7440185546875, 1.79486083984375, 1.845703125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 6.0, 11.0, 18.0, 25.0, 24.0, 27.0, 39.0, 45.0, 53.0, 60.0, 59.0, 71.0, 72.0, 66.0, 64.0, 68.0, 51.0, 44.0, 33.0, 35.0, 35.0, 20.0, 20.0, 10.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.033203125, -1.0024871826171875, -0.971771240234375, -0.9410552978515625, -0.91033935546875, -0.8796234130859375, -0.848907470703125, -0.8181915283203125, -0.7874755859375, -0.7567596435546875, -0.726043701171875, -0.6953277587890625, -0.66461181640625, -0.6338958740234375, -0.603179931640625, -0.5724639892578125, -0.541748046875, -0.5110321044921875, -0.480316162109375, -0.4496002197265625, -0.41888427734375, -0.3881683349609375, -0.357452392578125, -0.3267364501953125, -0.2960205078125, -0.2653045654296875, -0.234588623046875, -0.2038726806640625, -0.17315673828125, -0.1424407958984375, -0.111724853515625, -0.0810089111328125, -0.05029296875, -0.0195770263671875, 0.011138916015625, 0.0418548583984375, 0.07257080078125, 0.1032867431640625, 0.134002685546875, 0.1647186279296875, 0.1954345703125, 0.2261505126953125, 0.256866455078125, 0.2875823974609375, 0.31829833984375, 0.3490142822265625, 0.379730224609375, 0.4104461669921875, 0.441162109375, 0.4718780517578125, 0.502593994140625, 0.5333099365234375, 0.56402587890625, 0.5947418212890625, 0.625457763671875, 0.6561737060546875, 0.6868896484375, 0.7176055908203125, 0.748321533203125, 0.7790374755859375, 0.80975341796875, 0.8404693603515625, 0.871185302734375, 0.9019012451171875, 0.9326171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 11.0, 18.0, 28.0, 42.0, 55.0, 82.0, 125.0, 198.0, 335.0, 651.0, 1397.0, 3369.0, 15184.0, 805484.0, 3330768.0, 28126.0, 4833.0, 1685.0, 758.0, 428.0, 224.0, 137.0, 94.0, 70.0, 45.0, 24.0, 18.0, 12.0, 14.0, 10.0, 5.0, 3.0, 2.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.69140625, -4.553955078125, -4.41650390625, -4.279052734375, -4.1416015625, -4.004150390625, -3.86669921875, -3.729248046875, -3.591796875, -3.454345703125, -3.31689453125, -3.179443359375, -3.0419921875, -2.904541015625, -2.76708984375, -2.629638671875, -2.4921875, -2.354736328125, -2.21728515625, -2.079833984375, -1.9423828125, -1.804931640625, -1.66748046875, -1.530029296875, -1.392578125, -1.255126953125, -1.11767578125, -0.980224609375, -0.8427734375, -0.705322265625, -0.56787109375, -0.430419921875, -0.29296875, -0.155517578125, -0.01806640625, 0.119384765625, 0.2568359375, 0.394287109375, 0.53173828125, 0.669189453125, 0.806640625, 0.944091796875, 1.08154296875, 1.218994140625, 1.3564453125, 1.493896484375, 1.63134765625, 1.768798828125, 1.90625, 2.043701171875, 2.18115234375, 2.318603515625, 2.4560546875, 2.593505859375, 2.73095703125, 2.868408203125, 3.005859375, 3.143310546875, 3.28076171875, 3.418212890625, 3.5556640625, 3.693115234375, 3.83056640625, 3.968017578125, 4.10546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 3.0, 7.0, 12.0, 20.0, 26.0, 52.0, 71.0, 120.0, 169.0, 277.0, 471.0, 624.0, 753.0, 539.0, 333.0, 226.0, 140.0, 78.0, 50.0, 36.0, 16.0, 19.0, 12.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -1.993377685546875, -1.89495849609375, -1.796539306640625, -1.6981201171875, -1.599700927734375, -1.50128173828125, -1.402862548828125, -1.304443359375, -1.206024169921875, -1.10760498046875, -1.009185791015625, -0.9107666015625, -0.812347412109375, -0.71392822265625, -0.615509033203125, -0.51708984375, -0.418670654296875, -0.32025146484375, -0.221832275390625, -0.1234130859375, -0.024993896484375, 0.07342529296875, 0.171844482421875, 0.270263671875, 0.368682861328125, 0.46710205078125, 0.565521240234375, 0.6639404296875, 0.762359619140625, 0.86077880859375, 0.959197998046875, 1.0576171875, 1.156036376953125, 1.25445556640625, 1.352874755859375, 1.4512939453125, 1.549713134765625, 1.64813232421875, 1.746551513671875, 1.844970703125, 1.943389892578125, 2.04180908203125, 2.140228271484375, 2.2386474609375, 2.337066650390625, 2.43548583984375, 2.533905029296875, 2.63232421875, 2.730743408203125, 2.82916259765625, 2.927581787109375, 3.0260009765625, 3.124420166015625, 3.22283935546875, 3.321258544921875, 3.419677734375, 3.518096923828125, 3.61651611328125, 3.714935302734375, 3.8133544921875, 3.911773681640625, 4.01019287109375, 4.108612060546875, 4.20703125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 3.0, 6.0, 10.0, 12.0, 13.0, 20.0, 40.0, 56.0, 111.0, 148.0, 149.0, 155.0, 102.0, 67.0, 29.0, 24.0, 8.0, 12.0, 6.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.542396545410156, -17.761537551879883, -16.980680465698242, -16.19982147216797, -15.418964385986328, -14.638105392456055, -13.857247352600098, -13.07638931274414, -12.295531272888184, -11.514673233032227, -10.73381519317627, -9.952957153320312, -9.172098159790039, -8.391241073608398, -7.610382080078125, -6.829524040222168, -6.048666000366211, -5.267807960510254, -4.486949920654297, -3.7060914039611816, -2.9252333641052246, -2.1443753242492676, -1.3635168075561523, -0.5826587677001953, 0.19819927215576172, 0.9790574312210083, 1.7599155902862549, 2.540773868560791, 3.321631908416748, 4.102489948272705, 4.88334846496582, 5.664206504821777, 6.445064544677734, 7.225922584533691, 8.006780624389648, 8.787639617919922, 9.568496704101562, 10.349355697631836, 11.130213737487793, 11.91107177734375, 12.691929817199707, 13.472787857055664, 14.253645896911621, 15.034503936767578, 15.815362930297852, 16.596220016479492, 17.377079010009766, 18.157936096191406, 18.93879508972168, 19.719654083251953, 20.500511169433594, 21.281370162963867, 22.062227249145508, 22.84308624267578, 23.623943328857422, 24.404802322387695, 25.18566131591797, 25.966520309448242, 26.747377395629883, 27.528236389160156, 28.309093475341797, 29.08995246887207, 29.870811462402344, 30.651668548583984, 31.432525634765625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 8.0, 11.0, 12.0, 19.0, 17.0, 25.0, 24.0, 28.0, 32.0, 49.0, 48.0, 58.0, 57.0, 78.0, 77.0, 73.0, 50.0, 58.0, 42.0, 40.0, 34.0, 34.0, 31.0, 21.0, 17.0, 17.0, 11.0, 11.0, 3.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-19.986719131469727, -19.46503448486328, -18.943347930908203, -18.421663284301758, -17.899978637695312, -17.378293991088867, -16.856609344482422, -16.334922790527344, -15.813238143920898, -15.291553497314453, -14.769867897033691, -14.24818229675293, -13.726497650146484, -13.204813003540039, -12.683127403259277, -12.161441802978516, -11.63975715637207, -11.118072509765625, -10.596386909484863, -10.074701309204102, -9.553016662597656, -9.031332015991211, -8.50964641571045, -7.987961292266846, -7.466276168823242, -6.944591045379639, -6.422905921936035, -5.901220798492432, -5.379535675048828, -4.857850551605225, -4.336165428161621, -3.8144803047180176, -3.2927932739257812, -2.7711081504821777, -2.249423027038574, -1.7277379035949707, -1.2060527801513672, -0.6843676567077637, -0.16268253326416016, 0.35900259017944336, 0.8806877136230469, 1.4023728370666504, 1.924057960510254, 2.4457430839538574, 2.967428207397461, 3.4891133308410645, 4.010798454284668, 4.5324835777282715, 5.054168701171875, 5.5758538246154785, 6.097538948059082, 6.6192240715026855, 7.140909194946289, 7.662594318389893, 8.184279441833496, 8.705965042114258, 9.227649688720703, 9.749334335327148, 10.27101993560791, 10.792705535888672, 11.314390182495117, 11.836074829101562, 12.357760429382324, 12.879446029663086, 13.401130676269531]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 5.0, 11.0, 12.0, 16.0, 26.0, 44.0, 64.0, 91.0, 186.0, 328.0, 584.0, 1239.0, 2754.0, 7103.0, 22062.0, 103008.0, 647099.0, 208863.0, 37366.0, 10425.0, 3812.0, 1715.0, 749.0, 405.0, 208.0, 133.0, 85.0, 60.0, 35.0, 13.0, 10.0, 9.0, 7.0, 3.0, 4.0, 8.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6220703125, -1.5708770751953125, -1.519683837890625, -1.4684906005859375, -1.41729736328125, -1.3661041259765625, -1.314910888671875, -1.2637176513671875, -1.2125244140625, -1.1613311767578125, -1.110137939453125, -1.0589447021484375, -1.00775146484375, -0.9565582275390625, -0.905364990234375, -0.8541717529296875, -0.802978515625, -0.7517852783203125, -0.700592041015625, -0.6493988037109375, -0.59820556640625, -0.5470123291015625, -0.495819091796875, -0.4446258544921875, -0.3934326171875, -0.3422393798828125, -0.291046142578125, -0.2398529052734375, -0.18865966796875, -0.1374664306640625, -0.086273193359375, -0.0350799560546875, 0.01611328125, 0.0673065185546875, 0.118499755859375, 0.1696929931640625, 0.22088623046875, 0.2720794677734375, 0.323272705078125, 0.3744659423828125, 0.4256591796875, 0.4768524169921875, 0.528045654296875, 0.5792388916015625, 0.63043212890625, 0.6816253662109375, 0.732818603515625, 0.7840118408203125, 0.835205078125, 0.8863983154296875, 0.937591552734375, 0.9887847900390625, 1.03997802734375, 1.0911712646484375, 1.142364501953125, 1.1935577392578125, 1.2447509765625, 1.2959442138671875, 1.347137451171875, 1.3983306884765625, 1.44952392578125, 1.5007171630859375, 1.551910400390625, 1.6031036376953125, 1.654296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 8.0, 15.0, 21.0, 30.0, 33.0, 32.0, 38.0, 60.0, 59.0, 65.0, 89.0, 76.0, 79.0, 67.0, 78.0, 52.0, 57.0, 29.0, 29.0, 16.0, 18.0, 7.0, 10.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97998046875, -0.9381942749023438, -0.8964080810546875, -0.8546218872070312, -0.812835693359375, -0.7710494995117188, -0.7292633056640625, -0.6874771118164062, -0.64569091796875, -0.6039047241210938, -0.5621185302734375, -0.5203323364257812, -0.478546142578125, -0.43675994873046875, -0.3949737548828125, -0.35318756103515625, -0.3114013671875, -0.26961517333984375, -0.2278289794921875, -0.18604278564453125, -0.144256591796875, -0.10247039794921875, -0.0606842041015625, -0.01889801025390625, 0.02288818359375, 0.06467437744140625, 0.1064605712890625, 0.14824676513671875, 0.190032958984375, 0.23181915283203125, 0.2736053466796875, 0.31539154052734375, 0.357177734375, 0.39896392822265625, 0.4407501220703125, 0.48253631591796875, 0.524322509765625, 0.5661087036132812, 0.6078948974609375, 0.6496810913085938, 0.69146728515625, 0.7332534790039062, 0.7750396728515625, 0.8168258666992188, 0.858612060546875, 0.9003982543945312, 0.9421844482421875, 0.9839706420898438, 1.0257568359375, 1.0675430297851562, 1.1093292236328125, 1.1511154174804688, 1.192901611328125, 1.2346878051757812, 1.2764739990234375, 1.3182601928710938, 1.36004638671875, 1.4018325805664062, 1.4436187744140625, 1.4854049682617188, 1.527191162109375, 1.5689773559570312, 1.6107635498046875, 1.6525497436523438, 1.6943359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 12.0, 9.0, 18.0, 23.0, 16.0, 38.0, 74.0, 90.0, 159.0, 275.0, 564.0, 1422.0, 6433.0, 86486.0, 920026.0, 27400.0, 3420.0, 1023.0, 436.0, 224.0, 127.0, 87.0, 51.0, 38.0, 27.0, 11.0, 13.0, 11.0, 7.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5390625, -2.455291748046875, -2.37152099609375, -2.287750244140625, -2.2039794921875, -2.120208740234375, -2.03643798828125, -1.952667236328125, -1.868896484375, -1.785125732421875, -1.70135498046875, -1.617584228515625, -1.5338134765625, -1.450042724609375, -1.36627197265625, -1.282501220703125, -1.19873046875, -1.114959716796875, -1.03118896484375, -0.947418212890625, -0.8636474609375, -0.779876708984375, -0.69610595703125, -0.612335205078125, -0.528564453125, -0.444793701171875, -0.36102294921875, -0.277252197265625, -0.1934814453125, -0.109710693359375, -0.02593994140625, 0.057830810546875, 0.1416015625, 0.225372314453125, 0.30914306640625, 0.392913818359375, 0.4766845703125, 0.560455322265625, 0.64422607421875, 0.727996826171875, 0.811767578125, 0.895538330078125, 0.97930908203125, 1.063079833984375, 1.1468505859375, 1.230621337890625, 1.31439208984375, 1.398162841796875, 1.48193359375, 1.565704345703125, 1.64947509765625, 1.733245849609375, 1.8170166015625, 1.900787353515625, 1.98455810546875, 2.068328857421875, 2.152099609375, 2.235870361328125, 2.31964111328125, 2.403411865234375, 2.4871826171875, 2.570953369140625, 2.65472412109375, 2.738494873046875, 2.822265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 12.0, 7.0, 8.0, 10.0, 4.0, 7.0, 18.0, 15.0, 27.0, 34.0, 34.0, 47.0, 59.0, 79.0, 74.0, 92.0, 77.0, 68.0, 59.0, 47.0, 33.0, 34.0, 36.0, 11.0, 24.0, 17.0, 12.0, 11.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.53125, -4.4041748046875, -4.277099609375, -4.1500244140625, -4.02294921875, -3.8958740234375, -3.768798828125, -3.6417236328125, -3.5146484375, -3.3875732421875, -3.260498046875, -3.1334228515625, -3.00634765625, -2.8792724609375, -2.752197265625, -2.6251220703125, -2.498046875, -2.3709716796875, -2.243896484375, -2.1168212890625, -1.98974609375, -1.8626708984375, -1.735595703125, -1.6085205078125, -1.4814453125, -1.3543701171875, -1.227294921875, -1.1002197265625, -0.97314453125, -0.8460693359375, -0.718994140625, -0.5919189453125, -0.46484375, -0.3377685546875, -0.210693359375, -0.0836181640625, 0.04345703125, 0.1705322265625, 0.297607421875, 0.4246826171875, 0.5517578125, 0.6788330078125, 0.805908203125, 0.9329833984375, 1.06005859375, 1.1871337890625, 1.314208984375, 1.4412841796875, 1.568359375, 1.6954345703125, 1.822509765625, 1.9495849609375, 2.07666015625, 2.2037353515625, 2.330810546875, 2.4578857421875, 2.5849609375, 2.7120361328125, 2.839111328125, 2.9661865234375, 3.09326171875, 3.2203369140625, 3.347412109375, 3.4744873046875, 3.6015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 24.0, 50.0, 90.0, 197.0, 400.0, 1116.0, 4497.0, 39464.0, 949375.0, 46394.0, 4900.0, 1245.0, 409.0, 154.0, 93.0, 43.0, 38.0, 17.0, 13.0, 13.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357421875, -0.33911895751953125, -0.3208160400390625, -0.30251312255859375, -0.284210205078125, -0.26590728759765625, -0.2476043701171875, -0.22930145263671875, -0.21099853515625, -0.19269561767578125, -0.1743927001953125, -0.15608978271484375, -0.137786865234375, -0.11948394775390625, -0.1011810302734375, -0.08287811279296875, -0.0645751953125, -0.04627227783203125, -0.0279693603515625, -0.00966644287109375, 0.008636474609375, 0.02693939208984375, 0.0452423095703125, 0.06354522705078125, 0.08184814453125, 0.10015106201171875, 0.1184539794921875, 0.13675689697265625, 0.155059814453125, 0.17336273193359375, 0.1916656494140625, 0.20996856689453125, 0.228271484375, 0.24657440185546875, 0.2648773193359375, 0.28318023681640625, 0.301483154296875, 0.31978607177734375, 0.3380889892578125, 0.35639190673828125, 0.37469482421875, 0.39299774169921875, 0.4113006591796875, 0.42960357666015625, 0.447906494140625, 0.46620941162109375, 0.4845123291015625, 0.5028152465820312, 0.5211181640625, 0.5394210815429688, 0.5577239990234375, 0.5760269165039062, 0.594329833984375, 0.6126327514648438, 0.6309356689453125, 0.6492385864257812, 0.66754150390625, 0.6858444213867188, 0.7041473388671875, 0.7224502563476562, 0.740753173828125, 0.7590560913085938, 0.7773590087890625, 0.7956619262695312, 0.81396484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 8.0, 7.0, 16.0, 19.0, 26.0, 52.0, 60.0, 139.0, 204.0, 171.0, 98.0, 67.0, 41.0, 34.0, 15.0, 11.0, 9.0, 7.0, 8.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001138448715209961, -0.00010922178626060486, -0.00010459870100021362, -9.997561573982239e-05, -9.535253047943115e-05, -9.072944521903992e-05, -8.610635995864868e-05, -8.148327469825745e-05, -7.686018943786621e-05, -7.223710417747498e-05, -6.761401891708374e-05, -6.29909336566925e-05, -5.836784839630127e-05, -5.3744763135910034e-05, -4.91216778755188e-05, -4.4498592615127563e-05, -3.987550735473633e-05, -3.525242209434509e-05, -3.062933683395386e-05, -2.6006251573562622e-05, -2.1383166313171387e-05, -1.676008105278015e-05, -1.2136995792388916e-05, -7.513910531997681e-06, -2.8908252716064453e-06, 1.73225998878479e-06, 6.355345249176025e-06, 1.097843050956726e-05, 1.5601515769958496e-05, 2.022460103034973e-05, 2.4847686290740967e-05, 2.9470771551132202e-05, 3.409385681152344e-05, 3.871694207191467e-05, 4.334002733230591e-05, 4.7963112592697144e-05, 5.258619785308838e-05, 5.7209283113479614e-05, 6.183236837387085e-05, 6.645545363426208e-05, 7.107853889465332e-05, 7.570162415504456e-05, 8.032470941543579e-05, 8.494779467582703e-05, 8.957087993621826e-05, 9.41939651966095e-05, 9.881705045700073e-05, 0.00010344013571739197, 0.0001080632209777832, 0.00011268630623817444, 0.00011730939149856567, 0.00012193247675895691, 0.00012655556201934814, 0.00013117864727973938, 0.00013580173254013062, 0.00014042481780052185, 0.00014504790306091309, 0.00014967098832130432, 0.00015429407358169556, 0.0001589171588420868, 0.00016354024410247803, 0.00016816332936286926, 0.0001727864146232605, 0.00017740949988365173, 0.00018203258514404297]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 6.0, 8.0, 12.0, 16.0, 21.0, 47.0, 82.0, 169.0, 324.0, 649.0, 1666.0, 5229.0, 21971.0, 188074.0, 783976.0, 34883.0, 7513.0, 2241.0, 820.0, 391.0, 185.0, 98.0, 56.0, 48.0, 25.0, 6.0, 6.0, 11.0, 8.0, 0.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3662109375, -0.3544464111328125, -0.342681884765625, -0.3309173583984375, -0.31915283203125, -0.3073883056640625, -0.295623779296875, -0.2838592529296875, -0.2720947265625, -0.2603302001953125, -0.248565673828125, -0.2368011474609375, -0.22503662109375, -0.2132720947265625, -0.201507568359375, -0.1897430419921875, -0.177978515625, -0.1662139892578125, -0.154449462890625, -0.1426849365234375, -0.13092041015625, -0.1191558837890625, -0.107391357421875, -0.0956268310546875, -0.0838623046875, -0.0720977783203125, -0.060333251953125, -0.0485687255859375, -0.03680419921875, -0.0250396728515625, -0.013275146484375, -0.0015106201171875, 0.01025390625, 0.0220184326171875, 0.033782958984375, 0.0455474853515625, 0.05731201171875, 0.0690765380859375, 0.080841064453125, 0.0926055908203125, 0.1043701171875, 0.1161346435546875, 0.127899169921875, 0.1396636962890625, 0.15142822265625, 0.1631927490234375, 0.174957275390625, 0.1867218017578125, 0.198486328125, 0.2102508544921875, 0.222015380859375, 0.2337799072265625, 0.24554443359375, 0.2573089599609375, 0.269073486328125, 0.2808380126953125, 0.2926025390625, 0.3043670654296875, 0.316131591796875, 0.3278961181640625, 0.33966064453125, 0.3514251708984375, 0.363189697265625, 0.3749542236328125, 0.38671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 7.0, 12.0, 10.0, 12.0, 25.0, 41.0, 47.0, 70.0, 101.0, 108.0, 115.0, 102.0, 95.0, 72.0, 53.0, 39.0, 25.0, 15.0, 8.0, 8.0, 7.0, 4.0, 5.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.50390625, -0.49108123779296875, -0.4782562255859375, -0.46543121337890625, -0.452606201171875, -0.43978118896484375, -0.4269561767578125, -0.41413116455078125, -0.40130615234375, -0.38848114013671875, -0.3756561279296875, -0.36283111572265625, -0.350006103515625, -0.33718109130859375, -0.3243560791015625, -0.31153106689453125, -0.2987060546875, -0.28588104248046875, -0.2730560302734375, -0.26023101806640625, -0.247406005859375, -0.23458099365234375, -0.2217559814453125, -0.20893096923828125, -0.19610595703125, -0.18328094482421875, -0.1704559326171875, -0.15763092041015625, -0.144805908203125, -0.13198089599609375, -0.1191558837890625, -0.10633087158203125, -0.093505859375, -0.08068084716796875, -0.0678558349609375, -0.05503082275390625, -0.042205810546875, -0.02938079833984375, -0.0165557861328125, -0.00373077392578125, 0.00909423828125, 0.02191925048828125, 0.0347442626953125, 0.04756927490234375, 0.060394287109375, 0.07321929931640625, 0.0860443115234375, 0.09886932373046875, 0.1116943359375, 0.12451934814453125, 0.1373443603515625, 0.15016937255859375, 0.162994384765625, 0.17581939697265625, 0.1886444091796875, 0.20146942138671875, 0.21429443359375, 0.22711944580078125, 0.2399444580078125, 0.25276947021484375, 0.265594482421875, 0.27841949462890625, 0.2912445068359375, 0.30406951904296875, 0.31689453125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 24.0, 63.0, 265.0, 394.0, 168.0, 49.0, 13.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.317867279052734, -14.431597709655762, -13.545327186584473, -12.6590576171875, -11.772788047790527, -10.886518478393555, -10.000247955322266, -9.113978385925293, -8.22770881652832, -7.3414387702941895, -6.455169200897217, -5.568899154663086, -4.682629585266113, -3.7963595390319824, -2.9100894927978516, -2.023819923400879, -1.1375494003295898, -0.2512795329093933, 0.6349903345108032, 1.5212602615356445, 2.4075300693511963, 3.293799877166748, 4.180069923400879, 5.066339492797852, 5.952609539031982, 6.838879585266113, 7.725149154663086, 8.611419677734375, 9.497689247131348, 10.38395881652832, 11.27022933959961, 12.156497955322266, 13.042768478393555, 13.929038047790527, 14.815308570861816, 15.701578140258789, 16.587848663330078, 17.474117279052734, 18.360387802124023, 19.246658325195312, 20.13292694091797, 21.019197463989258, 21.905466079711914, 22.791736602783203, 23.678007125854492, 24.56427574157715, 25.450546264648438, 26.336814880371094, 27.223087310791016, 28.109357833862305, 28.99562644958496, 29.88189697265625, 30.76816749572754, 31.654436111450195, 32.540706634521484, 33.42697525024414, 34.3132438659668, 35.19951248168945, 36.085784912109375, 36.97205352783203, 37.85832214355469, 38.74459457397461, 39.630863189697266, 40.51713180541992, 41.403404235839844]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 9.0, 5.0, 19.0, 11.0, 11.0, 18.0, 22.0, 23.0, 42.0, 56.0, 55.0, 80.0, 52.0, 43.0, 34.0, 44.0, 35.0, 44.0, 54.0, 79.0, 50.0, 40.0, 31.0, 19.0, 16.0, 11.0, 12.0, 14.0, 5.0, 9.0, 4.0, 7.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.57175064086914, -8.276681900024414, -7.981612682342529, -7.686543941497803, -7.391474723815918, -7.096405982971191, -6.801337242126465, -6.50626802444458, -6.211198806762695, -5.916130065917969, -5.621060848236084, -5.325992107391357, -5.030922889709473, -4.735854148864746, -4.4407854080200195, -4.145716190338135, -3.850647449493408, -3.5555784702301025, -3.260509490966797, -2.9654407501220703, -2.6703715324401855, -2.375302791595459, -2.0802338123321533, -1.7851648330688477, -1.490095853805542, -1.1950268745422363, -0.8999579548835754, -0.6048890352249146, -0.3098200559616089, -0.014751076698303223, 0.2803177833557129, 0.5753867626190186, 0.8704557418823242, 1.1655247211456299, 1.4605937004089355, 1.7556625604629517, 2.050731658935547, 2.3458003997802734, 2.640869379043579, 2.9359383583068848, 3.2310073375701904, 3.526076316833496, 3.8211452960968018, 4.116214275360107, 4.411283016204834, 4.706352233886719, 5.001420974731445, 5.296489715576172, 5.591558933258057, 5.886627674102783, 6.181696891784668, 6.4767656326293945, 6.771834850311279, 7.066903591156006, 7.361972808837891, 7.657041549682617, 7.952110290527344, 8.24717903137207, 8.542247772216797, 8.83731746673584, 9.132386207580566, 9.427454948425293, 9.72252368927002, 10.017593383789062, 10.312662124633789]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 8.0, 13.0, 11.0, 20.0, 18.0, 16.0, 18.0, 22.0, 33.0, 37.0, 38.0, 54.0, 189.0, 170.0, 68.0, 47.0, 39.0, 35.0, 34.0, 26.0, 25.0, 20.0, 10.0, 8.0, 3.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248046875, -0.89288330078125, -0.8609619140625, -0.82904052734375, -0.797119140625, -0.76519775390625, -0.7332763671875, -0.70135498046875, -0.66943359375, -0.63751220703125, -0.6055908203125, -0.57366943359375, -0.541748046875, -0.50982666015625, -0.4779052734375, -0.44598388671875, -0.4140625, -0.38214111328125, -0.3502197265625, -0.31829833984375, -0.286376953125, -0.25445556640625, -0.2225341796875, -0.19061279296875, -0.15869140625, -0.12677001953125, -0.0948486328125, -0.06292724609375, -0.031005859375, 0.00091552734375, 0.0328369140625, 0.06475830078125, 0.0966796875, 0.12860107421875, 0.1605224609375, 0.19244384765625, 0.224365234375, 0.25628662109375, 0.2882080078125, 0.32012939453125, 0.35205078125, 0.38397216796875, 0.4158935546875, 0.44781494140625, 0.479736328125, 0.51165771484375, 0.5435791015625, 0.57550048828125, 0.607421875, 0.63934326171875, 0.6712646484375, 0.70318603515625, 0.735107421875, 0.76702880859375, 0.7989501953125, 0.83087158203125, 0.86279296875, 0.89471435546875, 0.9266357421875, 0.95855712890625, 0.990478515625, 1.02239990234375, 1.0543212890625, 1.08624267578125, 1.1181640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 11.0, 2.0, 12.0, 20.0, 23.0, 18.0, 36.0, 44.0, 78.0, 140.0, 289.0, 960.0, 4871.0, 8264847.0, 112195.0, 3584.0, 821.0, 265.0, 140.0, 67.0, 38.0, 33.0, 18.0, 15.0, 10.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.571640014648438, -10.229765892028809, -9.88789176940918, -9.54601764678955, -9.204143524169922, -8.862268447875977, -8.520394325256348, -8.178520202636719, -7.83664608001709, -7.494771957397461, -7.152897834777832, -6.811023235321045, -6.469149112701416, -6.127274990081787, -5.785400390625, -5.443526268005371, -5.101652145385742, -4.759778022766113, -4.417903900146484, -4.076029300689697, -3.7341551780700684, -3.3922810554504395, -3.0504066944122314, -2.7085323333740234, -2.3666582107543945, -2.0247840881347656, -1.6829097270965576, -1.3410354852676392, -0.9991612434387207, -0.6572870016098022, -0.3154127597808838, 0.02646160125732422, 0.36833667755126953, 0.710210919380188, 1.0520851612091064, 1.393959403038025, 1.7358336448669434, 2.0777077674865723, 2.4195821285247803, 2.7614564895629883, 3.103330612182617, 3.445204734802246, 3.787079095840454, 4.128953456878662, 4.470827579498291, 4.81270170211792, 5.154576301574707, 5.496450424194336, 5.838324546813965, 6.180198669433594, 6.522072792053223, 6.86394739151001, 7.205821514129639, 7.547695636749268, 7.889570236206055, 8.231444358825684, 8.573318481445312, 8.915192604064941, 9.25706672668457, 9.5989408493042, 9.940814971923828, 10.282690048217773, 10.624564170837402, 10.966438293457031, 11.30831241607666]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 4.0, 3.0, 5.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.34718894958496, -20.727449417114258, -20.107707977294922, -19.48796844482422, -18.868228912353516, -18.248489379882812, -17.628747940063477, -17.009008407592773, -16.389266967773438, -15.769526481628418, -15.149786949157715, -14.530046463012695, -13.910306930541992, -13.290566444396973, -12.670825958251953, -12.05108642578125, -11.431346893310547, -10.811606407165527, -10.191866874694824, -9.572126388549805, -8.952386856079102, -8.332646369934082, -7.7129058837890625, -7.093165874481201, -6.47342586517334, -5.8536858558654785, -5.233945846557617, -4.614205360412598, -3.9944653511047363, -3.374725341796875, -2.7549850940704346, -2.135244846343994, -1.5155048370361328, -0.8957647085189819, -0.27602458000183105, 0.3437155485153198, 0.9634556770324707, 1.583195686340332, 2.2029359340667725, 2.822676181793213, 3.442416191101074, 4.0621562004089355, 4.681896209716797, 5.301636695861816, 5.921376705169678, 6.541116714477539, 7.160857200622559, 7.78059720993042, 8.400337219238281, 9.0200777053833, 9.639817237854004, 10.259557723999023, 10.879297256469727, 11.499037742614746, 12.118778228759766, 12.738517761230469, 13.358258247375488, 13.977998733520508, 14.597738265991211, 15.21747875213623, 15.83721923828125, 16.456958770751953, 17.076698303222656, 17.696439743041992, 18.316179275512695]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 6.0, 6.0, 4.0, 11.0, 11.0, 17.0, 35.0, 41.0, 55.0, 51.0, 65.0, 78.0, 82.0, 100.0, 92.0, 73.0, 61.0, 63.0, 40.0, 37.0, 23.0, 16.0, 15.0, 8.0, 6.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7573089599609375, -0.735809326171875, -0.7143096923828125, -0.69281005859375, -0.6713104248046875, -0.649810791015625, -0.6283111572265625, -0.6068115234375, -0.5853118896484375, -0.563812255859375, -0.5423126220703125, -0.52081298828125, -0.4993133544921875, -0.477813720703125, -0.4563140869140625, -0.434814453125, -0.4133148193359375, -0.391815185546875, -0.3703155517578125, -0.34881591796875, -0.3273162841796875, -0.305816650390625, -0.2843170166015625, -0.2628173828125, -0.2413177490234375, -0.219818115234375, -0.1983184814453125, -0.17681884765625, -0.1553192138671875, -0.133819580078125, -0.1123199462890625, -0.0908203125, -0.0693206787109375, -0.047821044921875, -0.0263214111328125, -0.00482177734375, 0.0166778564453125, 0.038177490234375, 0.0596771240234375, 0.0811767578125, 0.1026763916015625, 0.124176025390625, 0.1456756591796875, 0.16717529296875, 0.1886749267578125, 0.210174560546875, 0.2316741943359375, 0.253173828125, 0.2746734619140625, 0.296173095703125, 0.3176727294921875, 0.33917236328125, 0.3606719970703125, 0.382171630859375, 0.4036712646484375, 0.4251708984375, 0.4466705322265625, 0.468170166015625, 0.4896697998046875, 0.51116943359375, 0.5326690673828125, 0.554168701171875, 0.5756683349609375, 0.59716796875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 10.0, 22.0, 41.0, 67.0, 104.0, 164.0, 266.0, 478.0, 999.0, 2232.0, 5545.0, 14589.0, 39114.0, 105669.0, 186991.0, 104236.0, 39030.0, 14551.0, 5450.0, 2346.0, 1024.0, 513.0, 272.0, 175.0, 112.0, 79.0, 40.0, 42.0, 25.0, 9.0, 16.0, 14.0, 7.0, 3.0, 9.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.076416015625, -3.90283203125, -3.729248046875, -3.5556640625, -3.382080078125, -3.20849609375, -3.034912109375, -2.861328125, -2.687744140625, -2.51416015625, -2.340576171875, -2.1669921875, -1.993408203125, -1.81982421875, -1.646240234375, -1.47265625, -1.299072265625, -1.12548828125, -0.951904296875, -0.7783203125, -0.604736328125, -0.43115234375, -0.257568359375, -0.083984375, 0.089599609375, 0.26318359375, 0.436767578125, 0.6103515625, 0.783935546875, 0.95751953125, 1.131103515625, 1.3046875, 1.478271484375, 1.65185546875, 1.825439453125, 1.9990234375, 2.172607421875, 2.34619140625, 2.519775390625, 2.693359375, 2.866943359375, 3.04052734375, 3.214111328125, 3.3876953125, 3.561279296875, 3.73486328125, 3.908447265625, 4.08203125, 4.255615234375, 4.42919921875, 4.602783203125, 4.7763671875, 4.949951171875, 5.12353515625, 5.297119140625, 5.470703125, 5.644287109375, 5.81787109375, 5.991455078125, 6.1650390625, 6.338623046875, 6.51220703125, 6.685791015625, 6.859375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 11.0, 11.0, 18.0, 18.0, 26.0, 33.0, 28.0, 44.0, 58.0, 50.0, 78.0, 80.0, 84.0, 68.0, 55.0, 66.0, 58.0, 40.0, 26.0, 24.0, 26.0, 18.0, 11.0, 12.0, 11.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9453125, -0.9126739501953125, -0.880035400390625, -0.8473968505859375, -0.81475830078125, -0.7821197509765625, -0.749481201171875, -0.7168426513671875, -0.6842041015625, -0.6515655517578125, -0.618927001953125, -0.5862884521484375, -0.55364990234375, -0.5210113525390625, -0.488372802734375, -0.4557342529296875, -0.423095703125, -0.3904571533203125, -0.357818603515625, -0.3251800537109375, -0.29254150390625, -0.2599029541015625, -0.227264404296875, -0.1946258544921875, -0.1619873046875, -0.1293487548828125, -0.096710205078125, -0.0640716552734375, -0.03143310546875, 0.0012054443359375, 0.033843994140625, 0.0664825439453125, 0.09912109375, 0.1317596435546875, 0.164398193359375, 0.1970367431640625, 0.22967529296875, 0.2623138427734375, 0.294952392578125, 0.3275909423828125, 0.3602294921875, 0.3928680419921875, 0.425506591796875, 0.4581451416015625, 0.49078369140625, 0.5234222412109375, 0.556060791015625, 0.5886993408203125, 0.621337890625, 0.6539764404296875, 0.686614990234375, 0.7192535400390625, 0.75189208984375, 0.7845306396484375, 0.817169189453125, 0.8498077392578125, 0.8824462890625, 0.9150848388671875, 0.947723388671875, 0.9803619384765625, 1.01300048828125, 1.0456390380859375, 1.078277587890625, 1.1109161376953125, 1.1435546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 4.0, 10.0, 14.0, 15.0, 35.0, 63.0, 70.0, 79.0, 60.0, 45.0, 29.0, 13.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.537603378295898, -6.334583282470703, -6.131563663482666, -5.928544044494629, -5.725523948669434, -5.522503852844238, -5.319484233856201, -5.116464614868164, -4.913444519042969, -4.710424423217773, -4.507404804229736, -4.304385185241699, -4.101365089416504, -3.8983452320098877, -3.6953253746032715, -3.4923055171966553, -3.289285659790039, -3.086265802383423, -2.8832459449768066, -2.6802260875701904, -2.477206230163574, -2.274186372756958, -2.071166515350342, -1.8681466579437256, -1.6651268005371094, -1.4621069431304932, -1.259087085723877, -1.0560672283172607, -0.8530473709106445, -0.6500275135040283, -0.4470076560974121, -0.2439877986907959, -0.040967464447021484, 0.16205239295959473, 0.36507225036621094, 0.5680921077728271, 0.7711119651794434, 0.9741318225860596, 1.1771516799926758, 1.380171537399292, 1.5831913948059082, 1.7862112522125244, 1.9892311096191406, 2.192250967025757, 2.395270824432373, 2.5982906818389893, 2.8013105392456055, 3.0043303966522217, 3.207350254058838, 3.410370111465454, 3.6133899688720703, 3.8164098262786865, 4.019429683685303, 4.22244930267334, 4.425469398498535, 4.6284894943237305, 4.831509113311768, 5.034528732299805, 5.237548828125, 5.440568923950195, 5.643588542938232, 5.8466081619262695, 6.049628257751465, 6.25264835357666, 6.455667972564697]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 11.0, 7.0, 16.0, 31.0, 49.0, 90.0, 90.0, 73.0, 35.0, 14.0, 12.0, 12.0, 5.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.248214244842529, -5.071316242218018, -4.894417762756348, -4.717519760131836, -4.540621757507324, -4.3637237548828125, -4.186825275421143, -4.009927272796631, -3.83302903175354, -3.656130790710449, -3.4792327880859375, -3.3023345470428467, -3.125436305999756, -2.948538303375244, -2.7716400623321533, -2.5947418212890625, -2.417843818664551, -2.24094557762146, -2.0640475749969482, -1.8871493339538574, -1.7102512121200562, -1.5333530902862549, -1.356454849243164, -1.1795567274093628, -1.0026586055755615, -0.8257604837417603, -0.6488623023033142, -0.47196412086486816, -0.2950659990310669, -0.11816787719726562, 0.058730363845825195, 0.23562848567962646, 0.41252613067626953, 0.5894242525100708, 0.7663224339485168, 0.9432206153869629, 1.1201187372207642, 1.2970168590545654, 1.4739151000976562, 1.6508132219314575, 1.8277113437652588, 2.0046095848083496, 2.1815075874328613, 2.358405828475952, 2.535304069519043, 2.7122020721435547, 2.8891003131866455, 3.0659985542297363, 3.242896556854248, 3.419794797897339, 3.5966928005218506, 3.7735910415649414, 3.950489044189453, 4.127387046813965, 4.304285526275635, 4.4811835289001465, 4.658082008361816, 4.834980010986328, 5.011878490447998, 5.18877649307251, 5.3656744956970215, 5.542572975158691, 5.719470977783203, 5.896368980407715, 6.073266983032227]}, "eval/loss": 4.240406036376953, "eval/wer": 1.8401428004760016, "eval/runtime": 1267.491, "eval/samples_per_second": 2.084, "eval/steps_per_second": 0.261} \ No newline at end of file +{"train/loss": 2.9073, "train/learning_rate": 8.831353919239906e-05, "train/epoch": 3.33, "train/global_step": 2971, "_runtime": 19442, "_timestamp": 1647554716, "_step": 2971, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 13.0, 23.0, 55.0, 94.0, 146.0, 173.0, 189.0, 145.0, 85.0, 37.0, 19.0, 9.0, 3.0, 9.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-114.22661590576172, -111.75013732910156, -109.27365112304688, -106.79717254638672, -104.32069396972656, -101.84420776367188, -99.36772918701172, -96.89125061035156, -94.41476440429688, -91.93828582763672, -89.46179962158203, -86.98532104492188, -84.50883483886719, -82.03235626220703, -79.55587768554688, -77.07939147949219, -74.60291290283203, -72.12643432617188, -69.64994812011719, -67.17346954345703, -64.69699096679688, -62.22050476074219, -59.74402618408203, -57.26754379272461, -54.79106140136719, -52.314579010009766, -49.838096618652344, -47.36161804199219, -44.885135650634766, -42.408653259277344, -39.93217468261719, -37.455692291259766, -34.979217529296875, -32.50273513793945, -30.026254653930664, -27.549774169921875, -25.073291778564453, -22.59680938720703, -20.120328903198242, -17.643848419189453, -15.167366027832031, -12.690884590148926, -10.21440315246582, -7.737921714782715, -5.261440277099609, -2.784958839416504, -0.30847740173339844, 2.1680030822753906, 4.6444854736328125, 7.120966911315918, 9.597448348999023, 12.073929786682129, 14.550411224365234, 17.026893615722656, 19.503374099731445, 21.979854583740234, 24.456336975097656, 26.932819366455078, 29.409299850463867, 31.885780334472656, 34.36226272583008, 36.8387451171875, 39.315223693847656, 41.79170608520508, 44.2681884765625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 14.0, 11.0, 14.0, 10.0, 34.0, 38.0, 57.0, 64.0, 72.0, 83.0, 95.0, 82.0, 64.0, 58.0, 59.0, 58.0, 40.0, 27.0, 37.0, 18.0, 16.0, 7.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-103.64295196533203, -100.50665283203125, -97.370361328125, -94.23406219482422, -91.09777069091797, -87.96147155761719, -84.82518005371094, -81.68888092041016, -78.55258178710938, -75.4162826538086, -72.27999114990234, -69.14369201660156, -66.00740051269531, -62.87110137939453, -59.734806060791016, -56.5985107421875, -53.46221923828125, -50.325923919677734, -47.18962860107422, -44.05332946777344, -40.91703796386719, -37.780738830566406, -34.64444351196289, -31.508148193359375, -28.37185287475586, -25.235557556152344, -22.099262237548828, -18.96296501159668, -15.826669692993164, -12.690374374389648, -9.5540771484375, -6.417781829833984, -3.2814788818359375, -0.14518308639526367, 2.99111270904541, 6.127408981323242, 9.263704299926758, 12.399999618530273, 15.536296844482422, 18.672592163085938, 21.808887481689453, 24.94518280029297, 28.081478118896484, 31.217775344848633, 34.35407257080078, 37.49036407470703, 40.62666320800781, 43.76295852661133, 46.899253845214844, 50.03554916381836, 53.171844482421875, 56.308143615722656, 59.444435119628906, 62.58073425292969, 65.71702575683594, 68.85332489013672, 71.9896240234375, 75.12592315673828, 78.26221466064453, 81.39851379394531, 84.53480529785156, 87.67110443115234, 90.80740356445312, 93.94369506835938, 97.07998657226562]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 12.0, 6.0, 18.0, 17.0, 23.0, 29.0, 31.0, 57.0, 65.0, 61.0, 61.0, 60.0, 70.0, 69.0, 62.0, 52.0, 57.0, 53.0, 23.0, 35.0, 24.0, 33.0, 14.0, 25.0, 7.0, 4.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.87109375, -4.73046875, -4.58984375, -4.44921875, -4.30859375, -4.16796875, -4.02734375, -3.88671875, -3.74609375, -3.60546875, -3.46484375, -3.32421875, -3.18359375, -3.04296875, -2.90234375, -2.76171875, -2.62109375, -2.48046875, -2.33984375, -2.19921875, -2.05859375, -1.91796875, -1.77734375, -1.63671875, -1.49609375, -1.35546875, -1.21484375, -1.07421875, -0.93359375, -0.79296875, -0.65234375, -0.51171875, -0.37109375, -0.23046875, -0.08984375, 0.05078125, 0.19140625, 0.33203125, 0.47265625, 0.61328125, 0.75390625, 0.89453125, 1.03515625, 1.17578125, 1.31640625, 1.45703125, 1.59765625, 1.73828125, 1.87890625, 2.01953125, 2.16015625, 2.30078125, 2.44140625, 2.58203125, 2.72265625, 2.86328125, 3.00390625, 3.14453125, 3.28515625, 3.42578125, 3.56640625, 3.70703125, 3.84765625, 3.98828125, 4.12890625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 5.0, 8.0, 8.0, 13.0, 15.0, 22.0, 38.0, 44.0, 80.0, 91.0, 174.0, 332.0, 532.0, 965.0, 1770.0, 3720.0, 10185.0, 60492.0, 1051006.0, 2856963.0, 177978.0, 18947.0, 5387.0, 2409.0, 1210.0, 695.0, 447.0, 258.0, 148.0, 123.0, 66.0, 56.0, 26.0, 23.0, 13.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.828125, -16.3056640625, -15.783203125, -15.2607421875, -14.73828125, -14.2158203125, -13.693359375, -13.1708984375, -12.6484375, -12.1259765625, -11.603515625, -11.0810546875, -10.55859375, -10.0361328125, -9.513671875, -8.9912109375, -8.46875, -7.9462890625, -7.423828125, -6.9013671875, -6.37890625, -5.8564453125, -5.333984375, -4.8115234375, -4.2890625, -3.7666015625, -3.244140625, -2.7216796875, -2.19921875, -1.6767578125, -1.154296875, -0.6318359375, -0.109375, 0.4130859375, 0.935546875, 1.4580078125, 1.98046875, 2.5029296875, 3.025390625, 3.5478515625, 4.0703125, 4.5927734375, 5.115234375, 5.6376953125, 6.16015625, 6.6826171875, 7.205078125, 7.7275390625, 8.25, 8.7724609375, 9.294921875, 9.8173828125, 10.33984375, 10.8623046875, 11.384765625, 11.9072265625, 12.4296875, 12.9521484375, 13.474609375, 13.9970703125, 14.51953125, 15.0419921875, 15.564453125, 16.0869140625, 16.609375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 5.0, 3.0, 9.0, 8.0, 23.0, 33.0, 48.0, 65.0, 112.0, 149.0, 272.0, 373.0, 508.0, 623.0, 557.0, 437.0, 273.0, 184.0, 139.0, 84.0, 55.0, 41.0, 24.0, 14.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 6.0, 0.0, 0.0, 3.0], "bins": [-21.46875, -20.964599609375, -20.46044921875, -19.956298828125, -19.4521484375, -18.947998046875, -18.44384765625, -17.939697265625, -17.435546875, -16.931396484375, -16.42724609375, -15.923095703125, -15.4189453125, -14.914794921875, -14.41064453125, -13.906494140625, -13.40234375, -12.898193359375, -12.39404296875, -11.889892578125, -11.3857421875, -10.881591796875, -10.37744140625, -9.873291015625, -9.369140625, -8.864990234375, -8.36083984375, -7.856689453125, -7.3525390625, -6.848388671875, -6.34423828125, -5.840087890625, -5.3359375, -4.831787109375, -4.32763671875, -3.823486328125, -3.3193359375, -2.815185546875, -2.31103515625, -1.806884765625, -1.302734375, -0.798583984375, -0.29443359375, 0.209716796875, 0.7138671875, 1.218017578125, 1.72216796875, 2.226318359375, 2.73046875, 3.234619140625, 3.73876953125, 4.242919921875, 4.7470703125, 5.251220703125, 5.75537109375, 6.259521484375, 6.763671875, 7.267822265625, 7.77197265625, 8.276123046875, 8.7802734375, 9.284423828125, 9.78857421875, 10.292724609375, 10.796875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 8.0, 13.0, 16.0, 16.0, 15.0, 30.0, 39.0, 89.0, 149.0, 309.0, 706.0, 1664.0, 7476.0, 339203.0, 3790244.0, 48340.0, 3725.0, 1201.0, 486.0, 238.0, 139.0, 70.0, 34.0, 25.0, 8.0, 11.0, 13.0, 14.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.09375, -57.2646484375, -55.435546875, -53.6064453125, -51.77734375, -49.9482421875, -48.119140625, -46.2900390625, -44.4609375, -42.6318359375, -40.802734375, -38.9736328125, -37.14453125, -35.3154296875, -33.486328125, -31.6572265625, -29.828125, -27.9990234375, -26.169921875, -24.3408203125, -22.51171875, -20.6826171875, -18.853515625, -17.0244140625, -15.1953125, -13.3662109375, -11.537109375, -9.7080078125, -7.87890625, -6.0498046875, -4.220703125, -2.3916015625, -0.5625, 1.2666015625, 3.095703125, 4.9248046875, 6.75390625, 8.5830078125, 10.412109375, 12.2412109375, 14.0703125, 15.8994140625, 17.728515625, 19.5576171875, 21.38671875, 23.2158203125, 25.044921875, 26.8740234375, 28.703125, 30.5322265625, 32.361328125, 34.1904296875, 36.01953125, 37.8486328125, 39.677734375, 41.5068359375, 43.3359375, 45.1650390625, 46.994140625, 48.8232421875, 50.65234375, 52.4814453125, 54.310546875, 56.1396484375, 57.96875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 19.0, 234.0, 540.0, 198.0, 20.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-362.0631408691406, -355.2765808105469, -348.49005126953125, -341.7034912109375, -334.91693115234375, -328.13037109375, -321.34381103515625, -314.5572814941406, -307.7707214355469, -300.9841613769531, -294.1976318359375, -287.41107177734375, -280.62451171875, -273.83795166015625, -267.0513916015625, -260.2648620605469, -253.47830200195312, -246.69174194335938, -239.9051971435547, -233.11865234375, -226.33209228515625, -219.5455322265625, -212.7589874267578, -205.97244262695312, -199.18588256835938, -192.39932250976562, -185.61277770996094, -178.82623291015625, -172.0396728515625, -165.25311279296875, -158.46656799316406, -151.68002319335938, -144.89346313476562, -138.10690307617188, -131.3203582763672, -124.53380584716797, -117.74725341796875, -110.96070098876953, -104.17414855957031, -97.3875961303711, -90.6010513305664, -83.81449890136719, -77.02794647216797, -70.24139404296875, -63.45484161376953, -56.66828918457031, -49.881736755371094, -43.095184326171875, -36.308631896972656, -29.522079467773438, -22.73552703857422, -15.948974609375, -9.162422180175781, -2.3758697509765625, 4.410682678222656, 11.197235107421875, 17.983787536621094, 24.770339965820312, 31.55689239501953, 38.34344482421875, 45.12999725341797, 51.91654968261719, 58.703102111816406, 65.48965454101562, 72.27620697021484]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 7.0, 11.0, 14.0, 9.0, 12.0, 26.0, 26.0, 32.0, 37.0, 45.0, 39.0, 51.0, 38.0, 53.0, 54.0, 39.0, 42.0, 46.0, 40.0, 57.0, 35.0, 44.0, 34.0, 35.0, 31.0, 25.0, 25.0, 26.0, 9.0, 8.0, 10.0, 9.0, 8.0, 5.0, 5.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-72.1844482421875, -70.28089904785156, -68.3773422241211, -66.47379302978516, -64.57024383544922, -62.666690826416016, -60.76313781738281, -58.859588623046875, -56.95603942871094, -55.052486419677734, -53.1489372253418, -51.245384216308594, -49.341835021972656, -47.43828201293945, -45.53472900390625, -43.63117980957031, -41.72762680053711, -39.824073791503906, -37.92052459716797, -36.016971588134766, -34.11342239379883, -32.209869384765625, -30.306318283081055, -28.402767181396484, -26.499216079711914, -24.595664978027344, -22.692113876342773, -20.788562774658203, -18.885009765625, -16.981460571289062, -15.07790756225586, -13.174356460571289, -11.270805358886719, -9.367254257202148, -7.46370267868042, -5.560151100158691, -3.656599998474121, -1.7530488967895508, 0.15050315856933594, 2.0540542602539062, 3.9576053619384766, 5.861156463623047, 7.764708042144775, 9.668259620666504, 11.571810722351074, 13.475361824035645, 15.378913879394531, 17.2824649810791, 19.186016082763672, 21.089567184448242, 22.993118286132812, 24.896671295166016, 26.800220489501953, 28.703773498535156, 30.607324600219727, 32.5108757019043, 34.4144287109375, 36.3179817199707, 38.22153091430664, 40.125083923339844, 42.02863311767578, 43.932186126708984, 45.83573913574219, 47.739288330078125, 49.64283752441406]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 9.0, 7.0, 14.0, 13.0, 12.0, 27.0, 20.0, 39.0, 31.0, 38.0, 50.0, 45.0, 57.0, 53.0, 68.0, 64.0, 51.0, 51.0, 44.0, 43.0, 38.0, 38.0, 38.0, 26.0, 33.0, 21.0, 16.0, 9.0, 6.0, 9.0, 10.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.23828125, -4.114166259765625, -3.99005126953125, -3.865936279296875, -3.7418212890625, -3.617706298828125, -3.49359130859375, -3.369476318359375, -3.245361328125, -3.121246337890625, -2.99713134765625, -2.873016357421875, -2.7489013671875, -2.624786376953125, -2.50067138671875, -2.376556396484375, -2.25244140625, -2.128326416015625, -2.00421142578125, -1.880096435546875, -1.7559814453125, -1.631866455078125, -1.50775146484375, -1.383636474609375, -1.259521484375, -1.135406494140625, -1.01129150390625, -0.887176513671875, -0.7630615234375, -0.638946533203125, -0.51483154296875, -0.390716552734375, -0.2666015625, -0.142486572265625, -0.01837158203125, 0.105743408203125, 0.2298583984375, 0.353973388671875, 0.47808837890625, 0.602203369140625, 0.726318359375, 0.850433349609375, 0.97454833984375, 1.098663330078125, 1.2227783203125, 1.346893310546875, 1.47100830078125, 1.595123291015625, 1.71923828125, 1.843353271484375, 1.96746826171875, 2.091583251953125, 2.2156982421875, 2.339813232421875, 2.46392822265625, 2.588043212890625, 2.712158203125, 2.836273193359375, 2.96038818359375, 3.084503173828125, 3.2086181640625, 3.332733154296875, 3.45684814453125, 3.580963134765625, 3.705078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 12.0, 10.0, 21.0, 29.0, 34.0, 42.0, 66.0, 105.0, 146.0, 208.0, 267.0, 468.0, 688.0, 1119.0, 1754.0, 2965.0, 5822.0, 13478.0, 42109.0, 158098.0, 407375.0, 287692.0, 83446.0, 23375.0, 8715.0, 4295.0, 2244.0, 1335.0, 851.0, 561.0, 388.0, 240.0, 170.0, 117.0, 80.0, 55.0, 49.0, 34.0, 15.0, 21.0, 14.0, 12.0, 9.0, 6.0, 6.0, 1.0, 2.0, 6.0, 4.0], "bins": [-3.845703125, -3.7381591796875, -3.630615234375, -3.5230712890625, -3.41552734375, -3.3079833984375, -3.200439453125, -3.0928955078125, -2.9853515625, -2.8778076171875, -2.770263671875, -2.6627197265625, -2.55517578125, -2.4476318359375, -2.340087890625, -2.2325439453125, -2.125, -2.0174560546875, -1.909912109375, -1.8023681640625, -1.69482421875, -1.5872802734375, -1.479736328125, -1.3721923828125, -1.2646484375, -1.1571044921875, -1.049560546875, -0.9420166015625, -0.83447265625, -0.7269287109375, -0.619384765625, -0.5118408203125, -0.404296875, -0.2967529296875, -0.189208984375, -0.0816650390625, 0.02587890625, 0.1334228515625, 0.240966796875, 0.3485107421875, 0.4560546875, 0.5635986328125, 0.671142578125, 0.7786865234375, 0.88623046875, 0.9937744140625, 1.101318359375, 1.2088623046875, 1.31640625, 1.4239501953125, 1.531494140625, 1.6390380859375, 1.74658203125, 1.8541259765625, 1.961669921875, 2.0692138671875, 2.1767578125, 2.2843017578125, 2.391845703125, 2.4993896484375, 2.60693359375, 2.7144775390625, 2.822021484375, 2.9295654296875, 3.037109375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 14.0, 14.0, 9.0, 10.0, 11.0, 16.0, 20.0, 28.0, 29.0, 30.0, 33.0, 34.0, 27.0, 37.0, 37.0, 43.0, 42.0, 1083.0, 40.0, 35.0, 44.0, 45.0, 39.0, 25.0, 34.0, 35.0, 28.0, 41.0, 30.0, 16.0, 24.0, 13.0, 17.0, 15.0, 7.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.748046875, -3.647796630859375, -3.54754638671875, -3.447296142578125, -3.3470458984375, -3.246795654296875, -3.14654541015625, -3.046295166015625, -2.946044921875, -2.845794677734375, -2.74554443359375, -2.645294189453125, -2.5450439453125, -2.444793701171875, -2.34454345703125, -2.244293212890625, -2.14404296875, -2.043792724609375, -1.94354248046875, -1.843292236328125, -1.7430419921875, -1.642791748046875, -1.54254150390625, -1.442291259765625, -1.342041015625, -1.241790771484375, -1.14154052734375, -1.041290283203125, -0.9410400390625, -0.840789794921875, -0.74053955078125, -0.640289306640625, -0.5400390625, -0.439788818359375, -0.33953857421875, -0.239288330078125, -0.1390380859375, -0.038787841796875, 0.06146240234375, 0.161712646484375, 0.261962890625, 0.362213134765625, 0.46246337890625, 0.562713623046875, 0.6629638671875, 0.763214111328125, 0.86346435546875, 0.963714599609375, 1.06396484375, 1.164215087890625, 1.26446533203125, 1.364715576171875, 1.4649658203125, 1.565216064453125, 1.66546630859375, 1.765716552734375, 1.865966796875, 1.966217041015625, 2.06646728515625, 2.166717529296875, 2.2669677734375, 2.367218017578125, 2.46746826171875, 2.567718505859375, 2.66796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 5.0, 8.0, 18.0, 24.0, 24.0, 43.0, 62.0, 103.0, 164.0, 282.0, 449.0, 723.0, 1275.0, 2294.0, 4336.0, 7882.0, 15058.0, 31957.0, 161546.0, 1797913.0, 36740.0, 16843.0, 8714.0, 4747.0, 2526.0, 1356.0, 764.0, 496.0, 246.0, 165.0, 130.0, 66.0, 49.0, 36.0, 25.0, 18.0, 13.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.05859375, -2.971405029296875, -2.88421630859375, -2.797027587890625, -2.7098388671875, -2.622650146484375, -2.53546142578125, -2.448272705078125, -2.361083984375, -2.273895263671875, -2.18670654296875, -2.099517822265625, -2.0123291015625, -1.925140380859375, -1.83795166015625, -1.750762939453125, -1.66357421875, -1.576385498046875, -1.48919677734375, -1.402008056640625, -1.3148193359375, -1.227630615234375, -1.14044189453125, -1.053253173828125, -0.966064453125, -0.878875732421875, -0.79168701171875, -0.704498291015625, -0.6173095703125, -0.530120849609375, -0.44293212890625, -0.355743408203125, -0.2685546875, -0.181365966796875, -0.09417724609375, -0.006988525390625, 0.0802001953125, 0.167388916015625, 0.25457763671875, 0.341766357421875, 0.428955078125, 0.516143798828125, 0.60333251953125, 0.690521240234375, 0.7777099609375, 0.864898681640625, 0.95208740234375, 1.039276123046875, 1.12646484375, 1.213653564453125, 1.30084228515625, 1.388031005859375, 1.4752197265625, 1.562408447265625, 1.64959716796875, 1.736785888671875, 1.823974609375, 1.911163330078125, 1.99835205078125, 2.085540771484375, 2.1727294921875, 2.259918212890625, 2.34710693359375, 2.434295654296875, 2.521484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 6.0, 6.0, 12.0, 3.0, 12.0, 18.0, 25.0, 27.0, 23.0, 43.0, 41.0, 46.0, 57.0, 57.0, 80.0, 78.0, 79.0, 74.0, 50.0, 44.0, 42.0, 22.0, 20.0, 23.0, 13.0, 15.0, 13.0, 8.0, 8.0, 7.0, 5.0, 5.0, 2.0, 4.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12590789794921875, -0.1213226318359375, -0.11673736572265625, -0.112152099609375, -0.10756683349609375, -0.1029815673828125, -0.09839630126953125, -0.09381103515625, -0.08922576904296875, -0.0846405029296875, -0.08005523681640625, -0.075469970703125, -0.07088470458984375, -0.0662994384765625, -0.06171417236328125, -0.05712890625, -0.05254364013671875, -0.0479583740234375, -0.04337310791015625, -0.038787841796875, -0.03420257568359375, -0.0296173095703125, -0.02503204345703125, -0.02044677734375, -0.01586151123046875, -0.0112762451171875, -0.00669097900390625, -0.002105712890625, 0.00247955322265625, 0.0070648193359375, 0.01165008544921875, 0.0162353515625, 0.02082061767578125, 0.0254058837890625, 0.02999114990234375, 0.034576416015625, 0.03916168212890625, 0.0437469482421875, 0.04833221435546875, 0.05291748046875, 0.05750274658203125, 0.0620880126953125, 0.06667327880859375, 0.071258544921875, 0.07584381103515625, 0.0804290771484375, 0.08501434326171875, 0.089599609375, 0.09418487548828125, 0.0987701416015625, 0.10335540771484375, 0.107940673828125, 0.11252593994140625, 0.1171112060546875, 0.12169647216796875, 0.12628173828125, 0.13086700439453125, 0.1354522705078125, 0.14003753662109375, 0.144622802734375, 0.14920806884765625, 0.1537933349609375, 0.15837860107421875, 0.1629638671875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 7.0, 10.0, 7.0, 9.0, 12.0, 12.0, 16.0, 16.0, 31.0, 31.0, 31.0, 43.0, 58.0, 87.0, 95.0, 114.0, 169.0, 200.0, 327.0, 1508.0, 96955.0, 944089.0, 3312.0, 424.0, 212.0, 149.0, 128.0, 102.0, 84.0, 60.0, 42.0, 34.0, 32.0, 26.0, 26.0, 19.0, 13.0, 8.0, 13.0, 7.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.66259765625, -2.5771484375, -2.49169921875, -2.40625, -2.32080078125, -2.2353515625, -2.14990234375, -2.064453125, -1.97900390625, -1.8935546875, -1.80810546875, -1.72265625, -1.63720703125, -1.5517578125, -1.46630859375, -1.380859375, -1.29541015625, -1.2099609375, -1.12451171875, -1.0390625, -0.95361328125, -0.8681640625, -0.78271484375, -0.697265625, -0.61181640625, -0.5263671875, -0.44091796875, -0.35546875, -0.27001953125, -0.1845703125, -0.09912109375, -0.013671875, 0.07177734375, 0.1572265625, 0.24267578125, 0.328125, 0.41357421875, 0.4990234375, 0.58447265625, 0.669921875, 0.75537109375, 0.8408203125, 0.92626953125, 1.01171875, 1.09716796875, 1.1826171875, 1.26806640625, 1.353515625, 1.43896484375, 1.5244140625, 1.60986328125, 1.6953125, 1.78076171875, 1.8662109375, 1.95166015625, 2.037109375, 2.12255859375, 2.2080078125, 2.29345703125, 2.37890625, 2.46435546875, 2.5498046875, 2.63525390625, 2.720703125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 34.0, 134.0, 753.0, 86.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.2052998542785645, -6.077407360076904, -5.949514865875244, -5.821622848510742, -5.693730354309082, -5.565837860107422, -5.437945365905762, -5.310052871704102, -5.182160377502441, -5.054267883300781, -4.926375389099121, -4.798483371734619, -4.670590877532959, -4.542698383331299, -4.414805889129639, -4.2869133949279785, -4.159021377563477, -4.031128883361816, -3.9032366275787354, -3.775344133377075, -3.647451877593994, -3.519559383392334, -3.391666889190674, -3.2637743949890137, -3.1358821392059326, -3.0079896450042725, -2.8800973892211914, -2.7522048950195312, -2.624312400817871, -2.49642014503479, -2.36852765083313, -2.240635395050049, -2.1127424240112305, -1.9848500490188599, -1.8569576740264893, -1.729065179824829, -1.6011728048324585, -1.473280429840088, -1.3453879356384277, -1.2174955606460571, -1.089603304862976, -0.9617109298706055, -0.8338184952735901, -0.7059260606765747, -0.5780336856842041, -0.4501413106918335, -0.3222488760948181, -0.19435644149780273, -0.06646406650543213, 0.061428338289260864, 0.18932074308395386, 0.31721314787864685, 0.44510555267333984, 0.5729979276657104, 0.7008903622627258, 0.8287827968597412, 0.9566751718521118, 1.0845675468444824, 1.2124600410461426, 1.3403524160385132, 1.4682447910308838, 1.5961371660232544, 1.724029541015625, 1.8519220352172852, 1.9798144102096558]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 5.0, 10.0, 19.0, 22.0, 17.0, 29.0, 27.0, 34.0, 50.0, 43.0, 57.0, 63.0, 54.0, 38.0, 72.0, 57.0, 48.0, 44.0, 43.0, 41.0, 35.0, 33.0, 27.0, 27.0, 19.0, 17.0, 10.0, 21.0, 5.0, 9.0, 9.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8219520449638367, -0.7973197102546692, -0.7726873159408569, -0.7480549812316895, -0.723422646522522, -0.6987902522087097, -0.6741579174995422, -0.64952552318573, -0.6248931884765625, -0.600260853767395, -0.5756284594535828, -0.5509961247444153, -0.526363730430603, -0.5017313957214355, -0.47709906101226807, -0.4524666965007782, -0.42783433198928833, -0.40320196747779846, -0.3785696029663086, -0.3539372682571411, -0.32930490374565125, -0.3046725392341614, -0.2800402045249939, -0.25540784001350403, -0.23077547550201416, -0.2061431109905243, -0.18151076138019562, -0.15687841176986694, -0.13224604725837708, -0.1076136901974678, -0.08298133313655853, -0.05834898352622986, -0.033716678619384766, -0.009084321558475494, 0.015548035502433777, 0.04018039256334305, 0.06481274962425232, 0.08944510668516159, 0.11407746374607086, 0.13870981335639954, 0.1633421778678894, 0.18797454237937927, 0.21260689198970795, 0.23723924160003662, 0.2618716061115265, 0.28650397062301636, 0.31113630533218384, 0.3357686698436737, 0.3604010343551636, 0.38503339886665344, 0.4096657633781433, 0.4342980980873108, 0.45893046259880066, 0.4835628271102905, 0.508195161819458, 0.5328274965286255, 0.5574598908424377, 0.5820922255516052, 0.6067246198654175, 0.631356954574585, 0.6559892892837524, 0.6806216835975647, 0.7052540183067322, 0.7298864126205444, 0.7545187473297119]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 10.0, 7.0, 9.0, 15.0, 11.0, 24.0, 22.0, 25.0, 36.0, 61.0, 53.0, 60.0, 65.0, 71.0, 73.0, 53.0, 64.0, 53.0, 47.0, 35.0, 37.0, 30.0, 24.0, 27.0, 19.0, 19.0, 9.0, 9.0, 10.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.91015625, -4.775970458984375, -4.64178466796875, -4.507598876953125, -4.3734130859375, -4.239227294921875, -4.10504150390625, -3.970855712890625, -3.836669921875, -3.702484130859375, -3.56829833984375, -3.434112548828125, -3.2999267578125, -3.165740966796875, -3.03155517578125, -2.897369384765625, -2.76318359375, -2.628997802734375, -2.49481201171875, -2.360626220703125, -2.2264404296875, -2.092254638671875, -1.95806884765625, -1.823883056640625, -1.689697265625, -1.555511474609375, -1.42132568359375, -1.287139892578125, -1.1529541015625, -1.018768310546875, -0.88458251953125, -0.750396728515625, -0.6162109375, -0.482025146484375, -0.34783935546875, -0.213653564453125, -0.0794677734375, 0.054718017578125, 0.18890380859375, 0.323089599609375, 0.457275390625, 0.591461181640625, 0.72564697265625, 0.859832763671875, 0.9940185546875, 1.128204345703125, 1.26239013671875, 1.396575927734375, 1.53076171875, 1.664947509765625, 1.79913330078125, 1.933319091796875, 2.0675048828125, 2.201690673828125, 2.33587646484375, 2.470062255859375, 2.604248046875, 2.738433837890625, 2.87261962890625, 3.006805419921875, 3.1409912109375, 3.275177001953125, 3.40936279296875, 3.543548583984375, 3.677734375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 4.0, 10.0, 10.0, 14.0, 18.0, 27.0, 32.0, 40.0, 60.0, 89.0, 124.0, 162.0, 255.0, 429.0, 670.0, 1145.0, 2065.0, 3949.0, 8387.0, 21117.0, 64695.0, 217336.0, 417325.0, 210493.0, 62537.0, 20412.0, 8186.0, 3778.0, 2017.0, 1137.0, 692.0, 409.0, 289.0, 180.0, 115.0, 92.0, 62.0, 42.0, 45.0, 18.0, 26.0, 12.0, 12.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-9.75, -9.43017578125, -9.1103515625, -8.79052734375, -8.470703125, -8.15087890625, -7.8310546875, -7.51123046875, -7.19140625, -6.87158203125, -6.5517578125, -6.23193359375, -5.912109375, -5.59228515625, -5.2724609375, -4.95263671875, -4.6328125, -4.31298828125, -3.9931640625, -3.67333984375, -3.353515625, -3.03369140625, -2.7138671875, -2.39404296875, -2.07421875, -1.75439453125, -1.4345703125, -1.11474609375, -0.794921875, -0.47509765625, -0.1552734375, 0.16455078125, 0.484375, 0.80419921875, 1.1240234375, 1.44384765625, 1.763671875, 2.08349609375, 2.4033203125, 2.72314453125, 3.04296875, 3.36279296875, 3.6826171875, 4.00244140625, 4.322265625, 4.64208984375, 4.9619140625, 5.28173828125, 5.6015625, 5.92138671875, 6.2412109375, 6.56103515625, 6.880859375, 7.20068359375, 7.5205078125, 7.84033203125, 8.16015625, 8.47998046875, 8.7998046875, 9.11962890625, 9.439453125, 9.75927734375, 10.0791015625, 10.39892578125, 10.71875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 11.0, 4.0, 5.0, 13.0, 11.0, 13.0, 11.0, 27.0, 17.0, 20.0, 20.0, 30.0, 40.0, 47.0, 50.0, 60.0, 87.0, 107.0, 152.0, 219.0, 1250.0, 211.0, 133.0, 95.0, 69.0, 39.0, 41.0, 35.0, 37.0, 31.0, 29.0, 22.0, 21.0, 13.0, 12.0, 9.0, 6.0, 10.0, 6.0, 8.0, 7.0, 2.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.0703125, -10.7384033203125, -10.406494140625, -10.0745849609375, -9.74267578125, -9.4107666015625, -9.078857421875, -8.7469482421875, -8.4150390625, -8.0831298828125, -7.751220703125, -7.4193115234375, -7.08740234375, -6.7554931640625, -6.423583984375, -6.0916748046875, -5.759765625, -5.4278564453125, -5.095947265625, -4.7640380859375, -4.43212890625, -4.1002197265625, -3.768310546875, -3.4364013671875, -3.1044921875, -2.7725830078125, -2.440673828125, -2.1087646484375, -1.77685546875, -1.4449462890625, -1.113037109375, -0.7811279296875, -0.44921875, -0.1173095703125, 0.214599609375, 0.5465087890625, 0.87841796875, 1.2103271484375, 1.542236328125, 1.8741455078125, 2.2060546875, 2.5379638671875, 2.869873046875, 3.2017822265625, 3.53369140625, 3.8656005859375, 4.197509765625, 4.5294189453125, 4.861328125, 5.1932373046875, 5.525146484375, 5.8570556640625, 6.18896484375, 6.5208740234375, 6.852783203125, 7.1846923828125, 7.5166015625, 7.8485107421875, 8.180419921875, 8.5123291015625, 8.84423828125, 9.1761474609375, 9.508056640625, 9.8399658203125, 10.171875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 12.0, 5.0, 7.0, 6.0, 6.0, 9.0, 19.0, 24.0, 25.0, 23.0, 28.0, 32.0, 39.0, 67.0, 128.0, 265.0, 828.0, 6527.0, 586105.0, 2528675.0, 20598.0, 1355.0, 374.0, 169.0, 84.0, 57.0, 34.0, 24.0, 26.0, 21.0, 32.0, 16.0, 12.0, 13.0, 11.0, 5.0, 6.0, 3.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.4375, -35.2294921875, -34.021484375, -32.8134765625, -31.60546875, -30.3974609375, -29.189453125, -27.9814453125, -26.7734375, -25.5654296875, -24.357421875, -23.1494140625, -21.94140625, -20.7333984375, -19.525390625, -18.3173828125, -17.109375, -15.9013671875, -14.693359375, -13.4853515625, -12.27734375, -11.0693359375, -9.861328125, -8.6533203125, -7.4453125, -6.2373046875, -5.029296875, -3.8212890625, -2.61328125, -1.4052734375, -0.197265625, 1.0107421875, 2.21875, 3.4267578125, 4.634765625, 5.8427734375, 7.05078125, 8.2587890625, 9.466796875, 10.6748046875, 11.8828125, 13.0908203125, 14.298828125, 15.5068359375, 16.71484375, 17.9228515625, 19.130859375, 20.3388671875, 21.546875, 22.7548828125, 23.962890625, 25.1708984375, 26.37890625, 27.5869140625, 28.794921875, 30.0029296875, 31.2109375, 32.4189453125, 33.626953125, 34.8349609375, 36.04296875, 37.2509765625, 38.458984375, 39.6669921875, 40.875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 91.0, 363.0, 423.0, 118.0, 12.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-183.71298217773438, -180.37814331054688, -177.04330444335938, -173.70846557617188, -170.37362670898438, -167.03878784179688, -163.70394897460938, -160.3690948486328, -157.0342559814453, -153.6994171142578, -150.3645782470703, -147.0297393798828, -143.6949005126953, -140.36004638671875, -137.02520751953125, -133.69036865234375, -130.35552978515625, -127.02069091796875, -123.68585205078125, -120.35101318359375, -117.01616668701172, -113.68132781982422, -110.34648895263672, -107.01165008544922, -103.67681884765625, -100.34197998046875, -97.00714111328125, -93.67230224609375, -90.33745574951172, -87.00261688232422, -83.66777801513672, -80.33293914794922, -76.99809265136719, -73.66325378417969, -70.32841491699219, -66.99357604980469, -63.658729553222656, -60.323890686035156, -56.989051818847656, -53.654212951660156, -50.319366455078125, -46.984527587890625, -43.64968490600586, -40.31484603881836, -36.980003356933594, -33.645164489746094, -30.310325622558594, -26.97548484802246, -23.64064598083496, -20.305805206298828, -16.970966339111328, -13.636125564575195, -10.301284790039062, -6.96644401550293, -3.6316051483154297, -0.2967643737792969, 3.038076400756836, 6.3729166984558105, 9.707756996154785, 13.042596817016602, 16.377437591552734, 19.712278366088867, 23.047117233276367, 26.3819580078125, 29.716798782348633]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 9.0, 12.0, 12.0, 16.0, 21.0, 18.0, 24.0, 20.0, 26.0, 28.0, 30.0, 27.0, 28.0, 43.0, 42.0, 36.0, 38.0, 41.0, 43.0, 44.0, 35.0, 41.0, 39.0, 38.0, 30.0, 28.0, 25.0, 25.0, 17.0, 17.0, 15.0, 15.0, 15.0, 19.0, 12.0, 13.0, 9.0, 4.0, 10.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-36.574195861816406, -35.43645477294922, -34.29871368408203, -33.160972595214844, -32.023231506347656, -30.8854923248291, -29.747753143310547, -28.61001205444336, -27.472270965576172, -26.334529876708984, -25.196788787841797, -24.059049606323242, -22.921308517456055, -21.783567428588867, -20.645828247070312, -19.508087158203125, -18.370346069335938, -17.23260498046875, -16.094863891601562, -14.957124710083008, -13.81938362121582, -12.681642532348633, -11.543902397155762, -10.40616226196289, -9.268421173095703, -8.130680084228516, -6.9929399490356445, -5.855199337005615, -4.717458724975586, -3.5797181129455566, -2.4419775009155273, -1.304236888885498, -0.16649627685546875, 0.9712443351745605, 2.10898494720459, 3.246725559234619, 4.384466171264648, 5.522206783294678, 6.659947395324707, 7.797688007354736, 8.935428619384766, 10.073169708251953, 11.210909843444824, 12.348649978637695, 13.486391067504883, 14.62413215637207, 15.761872291564941, 16.899612426757812, 18.037353515625, 19.175094604492188, 20.312835693359375, 21.45057487487793, 22.588315963745117, 23.726057052612305, 24.86379623413086, 26.001537322998047, 27.139278411865234, 28.277019500732422, 29.41476058959961, 30.552499771118164, 31.69024085998535, 32.827980041503906, 33.965721130371094, 35.10346221923828, 36.24120330810547]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 8.0, 6.0, 5.0, 7.0, 10.0, 14.0, 17.0, 26.0, 28.0, 36.0, 25.0, 43.0, 54.0, 59.0, 42.0, 67.0, 50.0, 56.0, 54.0, 53.0, 47.0, 44.0, 32.0, 34.0, 32.0, 23.0, 26.0, 23.0, 24.0, 16.0, 7.0, 10.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.8203125, -4.682708740234375, -4.54510498046875, -4.407501220703125, -4.2698974609375, -4.132293701171875, -3.99468994140625, -3.857086181640625, -3.719482421875, -3.581878662109375, -3.44427490234375, -3.306671142578125, -3.1690673828125, -3.031463623046875, -2.89385986328125, -2.756256103515625, -2.61865234375, -2.481048583984375, -2.34344482421875, -2.205841064453125, -2.0682373046875, -1.930633544921875, -1.79302978515625, -1.655426025390625, -1.517822265625, -1.380218505859375, -1.24261474609375, -1.105010986328125, -0.9674072265625, -0.829803466796875, -0.69219970703125, -0.554595947265625, -0.4169921875, -0.279388427734375, -0.14178466796875, -0.004180908203125, 0.1334228515625, 0.271026611328125, 0.40863037109375, 0.546234130859375, 0.683837890625, 0.821441650390625, 0.95904541015625, 1.096649169921875, 1.2342529296875, 1.371856689453125, 1.50946044921875, 1.647064208984375, 1.78466796875, 1.922271728515625, 2.05987548828125, 2.197479248046875, 2.3350830078125, 2.472686767578125, 2.61029052734375, 2.747894287109375, 2.885498046875, 3.023101806640625, 3.16070556640625, 3.298309326171875, 3.4359130859375, 3.573516845703125, 3.71112060546875, 3.848724365234375, 3.986328125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 7.0, 21.0, 19.0, 26.0, 29.0, 44.0, 70.0, 101.0, 163.0, 265.0, 413.0, 621.0, 1034.0, 1912.0, 4185.0, 13360.0, 90856.0, 1309875.0, 2555030.0, 184263.0, 20983.0, 5304.0, 2256.0, 1207.0, 710.0, 476.0, 316.0, 208.0, 145.0, 120.0, 69.0, 46.0, 43.0, 33.0, 12.0, 12.0, 9.0, 5.0, 3.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-18.71875, -18.1861572265625, -17.653564453125, -17.1209716796875, -16.58837890625, -16.0557861328125, -15.523193359375, -14.9906005859375, -14.4580078125, -13.9254150390625, -13.392822265625, -12.8602294921875, -12.32763671875, -11.7950439453125, -11.262451171875, -10.7298583984375, -10.197265625, -9.6646728515625, -9.132080078125, -8.5994873046875, -8.06689453125, -7.5343017578125, -7.001708984375, -6.4691162109375, -5.9365234375, -5.4039306640625, -4.871337890625, -4.3387451171875, -3.80615234375, -3.2735595703125, -2.740966796875, -2.2083740234375, -1.67578125, -1.1431884765625, -0.610595703125, -0.0780029296875, 0.45458984375, 0.9871826171875, 1.519775390625, 2.0523681640625, 2.5849609375, 3.1175537109375, 3.650146484375, 4.1827392578125, 4.71533203125, 5.2479248046875, 5.780517578125, 6.3131103515625, 6.845703125, 7.3782958984375, 7.910888671875, 8.4434814453125, 8.97607421875, 9.5086669921875, 10.041259765625, 10.5738525390625, 11.1064453125, 11.6390380859375, 12.171630859375, 12.7042236328125, 13.23681640625, 13.7694091796875, 14.302001953125, 14.8345947265625, 15.3671875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 3.0, 3.0, 8.0, 17.0, 23.0, 30.0, 42.0, 55.0, 112.0, 157.0, 249.0, 412.0, 593.0, 642.0, 562.0, 422.0, 278.0, 156.0, 108.0, 65.0, 38.0, 36.0, 21.0, 15.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6796875, -12.1422119140625, -11.604736328125, -11.0672607421875, -10.52978515625, -9.9923095703125, -9.454833984375, -8.9173583984375, -8.3798828125, -7.8424072265625, -7.304931640625, -6.7674560546875, -6.22998046875, -5.6925048828125, -5.155029296875, -4.6175537109375, -4.080078125, -3.5426025390625, -3.005126953125, -2.4676513671875, -1.93017578125, -1.3927001953125, -0.855224609375, -0.3177490234375, 0.2197265625, 0.7572021484375, 1.294677734375, 1.8321533203125, 2.36962890625, 2.9071044921875, 3.444580078125, 3.9820556640625, 4.51953125, 5.0570068359375, 5.594482421875, 6.1319580078125, 6.66943359375, 7.2069091796875, 7.744384765625, 8.2818603515625, 8.8193359375, 9.3568115234375, 9.894287109375, 10.4317626953125, 10.96923828125, 11.5067138671875, 12.044189453125, 12.5816650390625, 13.119140625, 13.6566162109375, 14.194091796875, 14.7315673828125, 15.26904296875, 15.8065185546875, 16.343994140625, 16.8814697265625, 17.4189453125, 17.9564208984375, 18.493896484375, 19.0313720703125, 19.56884765625, 20.1063232421875, 20.643798828125, 21.1812744140625, 21.71875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 12.0, 15.0, 29.0, 50.0, 63.0, 138.0, 222.0, 429.0, 857.0, 1981.0, 5812.0, 26115.0, 217151.0, 2357394.0, 1440400.0, 119767.0, 16581.0, 4177.0, 1562.0, 700.0, 376.0, 198.0, 95.0, 46.0, 39.0, 21.0, 13.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.875, -23.048095703125, -22.22119140625, -21.394287109375, -20.5673828125, -19.740478515625, -18.91357421875, -18.086669921875, -17.259765625, -16.432861328125, -15.60595703125, -14.779052734375, -13.9521484375, -13.125244140625, -12.29833984375, -11.471435546875, -10.64453125, -9.817626953125, -8.99072265625, -8.163818359375, -7.3369140625, -6.510009765625, -5.68310546875, -4.856201171875, -4.029296875, -3.202392578125, -2.37548828125, -1.548583984375, -0.7216796875, 0.105224609375, 0.93212890625, 1.759033203125, 2.5859375, 3.412841796875, 4.23974609375, 5.066650390625, 5.8935546875, 6.720458984375, 7.54736328125, 8.374267578125, 9.201171875, 10.028076171875, 10.85498046875, 11.681884765625, 12.5087890625, 13.335693359375, 14.16259765625, 14.989501953125, 15.81640625, 16.643310546875, 17.47021484375, 18.297119140625, 19.1240234375, 19.950927734375, 20.77783203125, 21.604736328125, 22.431640625, 23.258544921875, 24.08544921875, 24.912353515625, 25.7392578125, 26.566162109375, 27.39306640625, 28.219970703125, 29.046875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 9.0, 24.0, 121.0, 234.0, 263.0, 235.0, 95.0, 24.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.041736602783203, -18.807376861572266, -14.573019027709961, -10.33866024017334, -6.104301452636719, -1.8699417114257812, 2.3644161224365234, 6.598773956298828, 10.833133697509766, 15.067492485046387, 19.301851272583008, 23.536209106445312, 27.77056884765625, 32.00492858886719, 36.239288330078125, 40.4736442565918, 44.708003997802734, 48.94236373901367, 53.176719665527344, 57.41107940673828, 61.64543914794922, 65.87979888916016, 70.1141586303711, 74.3485107421875, 78.58287048339844, 82.81723022460938, 87.05158996582031, 91.28594970703125, 95.52030944824219, 99.75466918945312, 103.98902130126953, 108.22338104248047, 112.45773315429688, 116.69209289550781, 120.92645263671875, 125.16081237792969, 129.39517211914062, 133.62953186035156, 137.8638916015625, 142.09823608398438, 146.33261108398438, 150.5669708251953, 154.80133056640625, 159.0356903076172, 163.27005004882812, 167.50440979003906, 171.73876953125, 175.97311401367188, 180.2074737548828, 184.44183349609375, 188.6761932373047, 192.91055297851562, 197.14491271972656, 201.3792724609375, 205.61363220214844, 209.84799194335938, 214.08233642578125, 218.3166961669922, 222.55105590820312, 226.78541564941406, 231.019775390625, 235.25413513183594, 239.48849487304688, 243.72283935546875, 247.95721435546875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 9.0, 6.0, 7.0, 7.0, 12.0, 9.0, 15.0, 22.0, 25.0, 15.0, 22.0, 27.0, 38.0, 29.0, 36.0, 37.0, 33.0, 32.0, 44.0, 39.0, 37.0, 40.0, 41.0, 46.0, 42.0, 35.0, 31.0, 30.0, 28.0, 28.0, 16.0, 29.0, 25.0, 15.0, 19.0, 12.0, 9.0, 7.0, 12.0, 2.0, 6.0, 7.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.5577392578125, -40.31534957885742, -39.07296371459961, -37.83057403564453, -36.58818817138672, -35.34579849243164, -34.10340881347656, -32.86102294921875, -31.618633270263672, -30.376245498657227, -29.13385772705078, -27.891468048095703, -26.649080276489258, -25.406692504882812, -24.164304733276367, -22.921916961669922, -21.679529190063477, -20.43714141845703, -19.194753646850586, -17.95236587524414, -16.709976196289062, -15.467588424682617, -14.225200653076172, -12.98281192779541, -11.740424156188965, -10.49803638458252, -9.255647659301758, -8.013259887695312, -6.770871639251709, -5.5284833908081055, -4.28609561920166, -3.0437068939208984, -1.8013191223144531, -0.5589309930801392, 0.6834571361541748, 1.9258451461791992, 3.1682333946228027, 4.410621643066406, 5.653009414672852, 6.895398139953613, 8.137785911560059, 9.380173683166504, 10.622562408447266, 11.864950180053711, 13.107337951660156, 14.349726676940918, 15.592114448547363, 16.834503173828125, 18.07689094543457, 19.319278717041016, 20.56166648864746, 21.804054260253906, 23.046443939208984, 24.28883171081543, 25.531219482421875, 26.773609161376953, 28.015995025634766, 29.25838279724121, 30.500770568847656, 31.743160247802734, 32.98554611206055, 34.227935791015625, 35.47032165527344, 36.712711334228516, 37.955101013183594]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 5.0, 2.0, 3.0, 10.0, 9.0, 14.0, 20.0, 21.0, 19.0, 24.0, 30.0, 32.0, 40.0, 48.0, 38.0, 42.0, 63.0, 60.0, 69.0, 52.0, 52.0, 43.0, 46.0, 34.0, 32.0, 34.0, 26.0, 17.0, 26.0, 21.0, 15.0, 14.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.703125, -4.569549560546875, -4.43597412109375, -4.302398681640625, -4.1688232421875, -4.035247802734375, -3.90167236328125, -3.768096923828125, -3.634521484375, -3.500946044921875, -3.36737060546875, -3.233795166015625, -3.1002197265625, -2.966644287109375, -2.83306884765625, -2.699493408203125, -2.56591796875, -2.432342529296875, -2.29876708984375, -2.165191650390625, -2.0316162109375, -1.898040771484375, -1.76446533203125, -1.630889892578125, -1.497314453125, -1.363739013671875, -1.23016357421875, -1.096588134765625, -0.9630126953125, -0.829437255859375, -0.69586181640625, -0.562286376953125, -0.4287109375, -0.295135498046875, -0.16156005859375, -0.027984619140625, 0.1055908203125, 0.239166259765625, 0.37274169921875, 0.506317138671875, 0.639892578125, 0.773468017578125, 0.90704345703125, 1.040618896484375, 1.1741943359375, 1.307769775390625, 1.44134521484375, 1.574920654296875, 1.70849609375, 1.842071533203125, 1.97564697265625, 2.109222412109375, 2.2427978515625, 2.376373291015625, 2.50994873046875, 2.643524169921875, 2.777099609375, 2.910675048828125, 3.04425048828125, 3.177825927734375, 3.3114013671875, 3.444976806640625, 3.57855224609375, 3.712127685546875, 3.845703125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 9.0, 11.0, 20.0, 41.0, 50.0, 62.0, 67.0, 114.0, 204.0, 271.0, 423.0, 693.0, 1084.0, 2045.0, 3863.0, 9516.0, 26455.0, 80270.0, 216261.0, 346284.0, 227361.0, 85704.0, 28176.0, 10080.0, 4218.0, 2070.0, 1188.0, 699.0, 426.0, 289.0, 179.0, 117.0, 76.0, 65.0, 44.0, 25.0, 27.0, 9.0, 9.0, 8.0, 4.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.515625, -2.43829345703125, -2.3609619140625, -2.28363037109375, -2.206298828125, -2.12896728515625, -2.0516357421875, -1.97430419921875, -1.89697265625, -1.81964111328125, -1.7423095703125, -1.66497802734375, -1.587646484375, -1.51031494140625, -1.4329833984375, -1.35565185546875, -1.2783203125, -1.20098876953125, -1.1236572265625, -1.04632568359375, -0.968994140625, -0.89166259765625, -0.8143310546875, -0.73699951171875, -0.65966796875, -0.58233642578125, -0.5050048828125, -0.42767333984375, -0.350341796875, -0.27301025390625, -0.1956787109375, -0.11834716796875, -0.041015625, 0.03631591796875, 0.1136474609375, 0.19097900390625, 0.268310546875, 0.34564208984375, 0.4229736328125, 0.50030517578125, 0.57763671875, 0.65496826171875, 0.7322998046875, 0.80963134765625, 0.886962890625, 0.96429443359375, 1.0416259765625, 1.11895751953125, 1.1962890625, 1.27362060546875, 1.3509521484375, 1.42828369140625, 1.505615234375, 1.58294677734375, 1.6602783203125, 1.73760986328125, 1.81494140625, 1.89227294921875, 1.9696044921875, 2.04693603515625, 2.124267578125, 2.20159912109375, 2.2789306640625, 2.35626220703125, 2.43359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 3.0, 4.0, 5.0, 10.0, 11.0, 13.0, 14.0, 10.0, 9.0, 23.0, 17.0, 19.0, 29.0, 28.0, 24.0, 31.0, 35.0, 16.0, 25.0, 35.0, 37.0, 42.0, 29.0, 1060.0, 39.0, 29.0, 41.0, 35.0, 37.0, 37.0, 33.0, 22.0, 21.0, 26.0, 24.0, 16.0, 16.0, 16.0, 22.0, 14.0, 13.0, 14.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 7.0], "bins": [-2.599609375, -2.52471923828125, -2.4498291015625, -2.37493896484375, -2.300048828125, -2.22515869140625, -2.1502685546875, -2.07537841796875, -2.00048828125, -1.92559814453125, -1.8507080078125, -1.77581787109375, -1.700927734375, -1.62603759765625, -1.5511474609375, -1.47625732421875, -1.4013671875, -1.32647705078125, -1.2515869140625, -1.17669677734375, -1.101806640625, -1.02691650390625, -0.9520263671875, -0.87713623046875, -0.80224609375, -0.72735595703125, -0.6524658203125, -0.57757568359375, -0.502685546875, -0.42779541015625, -0.3529052734375, -0.27801513671875, -0.203125, -0.12823486328125, -0.0533447265625, 0.02154541015625, 0.096435546875, 0.17132568359375, 0.2462158203125, 0.32110595703125, 0.39599609375, 0.47088623046875, 0.5457763671875, 0.62066650390625, 0.695556640625, 0.77044677734375, 0.8453369140625, 0.92022705078125, 0.9951171875, 1.07000732421875, 1.1448974609375, 1.21978759765625, 1.294677734375, 1.36956787109375, 1.4444580078125, 1.51934814453125, 1.59423828125, 1.66912841796875, 1.7440185546875, 1.81890869140625, 1.893798828125, 1.96868896484375, 2.0435791015625, 2.11846923828125, 2.193359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 3.0, 7.0, 11.0, 19.0, 20.0, 31.0, 48.0, 68.0, 104.0, 129.0, 247.0, 358.0, 650.0, 1134.0, 1990.0, 3506.0, 6405.0, 11633.0, 21962.0, 49277.0, 1893835.0, 54600.0, 23196.0, 12183.0, 6728.0, 3745.0, 2144.0, 1218.0, 687.0, 418.0, 261.0, 171.0, 107.0, 69.0, 40.0, 30.0, 31.0, 24.0, 10.0, 7.0, 9.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.576171875, -2.5015869140625, -2.427001953125, -2.3524169921875, -2.27783203125, -2.2032470703125, -2.128662109375, -2.0540771484375, -1.9794921875, -1.9049072265625, -1.830322265625, -1.7557373046875, -1.68115234375, -1.6065673828125, -1.531982421875, -1.4573974609375, -1.3828125, -1.3082275390625, -1.233642578125, -1.1590576171875, -1.08447265625, -1.0098876953125, -0.935302734375, -0.8607177734375, -0.7861328125, -0.7115478515625, -0.636962890625, -0.5623779296875, -0.48779296875, -0.4132080078125, -0.338623046875, -0.2640380859375, -0.189453125, -0.1148681640625, -0.040283203125, 0.0343017578125, 0.10888671875, 0.1834716796875, 0.258056640625, 0.3326416015625, 0.4072265625, 0.4818115234375, 0.556396484375, 0.6309814453125, 0.70556640625, 0.7801513671875, 0.854736328125, 0.9293212890625, 1.00390625, 1.0784912109375, 1.153076171875, 1.2276611328125, 1.30224609375, 1.3768310546875, 1.451416015625, 1.5260009765625, 1.6005859375, 1.6751708984375, 1.749755859375, 1.8243408203125, 1.89892578125, 1.9735107421875, 2.048095703125, 2.1226806640625, 2.197265625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 2.0, 5.0, 9.0, 9.0, 14.0, 17.0, 18.0, 19.0, 23.0, 27.0, 32.0, 38.0, 38.0, 40.0, 53.0, 67.0, 89.0, 75.0, 77.0, 51.0, 44.0, 39.0, 42.0, 34.0, 17.0, 17.0, 10.0, 14.0, 13.0, 14.0, 12.0, 9.0, 8.0, 3.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12338542938232422, -0.11945152282714844, -0.11551761627197266, -0.11158370971679688, -0.1076498031616211, -0.10371589660644531, -0.09978199005126953, -0.09584808349609375, -0.09191417694091797, -0.08798027038574219, -0.0840463638305664, -0.08011245727539062, -0.07617855072021484, -0.07224464416503906, -0.06831073760986328, -0.0643768310546875, -0.06044292449951172, -0.05650901794433594, -0.052575111389160156, -0.048641204833984375, -0.044707298278808594, -0.04077339172363281, -0.03683948516845703, -0.03290557861328125, -0.02897167205810547, -0.025037765502929688, -0.021103858947753906, -0.017169952392578125, -0.013236045837402344, -0.009302139282226562, -0.005368232727050781, -0.001434326171875, 0.0024995803833007812, 0.0064334869384765625, 0.010367393493652344, 0.014301300048828125, 0.018235206604003906, 0.022169113159179688, 0.02610301971435547, 0.03003692626953125, 0.03397083282470703, 0.03790473937988281, 0.041838645935058594, 0.045772552490234375, 0.049706459045410156, 0.05364036560058594, 0.05757427215576172, 0.0615081787109375, 0.06544208526611328, 0.06937599182128906, 0.07330989837646484, 0.07724380493164062, 0.0811777114868164, 0.08511161804199219, 0.08904552459716797, 0.09297943115234375, 0.09691333770751953, 0.10084724426269531, 0.1047811508178711, 0.10871505737304688, 0.11264896392822266, 0.11658287048339844, 0.12051677703857422, 0.12445068359375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 3.0, 7.0, 3.0, 10.0, 13.0, 10.0, 15.0, 21.0, 32.0, 41.0, 46.0, 53.0, 41.0, 60.0, 67.0, 90.0, 124.0, 126.0, 178.0, 250.0, 677.0, 19946.0, 1010243.0, 14739.0, 606.0, 271.0, 162.0, 134.0, 97.0, 89.0, 50.0, 52.0, 48.0, 39.0, 47.0, 31.0, 37.0, 12.0, 14.0, 17.0, 10.0, 9.0, 5.0, 3.0, 5.0, 1.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.080078125, -2.016021728515625, -1.95196533203125, -1.887908935546875, -1.8238525390625, -1.759796142578125, -1.69573974609375, -1.631683349609375, -1.567626953125, -1.503570556640625, -1.43951416015625, -1.375457763671875, -1.3114013671875, -1.247344970703125, -1.18328857421875, -1.119232177734375, -1.05517578125, -0.991119384765625, -0.92706298828125, -0.863006591796875, -0.7989501953125, -0.734893798828125, -0.67083740234375, -0.606781005859375, -0.542724609375, -0.478668212890625, -0.41461181640625, -0.350555419921875, -0.2864990234375, -0.222442626953125, -0.15838623046875, -0.094329833984375, -0.0302734375, 0.033782958984375, 0.09783935546875, 0.161895751953125, 0.2259521484375, 0.290008544921875, 0.35406494140625, 0.418121337890625, 0.482177734375, 0.546234130859375, 0.61029052734375, 0.674346923828125, 0.7384033203125, 0.802459716796875, 0.86651611328125, 0.930572509765625, 0.99462890625, 1.058685302734375, 1.12274169921875, 1.186798095703125, 1.2508544921875, 1.314910888671875, 1.37896728515625, 1.443023681640625, 1.507080078125, 1.571136474609375, 1.63519287109375, 1.699249267578125, 1.7633056640625, 1.827362060546875, 1.89141845703125, 1.955474853515625, 2.01953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 19.0, 689.0, 306.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.654077529907227, -8.469683647155762, -8.28528881072998, -8.100894927978516, -7.916501045227051, -7.732106685638428, -7.547712326049805, -7.36331844329834, -7.178924083709717, -6.994529724121094, -6.810135841369629, -6.625741481781006, -6.441347599029541, -6.256953239440918, -6.072559356689453, -5.88816499710083, -5.703770637512207, -5.519376277923584, -5.334982395172119, -5.150588035583496, -4.966194152832031, -4.781799793243408, -4.597405433654785, -4.41301155090332, -4.2286176681518555, -4.044223308563232, -3.8598294258117676, -3.6754350662231445, -3.4910409450531006, -3.3066468238830566, -3.1222527027130127, -2.9378585815429688, -2.7534639835357666, -2.5690698623657227, -2.3846757411956787, -2.2002816200256348, -2.0158872604370117, -1.8314931392669678, -1.6470990180969238, -1.4627047777175903, -1.2783106565475464, -1.0939165353775024, -0.909522294998169, -0.725128173828125, -0.5407339930534363, -0.35633981227874756, -0.1719456911087036, 0.012448549270629883, 0.19684267044067383, 0.38123685121536255, 0.5656310319900513, 0.7500251531600952, 0.9344193339347839, 1.1188135147094727, 1.3032076358795166, 1.48760187625885, 1.671995997428894, 1.856390118598938, 2.0407843589782715, 2.2251784801483154, 2.4095726013183594, 2.5939669609069824, 2.7783608436584473, 2.9627552032470703, 3.1471493244171143]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 9.0, 10.0, 15.0, 19.0, 17.0, 33.0, 28.0, 41.0, 35.0, 46.0, 59.0, 46.0, 72.0, 60.0, 67.0, 49.0, 51.0, 48.0, 46.0, 49.0, 34.0, 38.0, 23.0, 22.0, 20.0, 19.0, 13.0, 7.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6053920984268188, -0.5840582847595215, -0.5627245306968689, -0.5413907170295715, -0.520056962966919, -0.4987231492996216, -0.4773893654346466, -0.45605558156967163, -0.43472179770469666, -0.4133880138397217, -0.3920542299747467, -0.37072044610977173, -0.34938663244247437, -0.3280528783798218, -0.3067190647125244, -0.28538528084754944, -0.26405149698257446, -0.2427177131175995, -0.2213839292526245, -0.20005013048648834, -0.17871634662151337, -0.1573825627565384, -0.13604876399040222, -0.11471498012542725, -0.09338119626045227, -0.0720474123954773, -0.05071362107992172, -0.02937982976436615, -0.008046045899391174, 0.013287737965583801, 0.03462153673171997, 0.055955320596694946, 0.07728904485702515, 0.09862282872200012, 0.1199566200375557, 0.14129041135311127, 0.16262419521808624, 0.18395797908306122, 0.2052917778491974, 0.22662556171417236, 0.24795934557914734, 0.2692931294441223, 0.2906269133090973, 0.31196069717407227, 0.33329451084136963, 0.3546282649040222, 0.3759620785713196, 0.39729586243629456, 0.41862964630126953, 0.4399634301662445, 0.4612972140312195, 0.48263102769851685, 0.5039647817611694, 0.5252985954284668, 0.5466324090957642, 0.5679661631584167, 0.5892999172210693, 0.6106337308883667, 0.6319674849510193, 0.6533012986183167, 0.6746350526809692, 0.6959688663482666, 0.717302680015564, 0.7386364340782166, 0.7599702477455139]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 4.0, 6.0, 5.0, 8.0, 9.0, 6.0, 17.0, 24.0, 28.0, 32.0, 31.0, 24.0, 35.0, 35.0, 45.0, 51.0, 59.0, 58.0, 52.0, 63.0, 45.0, 43.0, 38.0, 42.0, 39.0, 27.0, 30.0, 21.0, 25.0, 18.0, 16.0, 12.0, 10.0, 9.0, 6.0, 7.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-4.37890625, -4.251953125, -4.125, -3.998046875, -3.87109375, -3.744140625, -3.6171875, -3.490234375, -3.36328125, -3.236328125, -3.109375, -2.982421875, -2.85546875, -2.728515625, -2.6015625, -2.474609375, -2.34765625, -2.220703125, -2.09375, -1.966796875, -1.83984375, -1.712890625, -1.5859375, -1.458984375, -1.33203125, -1.205078125, -1.078125, -0.951171875, -0.82421875, -0.697265625, -0.5703125, -0.443359375, -0.31640625, -0.189453125, -0.0625, 0.064453125, 0.19140625, 0.318359375, 0.4453125, 0.572265625, 0.69921875, 0.826171875, 0.953125, 1.080078125, 1.20703125, 1.333984375, 1.4609375, 1.587890625, 1.71484375, 1.841796875, 1.96875, 2.095703125, 2.22265625, 2.349609375, 2.4765625, 2.603515625, 2.73046875, 2.857421875, 2.984375, 3.111328125, 3.23828125, 3.365234375, 3.4921875, 3.619140625, 3.74609375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 11.0, 16.0, 27.0, 33.0, 43.0, 69.0, 121.0, 163.0, 271.0, 400.0, 774.0, 1381.0, 2848.0, 8029.0, 31948.0, 166979.0, 516946.0, 251496.0, 48389.0, 11076.0, 3588.0, 1667.0, 884.0, 506.0, 308.0, 155.0, 131.0, 88.0, 62.0, 39.0, 18.0, 22.0, 15.0, 11.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.814697265625, -9.50439453125, -9.194091796875, -8.8837890625, -8.573486328125, -8.26318359375, -7.952880859375, -7.642578125, -7.332275390625, -7.02197265625, -6.711669921875, -6.4013671875, -6.091064453125, -5.78076171875, -5.470458984375, -5.16015625, -4.849853515625, -4.53955078125, -4.229248046875, -3.9189453125, -3.608642578125, -3.29833984375, -2.988037109375, -2.677734375, -2.367431640625, -2.05712890625, -1.746826171875, -1.4365234375, -1.126220703125, -0.81591796875, -0.505615234375, -0.1953125, 0.114990234375, 0.42529296875, 0.735595703125, 1.0458984375, 1.356201171875, 1.66650390625, 1.976806640625, 2.287109375, 2.597412109375, 2.90771484375, 3.218017578125, 3.5283203125, 3.838623046875, 4.14892578125, 4.459228515625, 4.76953125, 5.079833984375, 5.39013671875, 5.700439453125, 6.0107421875, 6.321044921875, 6.63134765625, 6.941650390625, 7.251953125, 7.562255859375, 7.87255859375, 8.182861328125, 8.4931640625, 8.803466796875, 9.11376953125, 9.424072265625, 9.734375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 1.0, 3.0, 3.0, 4.0, 11.0, 4.0, 10.0, 8.0, 6.0, 18.0, 10.0, 8.0, 20.0, 24.0, 28.0, 23.0, 41.0, 40.0, 45.0, 58.0, 83.0, 108.0, 161.0, 275.0, 1279.0, 169.0, 107.0, 83.0, 62.0, 47.0, 36.0, 37.0, 29.0, 27.0, 32.0, 19.0, 18.0, 11.0, 21.0, 15.0, 14.0, 8.0, 16.0, 2.0, 5.0, 10.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.15625, -11.76513671875, -11.3740234375, -10.98291015625, -10.591796875, -10.20068359375, -9.8095703125, -9.41845703125, -9.02734375, -8.63623046875, -8.2451171875, -7.85400390625, -7.462890625, -7.07177734375, -6.6806640625, -6.28955078125, -5.8984375, -5.50732421875, -5.1162109375, -4.72509765625, -4.333984375, -3.94287109375, -3.5517578125, -3.16064453125, -2.76953125, -2.37841796875, -1.9873046875, -1.59619140625, -1.205078125, -0.81396484375, -0.4228515625, -0.03173828125, 0.359375, 0.75048828125, 1.1416015625, 1.53271484375, 1.923828125, 2.31494140625, 2.7060546875, 3.09716796875, 3.48828125, 3.87939453125, 4.2705078125, 4.66162109375, 5.052734375, 5.44384765625, 5.8349609375, 6.22607421875, 6.6171875, 7.00830078125, 7.3994140625, 7.79052734375, 8.181640625, 8.57275390625, 8.9638671875, 9.35498046875, 9.74609375, 10.13720703125, 10.5283203125, 10.91943359375, 11.310546875, 11.70166015625, 12.0927734375, 12.48388671875, 12.875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 10.0, 6.0, 7.0, 5.0, 10.0, 11.0, 16.0, 10.0, 22.0, 18.0, 17.0, 28.0, 40.0, 28.0, 48.0, 79.0, 119.0, 214.0, 416.0, 1118.0, 3514.0, 17771.0, 193745.0, 2356199.0, 529157.0, 34741.0, 5528.0, 1471.0, 573.0, 275.0, 149.0, 98.0, 57.0, 41.0, 39.0, 23.0, 21.0, 9.0, 10.0, 9.0, 6.0, 6.0, 8.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-19.03125, -18.43017578125, -17.8291015625, -17.22802734375, -16.626953125, -16.02587890625, -15.4248046875, -14.82373046875, -14.22265625, -13.62158203125, -13.0205078125, -12.41943359375, -11.818359375, -11.21728515625, -10.6162109375, -10.01513671875, -9.4140625, -8.81298828125, -8.2119140625, -7.61083984375, -7.009765625, -6.40869140625, -5.8076171875, -5.20654296875, -4.60546875, -4.00439453125, -3.4033203125, -2.80224609375, -2.201171875, -1.60009765625, -0.9990234375, -0.39794921875, 0.203125, 0.80419921875, 1.4052734375, 2.00634765625, 2.607421875, 3.20849609375, 3.8095703125, 4.41064453125, 5.01171875, 5.61279296875, 6.2138671875, 6.81494140625, 7.416015625, 8.01708984375, 8.6181640625, 9.21923828125, 9.8203125, 10.42138671875, 11.0224609375, 11.62353515625, 12.224609375, 12.82568359375, 13.4267578125, 14.02783203125, 14.62890625, 15.22998046875, 15.8310546875, 16.43212890625, 17.033203125, 17.63427734375, 18.2353515625, 18.83642578125, 19.4375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 29.0, 145.0, 362.0, 347.0, 101.0, 20.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.53934097290039, -43.61045455932617, -40.68156814575195, -37.752681732177734, -34.823795318603516, -31.894908905029297, -28.966020584106445, -26.037134170532227, -23.108247756958008, -20.17936134338379, -17.25047492980957, -14.321587562561035, -11.392701148986816, -8.463814735412598, -5.5349273681640625, -2.6060409545898438, 0.322845458984375, 3.251732110977173, 6.180618762969971, 9.109505653381348, 12.038392066955566, 14.967278480529785, 17.89616584777832, 20.82505226135254, 23.753938674926758, 26.682825088500977, 29.611711502075195, 32.54059982299805, 35.469486236572266, 38.398372650146484, 41.3272590637207, 44.25614547729492, 47.185035705566406, 50.113922119140625, 53.042808532714844, 55.97169494628906, 58.90058135986328, 61.8294677734375, 64.75835418701172, 67.68724060058594, 70.61612701416016, 73.54501342773438, 76.4738998413086, 79.40278625488281, 82.33167266845703, 85.26055908203125, 88.18944549560547, 91.11833190917969, 94.04722595214844, 96.97611236572266, 99.90499877929688, 102.8338851928711, 105.76277160644531, 108.69165802001953, 111.62054443359375, 114.54943084716797, 117.47831726074219, 120.4072036743164, 123.33609008789062, 126.26497650146484, 129.19386291503906, 132.1227569580078, 135.0516357421875, 137.98052978515625, 140.90940856933594]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 7.0, 9.0, 3.0, 9.0, 12.0, 12.0, 9.0, 16.0, 21.0, 29.0, 25.0, 25.0, 21.0, 23.0, 25.0, 25.0, 34.0, 23.0, 48.0, 43.0, 52.0, 46.0, 37.0, 43.0, 48.0, 39.0, 32.0, 28.0, 30.0, 25.0, 30.0, 27.0, 21.0, 22.0, 21.0, 16.0, 9.0, 8.0, 14.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.615257263183594, -40.30926513671875, -39.003273010253906, -37.6972770690918, -36.39128494262695, -35.08529281616211, -33.779296875, -32.473304748535156, -31.167312622070312, -29.86132049560547, -28.555326461791992, -27.249332427978516, -25.943340301513672, -24.637348175048828, -23.33135414123535, -22.025360107421875, -20.71936798095703, -19.413375854492188, -18.10738182067871, -16.801387786865234, -15.49539566040039, -14.18940258026123, -12.88340950012207, -11.57741641998291, -10.27142333984375, -8.96543025970459, -7.65943717956543, -6.3534440994262695, -5.047451019287109, -3.741457939147949, -2.435464859008789, -1.129471778869629, 0.17652511596679688, 1.482518196105957, 2.788511276245117, 4.094504356384277, 5.4004974365234375, 6.706490516662598, 8.012483596801758, 9.318476676940918, 10.624469757080078, 11.930462837219238, 13.236455917358398, 14.542448997497559, 15.848442077636719, 17.154434204101562, 18.46042823791504, 19.766422271728516, 21.07241439819336, 22.378406524658203, 23.68440055847168, 24.990394592285156, 26.29638671875, 27.602378845214844, 28.90837287902832, 30.214366912841797, 31.52035903930664, 32.826351165771484, 34.132347106933594, 35.43833923339844, 36.74433135986328, 38.050323486328125, 39.35631561279297, 40.66231155395508, 41.96830368041992]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 11.0, 10.0, 9.0, 11.0, 13.0, 22.0, 31.0, 30.0, 28.0, 45.0, 39.0, 60.0, 38.0, 64.0, 45.0, 59.0, 55.0, 63.0, 54.0, 34.0, 35.0, 36.0, 33.0, 30.0, 23.0, 26.0, 16.0, 16.0, 16.0, 15.0, 6.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.3515625, -5.20458984375, -5.0576171875, -4.91064453125, -4.763671875, -4.61669921875, -4.4697265625, -4.32275390625, -4.17578125, -4.02880859375, -3.8818359375, -3.73486328125, -3.587890625, -3.44091796875, -3.2939453125, -3.14697265625, -3.0, -2.85302734375, -2.7060546875, -2.55908203125, -2.412109375, -2.26513671875, -2.1181640625, -1.97119140625, -1.82421875, -1.67724609375, -1.5302734375, -1.38330078125, -1.236328125, -1.08935546875, -0.9423828125, -0.79541015625, -0.6484375, -0.50146484375, -0.3544921875, -0.20751953125, -0.060546875, 0.08642578125, 0.2333984375, 0.38037109375, 0.52734375, 0.67431640625, 0.8212890625, 0.96826171875, 1.115234375, 1.26220703125, 1.4091796875, 1.55615234375, 1.703125, 1.85009765625, 1.9970703125, 2.14404296875, 2.291015625, 2.43798828125, 2.5849609375, 2.73193359375, 2.87890625, 3.02587890625, 3.1728515625, 3.31982421875, 3.466796875, 3.61376953125, 3.7607421875, 3.90771484375, 4.0546875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 19.0, 25.0, 29.0, 42.0, 86.0, 87.0, 154.0, 245.0, 319.0, 537.0, 887.0, 1552.0, 3163.0, 8931.0, 44580.0, 470282.0, 3092475.0, 506955.0, 46767.0, 9361.0, 3331.0, 1624.0, 946.0, 556.0, 409.0, 237.0, 196.0, 128.0, 97.0, 70.0, 49.0, 34.0, 32.0, 18.0, 12.0, 7.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -15.672119140625, -15.14111328125, -14.610107421875, -14.0791015625, -13.548095703125, -13.01708984375, -12.486083984375, -11.955078125, -11.424072265625, -10.89306640625, -10.362060546875, -9.8310546875, -9.300048828125, -8.76904296875, -8.238037109375, -7.70703125, -7.176025390625, -6.64501953125, -6.114013671875, -5.5830078125, -5.052001953125, -4.52099609375, -3.989990234375, -3.458984375, -2.927978515625, -2.39697265625, -1.865966796875, -1.3349609375, -0.803955078125, -0.27294921875, 0.258056640625, 0.7890625, 1.320068359375, 1.85107421875, 2.382080078125, 2.9130859375, 3.444091796875, 3.97509765625, 4.506103515625, 5.037109375, 5.568115234375, 6.09912109375, 6.630126953125, 7.1611328125, 7.692138671875, 8.22314453125, 8.754150390625, 9.28515625, 9.816162109375, 10.34716796875, 10.878173828125, 11.4091796875, 11.940185546875, 12.47119140625, 13.002197265625, 13.533203125, 14.064208984375, 14.59521484375, 15.126220703125, 15.6572265625, 16.188232421875, 16.71923828125, 17.250244140625, 17.78125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 9.0, 18.0, 15.0, 21.0, 35.0, 39.0, 59.0, 77.0, 106.0, 140.0, 212.0, 250.0, 351.0, 402.0, 468.0, 452.0, 366.0, 296.0, 194.0, 146.0, 108.0, 72.0, 40.0, 46.0, 27.0, 26.0, 24.0, 16.0, 8.0, 12.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0390625, -11.6700439453125, -11.301025390625, -10.9320068359375, -10.56298828125, -10.1939697265625, -9.824951171875, -9.4559326171875, -9.0869140625, -8.7178955078125, -8.348876953125, -7.9798583984375, -7.61083984375, -7.2418212890625, -6.872802734375, -6.5037841796875, -6.134765625, -5.7657470703125, -5.396728515625, -5.0277099609375, -4.65869140625, -4.2896728515625, -3.920654296875, -3.5516357421875, -3.1826171875, -2.8135986328125, -2.444580078125, -2.0755615234375, -1.70654296875, -1.3375244140625, -0.968505859375, -0.5994873046875, -0.23046875, 0.1385498046875, 0.507568359375, 0.8765869140625, 1.24560546875, 1.6146240234375, 1.983642578125, 2.3526611328125, 2.7216796875, 3.0906982421875, 3.459716796875, 3.8287353515625, 4.19775390625, 4.5667724609375, 4.935791015625, 5.3048095703125, 5.673828125, 6.0428466796875, 6.411865234375, 6.7808837890625, 7.14990234375, 7.5189208984375, 7.887939453125, 8.2569580078125, 8.6259765625, 8.9949951171875, 9.364013671875, 9.7330322265625, 10.10205078125, 10.4710693359375, 10.840087890625, 11.2091064453125, 11.578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 10.0, 10.0, 18.0, 10.0, 32.0, 36.0, 72.0, 98.0, 178.0, 276.0, 511.0, 1008.0, 2188.0, 4855.0, 12500.0, 40141.0, 168448.0, 858181.0, 2189825.0, 719226.0, 142075.0, 34939.0, 11209.0, 4357.0, 1980.0, 913.0, 445.0, 290.0, 177.0, 85.0, 49.0, 43.0, 33.0, 16.0, 12.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.25, -16.701416015625, -16.15283203125, -15.604248046875, -15.0556640625, -14.507080078125, -13.95849609375, -13.409912109375, -12.861328125, -12.312744140625, -11.76416015625, -11.215576171875, -10.6669921875, -10.118408203125, -9.56982421875, -9.021240234375, -8.47265625, -7.924072265625, -7.37548828125, -6.826904296875, -6.2783203125, -5.729736328125, -5.18115234375, -4.632568359375, -4.083984375, -3.535400390625, -2.98681640625, -2.438232421875, -1.8896484375, -1.341064453125, -0.79248046875, -0.243896484375, 0.3046875, 0.853271484375, 1.40185546875, 1.950439453125, 2.4990234375, 3.047607421875, 3.59619140625, 4.144775390625, 4.693359375, 5.241943359375, 5.79052734375, 6.339111328125, 6.8876953125, 7.436279296875, 7.98486328125, 8.533447265625, 9.08203125, 9.630615234375, 10.17919921875, 10.727783203125, 11.2763671875, 11.824951171875, 12.37353515625, 12.922119140625, 13.470703125, 14.019287109375, 14.56787109375, 15.116455078125, 15.6650390625, 16.213623046875, 16.76220703125, 17.310791015625, 17.859375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 24.0, 125.0, 344.0, 342.0, 147.0, 23.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.22175216674805, -47.50830841064453, -40.79486083984375, -34.081417083740234, -27.36797332763672, -20.654529571533203, -13.941082000732422, -7.227638244628906, -0.5141944885253906, 6.199250221252441, 12.912694931030273, 19.626140594482422, 26.339584350585938, 33.05302810668945, 39.766475677490234, 46.47991943359375, 53.193363189697266, 59.90680694580078, 66.62025451660156, 73.33369445800781, 80.0471420288086, 86.76058959960938, 93.47402954101562, 100.1874771118164, 106.90092468261719, 113.61437225341797, 120.32781219482422, 127.041259765625, 133.75469970703125, 140.4681396484375, 147.1815948486328, 153.89503479003906, 160.60848999023438, 167.32192993164062, 174.03538513183594, 180.7488250732422, 187.46226501464844, 194.17572021484375, 200.88916015625, 207.60260009765625, 214.3160400390625, 221.02947998046875, 227.74293518066406, 234.4563751220703, 241.16981506347656, 247.88327026367188, 254.59671020507812, 261.3101501464844, 268.02362060546875, 274.737060546875, 281.45050048828125, 288.1639404296875, 294.8774108886719, 301.5908508300781, 308.3042907714844, 315.0177307128906, 321.7311706542969, 328.4446105957031, 335.1580505371094, 341.87152099609375, 348.5849609375, 355.29840087890625, 362.0118408203125, 368.72528076171875, 375.438720703125]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 13.0, 4.0, 11.0, 9.0, 21.0, 16.0, 24.0, 26.0, 21.0, 33.0, 35.0, 25.0, 31.0, 36.0, 38.0, 40.0, 44.0, 39.0, 40.0, 36.0, 35.0, 35.0, 37.0, 34.0, 33.0, 33.0, 27.0, 26.0, 23.0, 24.0, 28.0, 22.0, 20.0, 8.0, 12.0, 9.0, 8.0, 10.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.07294464111328, -32.90985107421875, -31.74675750732422, -30.583663940429688, -29.420570373535156, -28.257476806640625, -27.09438133239746, -25.93128776550293, -24.7681941986084, -23.605100631713867, -22.442007064819336, -21.278913497924805, -20.11581802368164, -18.95272445678711, -17.789630889892578, -16.626537322998047, -15.463443756103516, -14.300350189208984, -13.137256622314453, -11.974162101745605, -10.811068534851074, -9.647974967956543, -8.484880447387695, -7.321786880493164, -6.158693313598633, -4.995599746704102, -3.832505702972412, -2.6694118976593018, -1.5063180923461914, -0.34322452545166016, 0.8198695182800293, 1.9829635620117188, 3.14605712890625, 4.309150695800781, 5.472244739532471, 6.63533878326416, 7.798432350158691, 8.961525917053223, 10.12462043762207, 11.287714004516602, 12.450807571411133, 13.613901138305664, 14.776994705200195, 15.940089225769043, 17.10318374633789, 18.266277313232422, 19.429370880126953, 20.592464447021484, 21.755558013916016, 22.918651580810547, 24.081745147705078, 25.24483871459961, 26.40793228149414, 27.571025848388672, 28.734121322631836, 29.897214889526367, 31.0603084564209, 32.22340393066406, 33.386497497558594, 34.549591064453125, 35.712684631347656, 36.87577819824219, 38.03887176513672, 39.20196533203125, 40.36505889892578]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 8.0, 11.0, 11.0, 17.0, 18.0, 20.0, 20.0, 30.0, 29.0, 44.0, 47.0, 40.0, 39.0, 35.0, 47.0, 38.0, 51.0, 55.0, 49.0, 38.0, 41.0, 37.0, 38.0, 31.0, 35.0, 20.0, 19.0, 18.0, 15.0, 13.0, 13.0, 8.0, 3.0, 6.0, 2.0, 9.0, 9.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.243133544921875, -4.11517333984375, -3.987213134765625, -3.8592529296875, -3.731292724609375, -3.60333251953125, -3.475372314453125, -3.347412109375, -3.219451904296875, -3.09149169921875, -2.963531494140625, -2.8355712890625, -2.707611083984375, -2.57965087890625, -2.451690673828125, -2.32373046875, -2.195770263671875, -2.06781005859375, -1.939849853515625, -1.8118896484375, -1.683929443359375, -1.55596923828125, -1.428009033203125, -1.300048828125, -1.172088623046875, -1.04412841796875, -0.916168212890625, -0.7882080078125, -0.660247802734375, -0.53228759765625, -0.404327392578125, -0.2763671875, -0.148406982421875, -0.02044677734375, 0.107513427734375, 0.2354736328125, 0.363433837890625, 0.49139404296875, 0.619354248046875, 0.747314453125, 0.875274658203125, 1.00323486328125, 1.131195068359375, 1.2591552734375, 1.387115478515625, 1.51507568359375, 1.643035888671875, 1.77099609375, 1.898956298828125, 2.02691650390625, 2.154876708984375, 2.2828369140625, 2.410797119140625, 2.53875732421875, 2.666717529296875, 2.794677734375, 2.922637939453125, 3.05059814453125, 3.178558349609375, 3.3065185546875, 3.434478759765625, 3.56243896484375, 3.690399169921875, 3.818359375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 4.0, 15.0, 12.0, 21.0, 31.0, 49.0, 64.0, 83.0, 145.0, 214.0, 324.0, 529.0, 983.0, 1749.0, 3469.0, 7696.0, 18672.0, 49866.0, 126713.0, 253750.0, 291768.0, 172353.0, 72151.0, 27308.0, 10732.0, 4690.0, 2183.0, 1128.0, 643.0, 425.0, 256.0, 166.0, 113.0, 77.0, 49.0, 34.0, 22.0, 20.0, 13.0, 15.0, 10.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.146484375, -2.077667236328125, -2.00885009765625, -1.940032958984375, -1.8712158203125, -1.802398681640625, -1.73358154296875, -1.664764404296875, -1.595947265625, -1.527130126953125, -1.45831298828125, -1.389495849609375, -1.3206787109375, -1.251861572265625, -1.18304443359375, -1.114227294921875, -1.04541015625, -0.976593017578125, -0.90777587890625, -0.838958740234375, -0.7701416015625, -0.701324462890625, -0.63250732421875, -0.563690185546875, -0.494873046875, -0.426055908203125, -0.35723876953125, -0.288421630859375, -0.2196044921875, -0.150787353515625, -0.08197021484375, -0.013153076171875, 0.0556640625, 0.124481201171875, 0.19329833984375, 0.262115478515625, 0.3309326171875, 0.399749755859375, 0.46856689453125, 0.537384033203125, 0.606201171875, 0.675018310546875, 0.74383544921875, 0.812652587890625, 0.8814697265625, 0.950286865234375, 1.01910400390625, 1.087921142578125, 1.15673828125, 1.225555419921875, 1.29437255859375, 1.363189697265625, 1.4320068359375, 1.500823974609375, 1.56964111328125, 1.638458251953125, 1.707275390625, 1.776092529296875, 1.84490966796875, 1.913726806640625, 1.9825439453125, 2.051361083984375, 2.12017822265625, 2.188995361328125, 2.2578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 7.0, 13.0, 9.0, 12.0, 14.0, 17.0, 14.0, 20.0, 22.0, 20.0, 26.0, 21.0, 31.0, 42.0, 46.0, 28.0, 47.0, 32.0, 1065.0, 35.0, 41.0, 46.0, 46.0, 27.0, 40.0, 36.0, 44.0, 23.0, 28.0, 21.0, 21.0, 24.0, 14.0, 15.0, 9.0, 12.0, 10.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.791015625, -2.700592041015625, -2.61016845703125, -2.519744873046875, -2.4293212890625, -2.338897705078125, -2.24847412109375, -2.158050537109375, -2.067626953125, -1.977203369140625, -1.88677978515625, -1.796356201171875, -1.7059326171875, -1.615509033203125, -1.52508544921875, -1.434661865234375, -1.34423828125, -1.253814697265625, -1.16339111328125, -1.072967529296875, -0.9825439453125, -0.892120361328125, -0.80169677734375, -0.711273193359375, -0.620849609375, -0.530426025390625, -0.44000244140625, -0.349578857421875, -0.2591552734375, -0.168731689453125, -0.07830810546875, 0.012115478515625, 0.1025390625, 0.192962646484375, 0.28338623046875, 0.373809814453125, 0.4642333984375, 0.554656982421875, 0.64508056640625, 0.735504150390625, 0.825927734375, 0.916351318359375, 1.00677490234375, 1.097198486328125, 1.1876220703125, 1.278045654296875, 1.36846923828125, 1.458892822265625, 1.54931640625, 1.639739990234375, 1.73016357421875, 1.820587158203125, 1.9110107421875, 2.001434326171875, 2.09185791015625, 2.182281494140625, 2.272705078125, 2.363128662109375, 2.45355224609375, 2.543975830078125, 2.6343994140625, 2.724822998046875, 2.81524658203125, 2.905670166015625, 2.99609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 10.0, 10.0, 10.0, 16.0, 19.0, 33.0, 41.0, 63.0, 78.0, 108.0, 157.0, 218.0, 338.0, 536.0, 810.0, 1365.0, 2281.0, 3569.0, 6116.0, 9854.0, 16432.0, 29869.0, 132544.0, 1812690.0, 33438.0, 18438.0, 10782.0, 6547.0, 4088.0, 2477.0, 1511.0, 927.0, 579.0, 359.0, 270.0, 144.0, 112.0, 80.0, 43.0, 43.0, 29.0, 20.0, 23.0, 15.0, 12.0, 3.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9501953125, -1.8853912353515625, -1.820587158203125, -1.7557830810546875, -1.69097900390625, -1.6261749267578125, -1.561370849609375, -1.4965667724609375, -1.4317626953125, -1.3669586181640625, -1.302154541015625, -1.2373504638671875, -1.17254638671875, -1.1077423095703125, -1.042938232421875, -0.9781341552734375, -0.913330078125, -0.8485260009765625, -0.783721923828125, -0.7189178466796875, -0.65411376953125, -0.5893096923828125, -0.524505615234375, -0.4597015380859375, -0.3948974609375, -0.3300933837890625, -0.265289306640625, -0.2004852294921875, -0.13568115234375, -0.0708770751953125, -0.006072998046875, 0.0587310791015625, 0.12353515625, 0.1883392333984375, 0.253143310546875, 0.3179473876953125, 0.38275146484375, 0.4475555419921875, 0.512359619140625, 0.5771636962890625, 0.6419677734375, 0.7067718505859375, 0.771575927734375, 0.8363800048828125, 0.90118408203125, 0.9659881591796875, 1.030792236328125, 1.0955963134765625, 1.160400390625, 1.2252044677734375, 1.290008544921875, 1.3548126220703125, 1.41961669921875, 1.4844207763671875, 1.549224853515625, 1.6140289306640625, 1.6788330078125, 1.7436370849609375, 1.808441162109375, 1.8732452392578125, 1.93804931640625, 2.0028533935546875, 2.067657470703125, 2.1324615478515625, 2.197265625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 6.0, 4.0, 6.0, 2.0, 6.0, 7.0, 10.0, 7.0, 18.0, 16.0, 24.0, 24.0, 38.0, 27.0, 41.0, 43.0, 43.0, 51.0, 39.0, 44.0, 59.0, 59.0, 56.0, 36.0, 43.0, 27.0, 42.0, 28.0, 33.0, 25.0, 16.0, 12.0, 14.0, 8.0, 10.0, 7.0, 10.0, 3.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.11700439453125, -0.11348247528076172, -0.10996055603027344, -0.10643863677978516, -0.10291671752929688, -0.0993947982788086, -0.09587287902832031, -0.09235095977783203, -0.08882904052734375, -0.08530712127685547, -0.08178520202636719, -0.0782632827758789, -0.07474136352539062, -0.07121944427490234, -0.06769752502441406, -0.06417560577392578, -0.0606536865234375, -0.05713176727294922, -0.05360984802246094, -0.050087928771972656, -0.046566009521484375, -0.043044090270996094, -0.03952217102050781, -0.03600025177001953, -0.03247833251953125, -0.02895641326904297, -0.025434494018554688, -0.021912574768066406, -0.018390655517578125, -0.014868736267089844, -0.011346817016601562, -0.007824897766113281, -0.004302978515625, -0.0007810592651367188, 0.0027408599853515625, 0.006262779235839844, 0.009784698486328125, 0.013306617736816406, 0.016828536987304688, 0.02035045623779297, 0.02387237548828125, 0.02739429473876953, 0.030916213989257812, 0.034438133239746094, 0.037960052490234375, 0.041481971740722656, 0.04500389099121094, 0.04852581024169922, 0.0520477294921875, 0.05556964874267578, 0.05909156799316406, 0.06261348724365234, 0.06613540649414062, 0.0696573257446289, 0.07317924499511719, 0.07670116424560547, 0.08022308349609375, 0.08374500274658203, 0.08726692199707031, 0.0907888412475586, 0.09431076049804688, 0.09783267974853516, 0.10135459899902344, 0.10487651824951172, 0.1083984375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 6.0, 7.0, 8.0, 10.0, 13.0, 15.0, 15.0, 18.0, 23.0, 18.0, 20.0, 26.0, 24.0, 46.0, 59.0, 65.0, 90.0, 111.0, 132.0, 146.0, 209.0, 348.0, 667.0, 7221.0, 797453.0, 237050.0, 2925.0, 554.0, 223.0, 187.0, 160.0, 131.0, 95.0, 65.0, 73.0, 60.0, 41.0, 39.0, 24.0, 21.0, 22.0, 20.0, 11.0, 19.0, 9.0, 15.0, 6.0, 17.0, 10.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6953125, -1.6403961181640625, -1.585479736328125, -1.5305633544921875, -1.47564697265625, -1.4207305908203125, -1.365814208984375, -1.3108978271484375, -1.2559814453125, -1.2010650634765625, -1.146148681640625, -1.0912322998046875, -1.03631591796875, -0.9813995361328125, -0.926483154296875, -0.8715667724609375, -0.816650390625, -0.7617340087890625, -0.706817626953125, -0.6519012451171875, -0.59698486328125, -0.5420684814453125, -0.487152099609375, -0.4322357177734375, -0.3773193359375, -0.3224029541015625, -0.267486572265625, -0.2125701904296875, -0.15765380859375, -0.1027374267578125, -0.047821044921875, 0.0070953369140625, 0.06201171875, 0.1169281005859375, 0.171844482421875, 0.2267608642578125, 0.28167724609375, 0.3365936279296875, 0.391510009765625, 0.4464263916015625, 0.5013427734375, 0.5562591552734375, 0.611175537109375, 0.6660919189453125, 0.72100830078125, 0.7759246826171875, 0.830841064453125, 0.8857574462890625, 0.940673828125, 0.9955902099609375, 1.050506591796875, 1.1054229736328125, 1.16033935546875, 1.2152557373046875, 1.270172119140625, 1.3250885009765625, 1.3800048828125, 1.4349212646484375, 1.489837646484375, 1.5447540283203125, 1.59967041015625, 1.6545867919921875, 1.709503173828125, 1.7644195556640625, 1.8193359375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 44.0, 884.0, 85.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.934218406677246, -9.745674133300781, -9.55712890625, -9.368584632873535, -9.180039405822754, -8.991495132446289, -8.802950859069824, -8.614405632019043, -8.425861358642578, -8.237317085266113, -8.048771858215332, -7.860227584838867, -7.671682834625244, -7.483138084411621, -7.294593334197998, -7.106048583984375, -6.91750431060791, -6.728959560394287, -6.540414810180664, -6.351870536804199, -6.163325786590576, -5.974781036376953, -5.78623628616333, -5.597691535949707, -5.409146785736084, -5.220602035522461, -5.032057285308838, -4.843513011932373, -4.65496826171875, -4.466423511505127, -4.277878761291504, -4.089334487915039, -3.900789737701416, -3.712244987487793, -3.523700475692749, -3.335155725479126, -3.146611213684082, -2.958066463470459, -2.769521713256836, -2.580977201461792, -2.392432689666748, -2.203887939453125, -2.015343427658081, -1.826798677444458, -1.638254165649414, -1.449709415435791, -1.2611647844314575, -1.072620153427124, -0.884075403213501, -0.6955307722091675, -0.506986141204834, -0.3184414505958557, -0.12989681959152222, 0.05864781141281128, 0.24719250202178955, 0.43573713302612305, 0.6242817640304565, 0.81282639503479, 1.0013710260391235, 1.189915657043457, 1.37846040725708, 1.567004919052124, 1.755549669265747, 1.9440943002700806, 2.132638931274414]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 13.0, 16.0, 21.0, 30.0, 18.0, 28.0, 33.0, 56.0, 46.0, 54.0, 58.0, 52.0, 52.0, 54.0, 52.0, 55.0, 45.0, 39.0, 39.0, 41.0, 44.0, 35.0, 23.0, 14.0, 18.0, 16.0, 9.0, 6.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6986128091812134, -0.6745948195457458, -0.6505767703056335, -0.626558780670166, -0.6025407314300537, -0.5785227417945862, -0.5545047521591187, -0.5304867029190063, -0.5064687132835388, -0.4824506938457489, -0.458432674407959, -0.43441468477249146, -0.41039666533470154, -0.3863786458969116, -0.3623606562614441, -0.3383426368236542, -0.31432461738586426, -0.29030659794807434, -0.2662885785102844, -0.2422705888748169, -0.21825256943702698, -0.19423454999923706, -0.17021654546260834, -0.14619854092597961, -0.1221805214881897, -0.09816250950098038, -0.07414449751377106, -0.05012648552656174, -0.026108473539352417, -0.002090461552143097, 0.021927550435066223, 0.045945554971694946, 0.06996357440948486, 0.09398158639669418, 0.1179995983839035, 0.14201760292053223, 0.16603562235832214, 0.19005364179611206, 0.21407164633274078, 0.2380896508693695, 0.2621076703071594, 0.28612568974494934, 0.31014370918273926, 0.3341616988182068, 0.3581797182559967, 0.3821977376937866, 0.40621572732925415, 0.43023374676704407, 0.454251766204834, 0.4782697856426239, 0.5022878050804138, 0.5263057947158813, 0.5503238439559937, 0.5743418335914612, 0.5983598232269287, 0.622377872467041, 0.6463958621025085, 0.6704138517379761, 0.6944319009780884, 0.7184498906135559, 0.7424678802490234, 0.7664859294891357, 0.7905039191246033, 0.8145219087600708, 0.8385399580001831]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 6.0, 7.0, 12.0, 13.0, 13.0, 18.0, 26.0, 25.0, 25.0, 30.0, 37.0, 23.0, 46.0, 49.0, 47.0, 50.0, 43.0, 53.0, 55.0, 42.0, 51.0, 55.0, 33.0, 29.0, 30.0, 25.0, 27.0, 28.0, 12.0, 14.0, 16.0, 11.0, 10.0, 6.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.60546875, -4.47021484375, -4.3349609375, -4.19970703125, -4.064453125, -3.92919921875, -3.7939453125, -3.65869140625, -3.5234375, -3.38818359375, -3.2529296875, -3.11767578125, -2.982421875, -2.84716796875, -2.7119140625, -2.57666015625, -2.44140625, -2.30615234375, -2.1708984375, -2.03564453125, -1.900390625, -1.76513671875, -1.6298828125, -1.49462890625, -1.359375, -1.22412109375, -1.0888671875, -0.95361328125, -0.818359375, -0.68310546875, -0.5478515625, -0.41259765625, -0.27734375, -0.14208984375, -0.0068359375, 0.12841796875, 0.263671875, 0.39892578125, 0.5341796875, 0.66943359375, 0.8046875, 0.93994140625, 1.0751953125, 1.21044921875, 1.345703125, 1.48095703125, 1.6162109375, 1.75146484375, 1.88671875, 2.02197265625, 2.1572265625, 2.29248046875, 2.427734375, 2.56298828125, 2.6982421875, 2.83349609375, 2.96875, 3.10400390625, 3.2392578125, 3.37451171875, 3.509765625, 3.64501953125, 3.7802734375, 3.91552734375, 4.05078125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 7.0, 10.0, 13.0, 25.0, 20.0, 34.0, 45.0, 61.0, 114.0, 172.0, 302.0, 491.0, 967.0, 1769.0, 3824.0, 8506.0, 20224.0, 52389.0, 150088.0, 364488.0, 280467.0, 101406.0, 36089.0, 14691.0, 6457.0, 2806.0, 1301.0, 730.0, 377.0, 207.0, 139.0, 110.0, 61.0, 31.0, 39.0, 17.0, 17.0, 17.0, 8.0, 4.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.23828125, -6.03582763671875, -5.8333740234375, -5.63092041015625, -5.428466796875, -5.22601318359375, -5.0235595703125, -4.82110595703125, -4.61865234375, -4.41619873046875, -4.2137451171875, -4.01129150390625, -3.808837890625, -3.60638427734375, -3.4039306640625, -3.20147705078125, -2.9990234375, -2.79656982421875, -2.5941162109375, -2.39166259765625, -2.189208984375, -1.98675537109375, -1.7843017578125, -1.58184814453125, -1.37939453125, -1.17694091796875, -0.9744873046875, -0.77203369140625, -0.569580078125, -0.36712646484375, -0.1646728515625, 0.03778076171875, 0.240234375, 0.44268798828125, 0.6451416015625, 0.84759521484375, 1.050048828125, 1.25250244140625, 1.4549560546875, 1.65740966796875, 1.85986328125, 2.06231689453125, 2.2647705078125, 2.46722412109375, 2.669677734375, 2.87213134765625, 3.0745849609375, 3.27703857421875, 3.4794921875, 3.68194580078125, 3.8843994140625, 4.08685302734375, 4.289306640625, 4.49176025390625, 4.6942138671875, 4.89666748046875, 5.09912109375, 5.30157470703125, 5.5040283203125, 5.70648193359375, 5.908935546875, 6.11138916015625, 6.3138427734375, 6.51629638671875, 6.71875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 6.0, 10.0, 13.0, 24.0, 19.0, 34.0, 30.0, 38.0, 33.0, 41.0, 47.0, 57.0, 82.0, 139.0, 282.0, 1438.0, 220.0, 106.0, 70.0, 51.0, 43.0, 44.0, 36.0, 33.0, 29.0, 17.0, 18.0, 19.0, 17.0, 13.0, 9.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.59375, -17.031494140625, -16.46923828125, -15.906982421875, -15.3447265625, -14.782470703125, -14.22021484375, -13.657958984375, -13.095703125, -12.533447265625, -11.97119140625, -11.408935546875, -10.8466796875, -10.284423828125, -9.72216796875, -9.159912109375, -8.59765625, -8.035400390625, -7.47314453125, -6.910888671875, -6.3486328125, -5.786376953125, -5.22412109375, -4.661865234375, -4.099609375, -3.537353515625, -2.97509765625, -2.412841796875, -1.8505859375, -1.288330078125, -0.72607421875, -0.163818359375, 0.3984375, 0.960693359375, 1.52294921875, 2.085205078125, 2.6474609375, 3.209716796875, 3.77197265625, 4.334228515625, 4.896484375, 5.458740234375, 6.02099609375, 6.583251953125, 7.1455078125, 7.707763671875, 8.27001953125, 8.832275390625, 9.39453125, 9.956787109375, 10.51904296875, 11.081298828125, 11.6435546875, 12.205810546875, 12.76806640625, 13.330322265625, 13.892578125, 14.454833984375, 15.01708984375, 15.579345703125, 16.1416015625, 16.703857421875, 17.26611328125, 17.828369140625, 18.390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 6.0, 13.0, 18.0, 22.0, 25.0, 29.0, 38.0, 82.0, 83.0, 164.0, 280.0, 572.0, 1505.0, 5604.0, 53112.0, 2203297.0, 849879.0, 24908.0, 3719.0, 1130.0, 508.0, 262.0, 138.0, 80.0, 39.0, 45.0, 42.0, 26.0, 21.0, 9.0, 8.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.34375, -23.554931640625, -22.76611328125, -21.977294921875, -21.1884765625, -20.399658203125, -19.61083984375, -18.822021484375, -18.033203125, -17.244384765625, -16.45556640625, -15.666748046875, -14.8779296875, -14.089111328125, -13.30029296875, -12.511474609375, -11.72265625, -10.933837890625, -10.14501953125, -9.356201171875, -8.5673828125, -7.778564453125, -6.98974609375, -6.200927734375, -5.412109375, -4.623291015625, -3.83447265625, -3.045654296875, -2.2568359375, -1.468017578125, -0.67919921875, 0.109619140625, 0.8984375, 1.687255859375, 2.47607421875, 3.264892578125, 4.0537109375, 4.842529296875, 5.63134765625, 6.420166015625, 7.208984375, 7.997802734375, 8.78662109375, 9.575439453125, 10.3642578125, 11.153076171875, 11.94189453125, 12.730712890625, 13.51953125, 14.308349609375, 15.09716796875, 15.885986328125, 16.6748046875, 17.463623046875, 18.25244140625, 19.041259765625, 19.830078125, 20.618896484375, 21.40771484375, 22.196533203125, 22.9853515625, 23.774169921875, 24.56298828125, 25.351806640625, 26.140625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 21.0, 36.0, 101.0, 198.0, 246.0, 216.0, 130.0, 46.0, 12.0, 4.0, 3.0], "bins": [-113.09811401367188, -111.13611602783203, -109.17412567138672, -107.21212768554688, -105.25012969970703, -103.28813171386719, -101.32614135742188, -99.36414337158203, -97.40214538574219, -95.44014739990234, -93.47815704345703, -91.51615905761719, -89.55416107177734, -87.5921630859375, -85.63017272949219, -83.66817474365234, -81.70618438720703, -79.74418640136719, -77.78219604492188, -75.82019805908203, -73.85820007324219, -71.89620971679688, -69.93421173095703, -67.97221374511719, -66.01022338867188, -64.04822540283203, -62.08623123168945, -60.124237060546875, -58.16223907470703, -56.20024490356445, -54.238250732421875, -52.27625274658203, -50.31425476074219, -48.35226058959961, -46.390262603759766, -44.42826843261719, -42.466270446777344, -40.504276275634766, -38.54228210449219, -36.580284118652344, -34.618289947509766, -32.65629577636719, -30.694297790527344, -28.732303619384766, -26.770307540893555, -24.808311462402344, -22.846317291259766, -20.884321212768555, -18.922325134277344, -16.960329055786133, -14.998333930969238, -13.036338806152344, -11.074342727661133, -9.112346649169922, -7.150351524353027, -5.188356399536133, -3.226360321044922, -1.2643647193908691, 0.6976308822631836, 2.6596264839172363, 4.621622085571289, 6.5836181640625, 8.545613288879395, 10.507608413696289, 12.4696044921875]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 9.0, 13.0, 13.0, 12.0, 17.0, 15.0, 22.0, 17.0, 21.0, 14.0, 23.0, 14.0, 24.0, 30.0, 40.0, 37.0, 37.0, 36.0, 36.0, 42.0, 54.0, 35.0, 35.0, 35.0, 46.0, 33.0, 32.0, 30.0, 29.0, 15.0, 21.0, 25.0, 19.0, 11.0, 18.0, 13.0, 7.0, 10.0, 11.0, 6.0, 0.0, 9.0, 8.0, 6.0, 3.0, 0.0, 5.0, 2.0, 5.0, 1.0], "bins": [-51.478057861328125, -49.95014953613281, -48.4222412109375, -46.89433288574219, -45.36642074584961, -43.8385124206543, -42.310604095458984, -40.78269577026367, -39.254783630371094, -37.72687530517578, -36.19896697998047, -34.671058654785156, -33.14314651489258, -31.615238189697266, -30.087329864501953, -28.55942153930664, -27.031513214111328, -25.503604888916016, -23.97569465637207, -22.447786331176758, -20.919876098632812, -19.3919677734375, -17.864059448242188, -16.336151123046875, -14.80824089050293, -13.2803316116333, -11.752422332763672, -10.22451400756836, -8.69660472869873, -7.168695449829102, -5.640787124633789, -4.11287784576416, -2.5849685668945312, -1.0570595264434814, 0.47084951400756836, 1.998758316040039, 3.526667594909668, 5.054576873779297, 6.582485198974609, 8.110394477844238, 9.638303756713867, 11.166213035583496, 12.694122314453125, 14.222030639648438, 15.749939918518066, 17.277849197387695, 18.805757522583008, 20.333667755126953, 21.861576080322266, 23.389484405517578, 24.917394638061523, 26.445302963256836, 27.97321319580078, 29.501121520996094, 31.029029846191406, 32.55693817138672, 34.08484649658203, 35.612754821777344, 37.140663146972656, 38.66857147216797, 40.19648361206055, 41.72439193725586, 43.25230026245117, 44.780208587646484, 46.30812072753906]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 10.0, 10.0, 7.0, 6.0, 13.0, 8.0, 15.0, 17.0, 23.0, 23.0, 37.0, 33.0, 37.0, 35.0, 32.0, 51.0, 42.0, 42.0, 45.0, 39.0, 50.0, 48.0, 48.0, 44.0, 36.0, 43.0, 32.0, 22.0, 25.0, 30.0, 14.0, 18.0, 8.0, 11.0, 9.0, 8.0, 6.0, 5.0, 6.0, 3.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.9296875, -4.792755126953125, -4.65582275390625, -4.518890380859375, -4.3819580078125, -4.245025634765625, -4.10809326171875, -3.971160888671875, -3.834228515625, -3.697296142578125, -3.56036376953125, -3.423431396484375, -3.2864990234375, -3.149566650390625, -3.01263427734375, -2.875701904296875, -2.73876953125, -2.601837158203125, -2.46490478515625, -2.327972412109375, -2.1910400390625, -2.054107666015625, -1.91717529296875, -1.780242919921875, -1.643310546875, -1.506378173828125, -1.36944580078125, -1.232513427734375, -1.0955810546875, -0.958648681640625, -0.82171630859375, -0.684783935546875, -0.5478515625, -0.410919189453125, -0.27398681640625, -0.137054443359375, -0.0001220703125, 0.136810302734375, 0.27374267578125, 0.410675048828125, 0.547607421875, 0.684539794921875, 0.82147216796875, 0.958404541015625, 1.0953369140625, 1.232269287109375, 1.36920166015625, 1.506134033203125, 1.64306640625, 1.779998779296875, 1.91693115234375, 2.053863525390625, 2.1907958984375, 2.327728271484375, 2.46466064453125, 2.601593017578125, 2.738525390625, 2.875457763671875, 3.01239013671875, 3.149322509765625, 3.2862548828125, 3.423187255859375, 3.56011962890625, 3.697052001953125, 3.833984375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 9.0, 16.0, 24.0, 31.0, 54.0, 89.0, 116.0, 208.0, 329.0, 626.0, 1285.0, 3339.0, 13509.0, 167994.0, 3287310.0, 679150.0, 31504.0, 5141.0, 1709.0, 735.0, 465.0, 227.0, 121.0, 112.0, 56.0, 43.0, 27.0, 15.0, 8.0, 10.0, 3.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -23.008544921875, -22.28271484375, -21.556884765625, -20.8310546875, -20.105224609375, -19.37939453125, -18.653564453125, -17.927734375, -17.201904296875, -16.47607421875, -15.750244140625, -15.0244140625, -14.298583984375, -13.57275390625, -12.846923828125, -12.12109375, -11.395263671875, -10.66943359375, -9.943603515625, -9.2177734375, -8.491943359375, -7.76611328125, -7.040283203125, -6.314453125, -5.588623046875, -4.86279296875, -4.136962890625, -3.4111328125, -2.685302734375, -1.95947265625, -1.233642578125, -0.5078125, 0.218017578125, 0.94384765625, 1.669677734375, 2.3955078125, 3.121337890625, 3.84716796875, 4.572998046875, 5.298828125, 6.024658203125, 6.75048828125, 7.476318359375, 8.2021484375, 8.927978515625, 9.65380859375, 10.379638671875, 11.10546875, 11.831298828125, 12.55712890625, 13.282958984375, 14.0087890625, 14.734619140625, 15.46044921875, 16.186279296875, 16.912109375, 17.637939453125, 18.36376953125, 19.089599609375, 19.8154296875, 20.541259765625, 21.26708984375, 21.992919921875, 22.71875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 11.0, 8.0, 14.0, 12.0, 19.0, 31.0, 36.0, 58.0, 71.0, 99.0, 137.0, 192.0, 263.0, 312.0, 454.0, 464.0, 439.0, 346.0, 290.0, 189.0, 160.0, 138.0, 103.0, 55.0, 42.0, 23.0, 32.0, 18.0, 12.0, 10.0, 5.0, 7.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.7508544921875, -10.376708984375, -10.0025634765625, -9.62841796875, -9.2542724609375, -8.880126953125, -8.5059814453125, -8.1318359375, -7.7576904296875, -7.383544921875, -7.0093994140625, -6.63525390625, -6.2611083984375, -5.886962890625, -5.5128173828125, -5.138671875, -4.7645263671875, -4.390380859375, -4.0162353515625, -3.64208984375, -3.2679443359375, -2.893798828125, -2.5196533203125, -2.1455078125, -1.7713623046875, -1.397216796875, -1.0230712890625, -0.64892578125, -0.2747802734375, 0.099365234375, 0.4735107421875, 0.84765625, 1.2218017578125, 1.595947265625, 1.9700927734375, 2.34423828125, 2.7183837890625, 3.092529296875, 3.4666748046875, 3.8408203125, 4.2149658203125, 4.589111328125, 4.9632568359375, 5.33740234375, 5.7115478515625, 6.085693359375, 6.4598388671875, 6.833984375, 7.2081298828125, 7.582275390625, 7.9564208984375, 8.33056640625, 8.7047119140625, 9.078857421875, 9.4530029296875, 9.8271484375, 10.2012939453125, 10.575439453125, 10.9495849609375, 11.32373046875, 11.6978759765625, 12.072021484375, 12.4461669921875, 12.8203125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 5.0, 8.0, 12.0, 21.0, 35.0, 46.0, 70.0, 108.0, 224.0, 415.0, 895.0, 2101.0, 5507.0, 17406.0, 82729.0, 599830.0, 2557755.0, 790600.0, 104908.0, 21004.0, 6308.0, 2297.0, 1004.0, 438.0, 228.0, 112.0, 66.0, 38.0, 26.0, 16.0, 23.0, 9.0, 6.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.859375, -24.160400390625, -23.46142578125, -22.762451171875, -22.0634765625, -21.364501953125, -20.66552734375, -19.966552734375, -19.267578125, -18.568603515625, -17.86962890625, -17.170654296875, -16.4716796875, -15.772705078125, -15.07373046875, -14.374755859375, -13.67578125, -12.976806640625, -12.27783203125, -11.578857421875, -10.8798828125, -10.180908203125, -9.48193359375, -8.782958984375, -8.083984375, -7.385009765625, -6.68603515625, -5.987060546875, -5.2880859375, -4.589111328125, -3.89013671875, -3.191162109375, -2.4921875, -1.793212890625, -1.09423828125, -0.395263671875, 0.3037109375, 1.002685546875, 1.70166015625, 2.400634765625, 3.099609375, 3.798583984375, 4.49755859375, 5.196533203125, 5.8955078125, 6.594482421875, 7.29345703125, 7.992431640625, 8.69140625, 9.390380859375, 10.08935546875, 10.788330078125, 11.4873046875, 12.186279296875, 12.88525390625, 13.584228515625, 14.283203125, 14.982177734375, 15.68115234375, 16.380126953125, 17.0791015625, 17.778076171875, 18.47705078125, 19.176025390625, 19.875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 11.0, 49.0, 90.0, 174.0, 195.0, 221.0, 154.0, 67.0, 26.0, 14.0, 6.0, 0.0, 0.0, 1.0], "bins": [-230.38401794433594, -226.18824768066406, -221.9924774169922, -217.7967071533203, -213.60093688964844, -209.40516662597656, -205.2093963623047, -201.0136260986328, -196.81785583496094, -192.62208557128906, -188.4263153076172, -184.2305450439453, -180.03477478027344, -175.83900451660156, -171.6432342529297, -167.4474639892578, -163.25169372558594, -159.05592346191406, -154.8601531982422, -150.6643829345703, -146.46861267089844, -142.27284240722656, -138.0770721435547, -133.8813018798828, -129.68553161621094, -125.48976135253906, -121.29399108886719, -117.09822082519531, -112.90245056152344, -108.70668029785156, -104.51091003417969, -100.31513977050781, -96.11936950683594, -91.92359924316406, -87.72782897949219, -83.53205871582031, -79.33628845214844, -75.14051818847656, -70.94474792480469, -66.74897766113281, -62.55320739746094, -58.35743713378906, -54.16166687011719, -49.96589660644531, -45.77012634277344, -41.57435607910156, -37.37858581542969, -33.18281555175781, -28.987045288085938, -24.791275024414062, -20.595504760742188, -16.399734497070312, -12.203964233398438, -8.008193969726562, -3.8124237060546875, 0.3833465576171875, 4.5791168212890625, 8.774887084960938, 12.970657348632812, 17.166427612304688, 21.362197875976562, 25.557968139648438, 29.753738403320312, 33.94950866699219, 38.14527893066406]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 4.0, 8.0, 7.0, 7.0, 8.0, 9.0, 10.0, 17.0, 19.0, 22.0, 24.0, 20.0, 24.0, 28.0, 38.0, 33.0, 34.0, 30.0, 36.0, 35.0, 42.0, 48.0, 37.0, 26.0, 34.0, 37.0, 32.0, 19.0, 31.0, 37.0, 28.0, 21.0, 24.0, 17.0, 18.0, 24.0, 21.0, 20.0, 18.0, 10.0, 8.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.611610412597656, -33.46760559082031, -32.32360076904297, -31.179597854614258, -30.035594940185547, -28.891590118408203, -27.74758529663086, -26.603580474853516, -25.459577560424805, -24.31557273864746, -23.17156982421875, -22.027565002441406, -20.883560180664062, -19.73955726623535, -18.595552444458008, -17.451549530029297, -16.307544708251953, -15.163540840148926, -14.019536972045898, -12.875532150268555, -11.731528282165527, -10.5875244140625, -9.443519592285156, -8.299515724182129, -7.155511856079102, -6.011507987976074, -4.867503643035889, -3.7234995365142822, -2.579495429992676, -1.4354915618896484, -0.2914872169494629, 0.8525171279907227, 1.9965248107910156, 3.140528917312622, 4.2845330238342285, 5.428537368774414, 6.572541236877441, 7.716545104980469, 8.860549926757812, 10.00455379486084, 11.148557662963867, 12.292561531066895, 13.436565399169922, 14.580570220947266, 15.724574089050293, 16.86857795715332, 18.012582778930664, 19.156585693359375, 20.30059051513672, 21.444595336914062, 22.588598251342773, 23.732603073120117, 24.876605987548828, 26.020610809326172, 27.164615631103516, 28.30862045288086, 29.45262336730957, 30.596628189086914, 31.740631103515625, 32.88463592529297, 34.02864074707031, 35.172645568847656, 36.316646575927734, 37.46065139770508, 38.60465621948242]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 5.0, 7.0, 7.0, 15.0, 22.0, 15.0, 20.0, 26.0, 17.0, 40.0, 47.0, 51.0, 37.0, 30.0, 43.0, 51.0, 52.0, 48.0, 46.0, 41.0, 57.0, 45.0, 37.0, 33.0, 24.0, 35.0, 23.0, 13.0, 20.0, 18.0, 15.0, 5.0, 8.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.49609375, -5.34246826171875, -5.1888427734375, -5.03521728515625, -4.881591796875, -4.72796630859375, -4.5743408203125, -4.42071533203125, -4.26708984375, -4.11346435546875, -3.9598388671875, -3.80621337890625, -3.652587890625, -3.49896240234375, -3.3453369140625, -3.19171142578125, -3.0380859375, -2.88446044921875, -2.7308349609375, -2.57720947265625, -2.423583984375, -2.26995849609375, -2.1163330078125, -1.96270751953125, -1.80908203125, -1.65545654296875, -1.5018310546875, -1.34820556640625, -1.194580078125, -1.04095458984375, -0.8873291015625, -0.73370361328125, -0.580078125, -0.42645263671875, -0.2728271484375, -0.11920166015625, 0.034423828125, 0.18804931640625, 0.3416748046875, 0.49530029296875, 0.64892578125, 0.80255126953125, 0.9561767578125, 1.10980224609375, 1.263427734375, 1.41705322265625, 1.5706787109375, 1.72430419921875, 1.8779296875, 2.03155517578125, 2.1851806640625, 2.33880615234375, 2.492431640625, 2.64605712890625, 2.7996826171875, 2.95330810546875, 3.10693359375, 3.26055908203125, 3.4141845703125, 3.56781005859375, 3.721435546875, 3.87506103515625, 4.0286865234375, 4.18231201171875, 4.3359375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 5.0, 12.0, 10.0, 10.0, 26.0, 35.0, 49.0, 68.0, 98.0, 145.0, 249.0, 337.0, 570.0, 947.0, 1729.0, 3536.0, 7395.0, 16626.0, 39082.0, 90581.0, 181705.0, 263652.0, 221637.0, 122255.0, 54721.0, 23057.0, 9927.0, 4560.0, 2256.0, 1286.0, 701.0, 413.0, 311.0, 168.0, 110.0, 101.0, 50.0, 45.0, 27.0, 10.0, 15.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.248046875, -2.179290771484375, -2.11053466796875, -2.041778564453125, -1.9730224609375, -1.904266357421875, -1.83551025390625, -1.766754150390625, -1.697998046875, -1.629241943359375, -1.56048583984375, -1.491729736328125, -1.4229736328125, -1.354217529296875, -1.28546142578125, -1.216705322265625, -1.14794921875, -1.079193115234375, -1.01043701171875, -0.941680908203125, -0.8729248046875, -0.804168701171875, -0.73541259765625, -0.666656494140625, -0.597900390625, -0.529144287109375, -0.46038818359375, -0.391632080078125, -0.3228759765625, -0.254119873046875, -0.18536376953125, -0.116607666015625, -0.0478515625, 0.020904541015625, 0.08966064453125, 0.158416748046875, 0.2271728515625, 0.295928955078125, 0.36468505859375, 0.433441162109375, 0.502197265625, 0.570953369140625, 0.63970947265625, 0.708465576171875, 0.7772216796875, 0.845977783203125, 0.91473388671875, 0.983489990234375, 1.05224609375, 1.121002197265625, 1.18975830078125, 1.258514404296875, 1.3272705078125, 1.396026611328125, 1.46478271484375, 1.533538818359375, 1.602294921875, 1.671051025390625, 1.73980712890625, 1.808563232421875, 1.8773193359375, 1.946075439453125, 2.01483154296875, 2.083587646484375, 2.15234375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 14.0, 13.0, 9.0, 17.0, 30.0, 15.0, 28.0, 28.0, 28.0, 29.0, 30.0, 35.0, 46.0, 38.0, 36.0, 36.0, 34.0, 42.0, 1057.0, 46.0, 46.0, 42.0, 40.0, 39.0, 27.0, 37.0, 30.0, 26.0, 19.0, 11.0, 17.0, 18.0, 9.0, 9.0, 8.0, 6.0, 3.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.93359375, -3.8243408203125, -3.715087890625, -3.6058349609375, -3.49658203125, -3.3873291015625, -3.278076171875, -3.1688232421875, -3.0595703125, -2.9503173828125, -2.841064453125, -2.7318115234375, -2.62255859375, -2.5133056640625, -2.404052734375, -2.2947998046875, -2.185546875, -2.0762939453125, -1.967041015625, -1.8577880859375, -1.74853515625, -1.6392822265625, -1.530029296875, -1.4207763671875, -1.3115234375, -1.2022705078125, -1.093017578125, -0.9837646484375, -0.87451171875, -0.7652587890625, -0.656005859375, -0.5467529296875, -0.4375, -0.3282470703125, -0.218994140625, -0.1097412109375, -0.00048828125, 0.1087646484375, 0.218017578125, 0.3272705078125, 0.4365234375, 0.5457763671875, 0.655029296875, 0.7642822265625, 0.87353515625, 0.9827880859375, 1.092041015625, 1.2012939453125, 1.310546875, 1.4197998046875, 1.529052734375, 1.6383056640625, 1.74755859375, 1.8568115234375, 1.966064453125, 2.0753173828125, 2.1845703125, 2.2938232421875, 2.403076171875, 2.5123291015625, 2.62158203125, 2.7308349609375, 2.840087890625, 2.9493408203125, 3.05859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 14.0, 10.0, 14.0, 19.0, 27.0, 23.0, 44.0, 63.0, 81.0, 119.0, 156.0, 280.0, 429.0, 697.0, 1073.0, 1854.0, 3203.0, 5444.0, 9523.0, 16715.0, 30285.0, 116681.0, 1829645.0, 35882.0, 18807.0, 10665.0, 6107.0, 3667.0, 2099.0, 1279.0, 759.0, 474.0, 301.0, 198.0, 126.0, 104.0, 83.0, 45.0, 30.0, 26.0, 20.0, 14.0, 10.0, 15.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.56640625, -2.486480712890625, -2.40655517578125, -2.326629638671875, -2.2467041015625, -2.166778564453125, -2.08685302734375, -2.006927490234375, -1.927001953125, -1.847076416015625, -1.76715087890625, -1.687225341796875, -1.6072998046875, -1.527374267578125, -1.44744873046875, -1.367523193359375, -1.28759765625, -1.207672119140625, -1.12774658203125, -1.047821044921875, -0.9678955078125, -0.887969970703125, -0.80804443359375, -0.728118896484375, -0.648193359375, -0.568267822265625, -0.48834228515625, -0.408416748046875, -0.3284912109375, -0.248565673828125, -0.16864013671875, -0.088714599609375, -0.0087890625, 0.071136474609375, 0.15106201171875, 0.230987548828125, 0.3109130859375, 0.390838623046875, 0.47076416015625, 0.550689697265625, 0.630615234375, 0.710540771484375, 0.79046630859375, 0.870391845703125, 0.9503173828125, 1.030242919921875, 1.11016845703125, 1.190093994140625, 1.27001953125, 1.349945068359375, 1.42987060546875, 1.509796142578125, 1.5897216796875, 1.669647216796875, 1.74957275390625, 1.829498291015625, 1.909423828125, 1.989349365234375, 2.06927490234375, 2.149200439453125, 2.2291259765625, 2.309051513671875, 2.38897705078125, 2.468902587890625, 2.548828125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 7.0, 10.0, 13.0, 13.0, 27.0, 56.0, 93.0, 138.0, 238.0, 129.0, 86.0, 79.0, 32.0, 19.0, 10.0, 8.0, 2.0, 6.0, 3.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.394287109375, -0.38407135009765625, -0.3738555908203125, -0.36363983154296875, -0.353424072265625, -0.34320831298828125, -0.3329925537109375, -0.32277679443359375, -0.31256103515625, -0.30234527587890625, -0.2921295166015625, -0.28191375732421875, -0.271697998046875, -0.26148223876953125, -0.2512664794921875, -0.24105072021484375, -0.2308349609375, -0.22061920166015625, -0.2104034423828125, -0.20018768310546875, -0.189971923828125, -0.17975616455078125, -0.1695404052734375, -0.15932464599609375, -0.14910888671875, -0.13889312744140625, -0.1286773681640625, -0.11846160888671875, -0.108245849609375, -0.09803009033203125, -0.0878143310546875, -0.07759857177734375, -0.0673828125, -0.05716705322265625, -0.0469512939453125, -0.03673553466796875, -0.026519775390625, -0.01630401611328125, -0.0060882568359375, 0.00412750244140625, 0.01434326171875, 0.02455902099609375, 0.0347747802734375, 0.04499053955078125, 0.055206298828125, 0.06542205810546875, 0.0756378173828125, 0.08585357666015625, 0.0960693359375, 0.10628509521484375, 0.1165008544921875, 0.12671661376953125, 0.136932373046875, 0.14714813232421875, 0.1573638916015625, 0.16757965087890625, 0.17779541015625, 0.18801116943359375, 0.1982269287109375, 0.20844268798828125, 0.218658447265625, 0.22887420654296875, 0.2390899658203125, 0.24930572509765625, 0.259521484375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 6.0, 5.0, 6.0, 4.0, 14.0, 14.0, 43.0, 58.0, 87.0, 183.0, 763.0, 5824.0, 1026768.0, 13129.0, 1087.0, 269.0, 88.0, 46.0, 45.0, 22.0, 32.0, 19.0, 12.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.31304931640625, -4.1378173828125, -3.96258544921875, -3.787353515625, -3.61212158203125, -3.4368896484375, -3.26165771484375, -3.08642578125, -2.91119384765625, -2.7359619140625, -2.56072998046875, -2.385498046875, -2.21026611328125, -2.0350341796875, -1.85980224609375, -1.6845703125, -1.50933837890625, -1.3341064453125, -1.15887451171875, -0.983642578125, -0.80841064453125, -0.6331787109375, -0.45794677734375, -0.28271484375, -0.10748291015625, 0.0677490234375, 0.24298095703125, 0.418212890625, 0.59344482421875, 0.7686767578125, 0.94390869140625, 1.119140625, 1.29437255859375, 1.4696044921875, 1.64483642578125, 1.820068359375, 1.99530029296875, 2.1705322265625, 2.34576416015625, 2.52099609375, 2.69622802734375, 2.8714599609375, 3.04669189453125, 3.221923828125, 3.39715576171875, 3.5723876953125, 3.74761962890625, 3.9228515625, 4.09808349609375, 4.2733154296875, 4.44854736328125, 4.623779296875, 4.79901123046875, 4.9742431640625, 5.14947509765625, 5.32470703125, 5.49993896484375, 5.6751708984375, 5.85040283203125, 6.025634765625, 6.20086669921875, 6.3760986328125, 6.55133056640625, 6.7265625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 26.0, 196.0, 735.0, 54.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-7.911907196044922, -7.773916721343994, -7.635926723480225, -7.497936248779297, -7.359945774078369, -7.221955299377441, -7.083965301513672, -6.945974826812744, -6.807984352111816, -6.669993877410889, -6.532003879547119, -6.394013404846191, -6.256022930145264, -6.118032455444336, -5.980042457580566, -5.842051982879639, -5.704061508178711, -5.566071033477783, -5.428081035614014, -5.290090560913086, -5.152100086212158, -5.0141096115112305, -4.876119613647461, -4.738129138946533, -4.600139141082764, -4.462148666381836, -4.324158668518066, -4.186168193817139, -4.048177719116211, -3.9101874828338623, -3.7721972465515137, -3.634206771850586, -3.496216297149658, -3.3582260608673096, -3.220235586166382, -3.082245349884033, -2.9442548751831055, -2.806264638900757, -2.668274402618408, -2.5302839279174805, -2.3922934532165527, -2.254303216934204, -2.1163127422332764, -1.9783225059509277, -1.84033203125, -1.7023417949676514, -1.5643514394760132, -1.426361083984375, -1.2883708477020264, -1.1503804922103882, -1.01239013671875, -0.8743998408317566, -0.7364094853401184, -0.5984191298484802, -0.4604288339614868, -0.32243847846984863, -0.18444806337356567, -0.046457722783088684, 0.0915326178073883, 0.2295229434967041, 0.3675132989883423, 0.5055036544799805, 0.6434939503669739, 0.7814843058586121, 0.9194746613502502]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 9.0, 11.0, 22.0, 12.0, 17.0, 17.0, 18.0, 40.0, 37.0, 42.0, 47.0, 29.0, 56.0, 41.0, 48.0, 48.0, 58.0, 36.0, 47.0, 41.0, 51.0, 37.0, 35.0, 39.0, 27.0, 22.0, 20.0, 15.0, 19.0, 9.0, 10.0, 3.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46747976541519165, -0.45054593682289124, -0.4336121380329132, -0.4166783094406128, -0.39974451065063477, -0.38281068205833435, -0.36587685346603394, -0.3489430546760559, -0.3320092558860779, -0.31507542729377747, -0.29814162850379944, -0.281207799911499, -0.264274001121521, -0.24734017252922058, -0.23040635883808136, -0.21347254514694214, -0.19653871655464172, -0.1796049028635025, -0.16267108917236328, -0.14573726058006287, -0.12880346179008484, -0.11186964064836502, -0.0949358195066452, -0.07800200581550598, -0.06106819212436676, -0.04413437843322754, -0.02720056101679802, -0.0102667436003685, 0.0066670700907707214, 0.023600883781909943, 0.04053470492362976, 0.05746851861476898, 0.0744023323059082, 0.09133614599704742, 0.10826995968818665, 0.12520378828048706, 0.1421375870704651, 0.1590714156627655, 0.17600522935390472, 0.19293904304504395, 0.20987285673618317, 0.2268066704273224, 0.2437404841184616, 0.26067429780960083, 0.27760812640190125, 0.2945419251918793, 0.3114757537841797, 0.3284095525741577, 0.34534338116645813, 0.36227720975875854, 0.3792110085487366, 0.396144837141037, 0.413078635931015, 0.43001246452331543, 0.44694626331329346, 0.46388009190559387, 0.4808139204978943, 0.4977477490901947, 0.5146815776824951, 0.5316153764724731, 0.5485491752624512, 0.5654829740524292, 0.582416832447052, 0.59935063123703, 0.6162844300270081]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 5.0, 6.0, 12.0, 12.0, 10.0, 16.0, 22.0, 21.0, 35.0, 32.0, 55.0, 33.0, 47.0, 30.0, 48.0, 51.0, 55.0, 51.0, 50.0, 53.0, 43.0, 47.0, 31.0, 48.0, 39.0, 31.0, 20.0, 17.0, 14.0, 12.0, 14.0, 9.0, 6.0, 5.0, 5.0, 5.0, 7.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.88671875, -5.72271728515625, -5.5587158203125, -5.39471435546875, -5.230712890625, -5.06671142578125, -4.9027099609375, -4.73870849609375, -4.57470703125, -4.41070556640625, -4.2467041015625, -4.08270263671875, -3.918701171875, -3.75469970703125, -3.5906982421875, -3.42669677734375, -3.2626953125, -3.09869384765625, -2.9346923828125, -2.77069091796875, -2.606689453125, -2.44268798828125, -2.2786865234375, -2.11468505859375, -1.95068359375, -1.78668212890625, -1.6226806640625, -1.45867919921875, -1.294677734375, -1.13067626953125, -0.9666748046875, -0.80267333984375, -0.638671875, -0.47467041015625, -0.3106689453125, -0.14666748046875, 0.017333984375, 0.18133544921875, 0.3453369140625, 0.50933837890625, 0.67333984375, 0.83734130859375, 1.0013427734375, 1.16534423828125, 1.329345703125, 1.49334716796875, 1.6573486328125, 1.82135009765625, 1.9853515625, 2.14935302734375, 2.3133544921875, 2.47735595703125, 2.641357421875, 2.80535888671875, 2.9693603515625, 3.13336181640625, 3.29736328125, 3.46136474609375, 3.6253662109375, 3.78936767578125, 3.953369140625, 4.11737060546875, 4.2813720703125, 4.44537353515625, 4.609375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 8.0, 3.0, 7.0, 15.0, 15.0, 21.0, 27.0, 52.0, 61.0, 109.0, 179.0, 264.0, 499.0, 864.0, 1989.0, 4750.0, 14769.0, 59718.0, 271514.0, 477148.0, 165141.0, 35125.0, 9581.0, 3431.0, 1489.0, 696.0, 377.0, 224.0, 150.0, 101.0, 64.0, 44.0, 41.0, 24.0, 14.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.0, -6.783447265625, -6.56689453125, -6.350341796875, -6.1337890625, -5.917236328125, -5.70068359375, -5.484130859375, -5.267578125, -5.051025390625, -4.83447265625, -4.617919921875, -4.4013671875, -4.184814453125, -3.96826171875, -3.751708984375, -3.53515625, -3.318603515625, -3.10205078125, -2.885498046875, -2.6689453125, -2.452392578125, -2.23583984375, -2.019287109375, -1.802734375, -1.586181640625, -1.36962890625, -1.153076171875, -0.9365234375, -0.719970703125, -0.50341796875, -0.286865234375, -0.0703125, 0.146240234375, 0.36279296875, 0.579345703125, 0.7958984375, 1.012451171875, 1.22900390625, 1.445556640625, 1.662109375, 1.878662109375, 2.09521484375, 2.311767578125, 2.5283203125, 2.744873046875, 2.96142578125, 3.177978515625, 3.39453125, 3.611083984375, 3.82763671875, 4.044189453125, 4.2607421875, 4.477294921875, 4.69384765625, 4.910400390625, 5.126953125, 5.343505859375, 5.56005859375, 5.776611328125, 5.9931640625, 6.209716796875, 6.42626953125, 6.642822265625, 6.859375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 10.0, 11.0, 21.0, 12.0, 20.0, 13.0, 17.0, 27.0, 31.0, 30.0, 41.0, 26.0, 45.0, 40.0, 41.0, 72.0, 132.0, 356.0, 1413.0, 191.0, 79.0, 45.0, 41.0, 36.0, 40.0, 32.0, 26.0, 23.0, 20.0, 24.0, 15.0, 9.0, 16.0, 11.0, 15.0, 11.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-14.3828125, -13.9058837890625, -13.428955078125, -12.9520263671875, -12.47509765625, -11.9981689453125, -11.521240234375, -11.0443115234375, -10.5673828125, -10.0904541015625, -9.613525390625, -9.1365966796875, -8.65966796875, -8.1827392578125, -7.705810546875, -7.2288818359375, -6.751953125, -6.2750244140625, -5.798095703125, -5.3211669921875, -4.84423828125, -4.3673095703125, -3.890380859375, -3.4134521484375, -2.9365234375, -2.4595947265625, -1.982666015625, -1.5057373046875, -1.02880859375, -0.5518798828125, -0.074951171875, 0.4019775390625, 0.87890625, 1.3558349609375, 1.832763671875, 2.3096923828125, 2.78662109375, 3.2635498046875, 3.740478515625, 4.2174072265625, 4.6943359375, 5.1712646484375, 5.648193359375, 6.1251220703125, 6.60205078125, 7.0789794921875, 7.555908203125, 8.0328369140625, 8.509765625, 8.9866943359375, 9.463623046875, 9.9405517578125, 10.41748046875, 10.8944091796875, 11.371337890625, 11.8482666015625, 12.3251953125, 12.8021240234375, 13.279052734375, 13.7559814453125, 14.23291015625, 14.7098388671875, 15.186767578125, 15.6636962890625, 16.140625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 3.0, 6.0, 12.0, 11.0, 14.0, 17.0, 15.0, 19.0, 25.0, 27.0, 29.0, 47.0, 71.0, 141.0, 205.0, 448.0, 1107.0, 3672.0, 21705.0, 432951.0, 2586601.0, 85229.0, 9529.0, 2154.0, 726.0, 340.0, 162.0, 114.0, 61.0, 49.0, 39.0, 22.0, 18.0, 15.0, 28.0, 14.0, 14.0, 11.0, 12.0, 11.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 4.0, 0.0, 2.0], "bins": [-21.328125, -20.7236328125, -20.119140625, -19.5146484375, -18.91015625, -18.3056640625, -17.701171875, -17.0966796875, -16.4921875, -15.8876953125, -15.283203125, -14.6787109375, -14.07421875, -13.4697265625, -12.865234375, -12.2607421875, -11.65625, -11.0517578125, -10.447265625, -9.8427734375, -9.23828125, -8.6337890625, -8.029296875, -7.4248046875, -6.8203125, -6.2158203125, -5.611328125, -5.0068359375, -4.40234375, -3.7978515625, -3.193359375, -2.5888671875, -1.984375, -1.3798828125, -0.775390625, -0.1708984375, 0.43359375, 1.0380859375, 1.642578125, 2.2470703125, 2.8515625, 3.4560546875, 4.060546875, 4.6650390625, 5.26953125, 5.8740234375, 6.478515625, 7.0830078125, 7.6875, 8.2919921875, 8.896484375, 9.5009765625, 10.10546875, 10.7099609375, 11.314453125, 11.9189453125, 12.5234375, 13.1279296875, 13.732421875, 14.3369140625, 14.94140625, 15.5458984375, 16.150390625, 16.7548828125, 17.359375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 29.0, 141.0, 413.0, 334.0, 87.0, 10.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.272987365722656, -31.114578247070312, -27.95616912841797, -24.797760009765625, -21.63935089111328, -18.480941772460938, -15.322532653808594, -12.16412353515625, -9.005714416503906, -5.8473052978515625, -2.6888961791992188, 0.469512939453125, 3.6279220581054688, 6.7863311767578125, 9.944740295410156, 13.1031494140625, 16.261558532714844, 19.419967651367188, 22.57837677001953, 25.736785888671875, 28.89519500732422, 32.05360412597656, 35.212013244628906, 38.37042236328125, 41.528831481933594, 44.68724060058594, 47.84564971923828, 51.004058837890625, 54.16246795654297, 57.32087707519531, 60.479286193847656, 63.6376953125, 66.79611206054688, 69.95452117919922, 73.11293029785156, 76.2713394165039, 79.42974853515625, 82.5881576538086, 85.74656677246094, 88.90497589111328, 92.06338500976562, 95.22179412841797, 98.38020324707031, 101.53861236572266, 104.697021484375, 107.85543060302734, 111.01383972167969, 114.17224884033203, 117.33065795898438, 120.48906707763672, 123.64747619628906, 126.8058853149414, 129.96429443359375, 133.12271118164062, 136.28111267089844, 139.43951416015625, 142.59793090820312, 145.75634765625, 148.9147491455078, 152.07315063476562, 155.2315673828125, 158.38998413085938, 161.5483856201172, 164.706787109375, 167.86520385742188]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 9.0, 14.0, 14.0, 15.0, 29.0, 15.0, 30.0, 33.0, 18.0, 46.0, 39.0, 44.0, 45.0, 45.0, 46.0, 42.0, 54.0, 45.0, 55.0, 42.0, 44.0, 39.0, 35.0, 28.0, 24.0, 27.0, 22.0, 19.0, 22.0, 8.0, 10.0, 8.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.20941162109375, -62.33124542236328, -60.45307540893555, -58.57490921020508, -56.696739196777344, -54.818572998046875, -52.940406799316406, -51.06223678588867, -49.18406677246094, -47.30590057373047, -45.427730560302734, -43.549564361572266, -41.67139434814453, -39.79322814941406, -37.915061950683594, -36.03689193725586, -34.15872573852539, -32.28055953979492, -30.402389526367188, -28.52422332763672, -26.646053314208984, -24.767887115478516, -22.889719009399414, -21.011550903320312, -19.13338279724121, -17.25521469116211, -15.377046585083008, -13.498879432678223, -11.620711326599121, -9.74254322052002, -7.864376068115234, -5.986207962036133, -4.108039855957031, -2.229871988296509, -0.35170412063598633, 1.526463508605957, 3.4046316146850586, 5.28279972076416, 7.160966873168945, 9.039134979248047, 10.917303085327148, 12.79547119140625, 14.673639297485352, 16.551807403564453, 18.429973602294922, 20.308143615722656, 22.186309814453125, 24.064477920532227, 25.942646026611328, 27.82081413269043, 29.69898223876953, 31.5771484375, 33.455318450927734, 35.3334846496582, 37.21165466308594, 39.089820861816406, 40.967987060546875, 42.846153259277344, 44.72432327270508, 46.60248947143555, 48.48065948486328, 50.35882568359375, 52.23699188232422, 54.11516189575195, 55.99333190917969]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 5.0, 9.0, 9.0, 8.0, 12.0, 13.0, 21.0, 28.0, 20.0, 24.0, 33.0, 43.0, 33.0, 48.0, 45.0, 43.0, 38.0, 60.0, 46.0, 37.0, 47.0, 46.0, 50.0, 33.0, 43.0, 23.0, 36.0, 30.0, 22.0, 13.0, 18.0, 14.0, 13.0, 5.0, 8.0, 5.0, 11.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.826171875, -4.671875, -4.517578125, -4.36328125, -4.208984375, -4.0546875, -3.900390625, -3.74609375, -3.591796875, -3.4375, -3.283203125, -3.12890625, -2.974609375, -2.8203125, -2.666015625, -2.51171875, -2.357421875, -2.203125, -2.048828125, -1.89453125, -1.740234375, -1.5859375, -1.431640625, -1.27734375, -1.123046875, -0.96875, -0.814453125, -0.66015625, -0.505859375, -0.3515625, -0.197265625, -0.04296875, 0.111328125, 0.265625, 0.419921875, 0.57421875, 0.728515625, 0.8828125, 1.037109375, 1.19140625, 1.345703125, 1.5, 1.654296875, 1.80859375, 1.962890625, 2.1171875, 2.271484375, 2.42578125, 2.580078125, 2.734375, 2.888671875, 3.04296875, 3.197265625, 3.3515625, 3.505859375, 3.66015625, 3.814453125, 3.96875, 4.123046875, 4.27734375, 4.431640625, 4.5859375, 4.740234375, 4.89453125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 2.0, 3.0, 12.0, 13.0, 27.0, 32.0, 42.0, 68.0, 99.0, 167.0, 269.0, 492.0, 829.0, 1550.0, 3552.0, 9992.0, 40881.0, 253900.0, 1975787.0, 1653664.0, 203879.0, 34229.0, 8556.0, 3004.0, 1312.0, 700.0, 407.0, 242.0, 171.0, 104.0, 83.0, 60.0, 56.0, 23.0, 16.0, 19.0, 10.0, 8.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.75, -13.3326416015625, -12.915283203125, -12.4979248046875, -12.08056640625, -11.6632080078125, -11.245849609375, -10.8284912109375, -10.4111328125, -9.9937744140625, -9.576416015625, -9.1590576171875, -8.74169921875, -8.3243408203125, -7.906982421875, -7.4896240234375, -7.072265625, -6.6549072265625, -6.237548828125, -5.8201904296875, -5.40283203125, -4.9854736328125, -4.568115234375, -4.1507568359375, -3.7333984375, -3.3160400390625, -2.898681640625, -2.4813232421875, -2.06396484375, -1.6466064453125, -1.229248046875, -0.8118896484375, -0.39453125, 0.0228271484375, 0.440185546875, 0.8575439453125, 1.27490234375, 1.6922607421875, 2.109619140625, 2.5269775390625, 2.9443359375, 3.3616943359375, 3.779052734375, 4.1964111328125, 4.61376953125, 5.0311279296875, 5.448486328125, 5.8658447265625, 6.283203125, 6.7005615234375, 7.117919921875, 7.5352783203125, 7.95263671875, 8.3699951171875, 8.787353515625, 9.2047119140625, 9.6220703125, 10.0394287109375, 10.456787109375, 10.8741455078125, 11.29150390625, 11.7088623046875, 12.126220703125, 12.5435791015625, 12.9609375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 10.0, 8.0, 14.0, 8.0, 9.0, 16.0, 18.0, 42.0, 45.0, 79.0, 76.0, 100.0, 181.0, 170.0, 239.0, 308.0, 343.0, 400.0, 397.0, 384.0, 291.0, 214.0, 176.0, 134.0, 100.0, 88.0, 52.0, 50.0, 28.0, 18.0, 17.0, 10.0, 13.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.421875, -9.083251953125, -8.74462890625, -8.406005859375, -8.0673828125, -7.728759765625, -7.39013671875, -7.051513671875, -6.712890625, -6.374267578125, -6.03564453125, -5.697021484375, -5.3583984375, -5.019775390625, -4.68115234375, -4.342529296875, -4.00390625, -3.665283203125, -3.32666015625, -2.988037109375, -2.6494140625, -2.310791015625, -1.97216796875, -1.633544921875, -1.294921875, -0.956298828125, -0.61767578125, -0.279052734375, 0.0595703125, 0.398193359375, 0.73681640625, 1.075439453125, 1.4140625, 1.752685546875, 2.09130859375, 2.429931640625, 2.7685546875, 3.107177734375, 3.44580078125, 3.784423828125, 4.123046875, 4.461669921875, 4.80029296875, 5.138916015625, 5.4775390625, 5.816162109375, 6.15478515625, 6.493408203125, 6.83203125, 7.170654296875, 7.50927734375, 7.847900390625, 8.1865234375, 8.525146484375, 8.86376953125, 9.202392578125, 9.541015625, 9.879638671875, 10.21826171875, 10.556884765625, 10.8955078125, 11.234130859375, 11.57275390625, 11.911376953125, 12.25]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 6.0, 11.0, 8.0, 19.0, 29.0, 30.0, 66.0, 107.0, 128.0, 200.0, 330.0, 528.0, 931.0, 1695.0, 3209.0, 6830.0, 16001.0, 43098.0, 137165.0, 485913.0, 1515132.0, 1374640.0, 422207.0, 120517.0, 37745.0, 14475.0, 6285.0, 3039.0, 1656.0, 891.0, 531.0, 317.0, 188.0, 119.0, 63.0, 50.0, 34.0, 28.0, 23.0, 9.0, 11.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.7578125, -13.3402099609375, -12.922607421875, -12.5050048828125, -12.08740234375, -11.6697998046875, -11.252197265625, -10.8345947265625, -10.4169921875, -9.9993896484375, -9.581787109375, -9.1641845703125, -8.74658203125, -8.3289794921875, -7.911376953125, -7.4937744140625, -7.076171875, -6.6585693359375, -6.240966796875, -5.8233642578125, -5.40576171875, -4.9881591796875, -4.570556640625, -4.1529541015625, -3.7353515625, -3.3177490234375, -2.900146484375, -2.4825439453125, -2.06494140625, -1.6473388671875, -1.229736328125, -0.8121337890625, -0.39453125, 0.0230712890625, 0.440673828125, 0.8582763671875, 1.27587890625, 1.6934814453125, 2.111083984375, 2.5286865234375, 2.9462890625, 3.3638916015625, 3.781494140625, 4.1990966796875, 4.61669921875, 5.0343017578125, 5.451904296875, 5.8695068359375, 6.287109375, 6.7047119140625, 7.122314453125, 7.5399169921875, 7.95751953125, 8.3751220703125, 8.792724609375, 9.2103271484375, 9.6279296875, 10.0455322265625, 10.463134765625, 10.8807373046875, 11.29833984375, 11.7159423828125, 12.133544921875, 12.5511474609375, 12.96875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 18.0, 26.0, 53.0, 92.0, 144.0, 157.0, 165.0, 140.0, 107.0, 59.0, 29.0, 9.0, 7.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.75991821289062, -109.35362243652344, -105.94732666015625, -102.54103088378906, -99.13473510742188, -95.72843933105469, -92.3221435546875, -88.91584777832031, -85.50955200195312, -82.10325622558594, -78.69696044921875, -75.29066467285156, -71.88436889648438, -68.47807312011719, -65.07177734375, -61.66548538208008, -58.259193420410156, -54.85289764404297, -51.44660186767578, -48.040306091308594, -44.634010314941406, -41.22771453857422, -37.8214225769043, -34.41512680053711, -31.008831024169922, -27.602535247802734, -24.196239471435547, -20.789945602416992, -17.383649826049805, -13.977354049682617, -10.571060180664062, -7.164764404296875, -3.7584686279296875, -0.3521733283996582, 3.054121971130371, 6.460416793823242, 9.86671257019043, 13.273008346557617, 16.679302215576172, 20.08559799194336, 23.491893768310547, 26.898189544677734, 30.304485321044922, 33.710777282714844, 37.11707305908203, 40.52336883544922, 43.929664611816406, 47.335960388183594, 50.74225616455078, 54.14855194091797, 57.554847717285156, 60.961143493652344, 64.36743927001953, 67.77373504638672, 71.18002319335938, 74.58631896972656, 77.99261474609375, 81.39891052246094, 84.80520629882812, 88.21150207519531, 91.6177978515625, 95.02409362792969, 98.43038940429688, 101.83668518066406, 105.24298095703125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 11.0, 9.0, 15.0, 13.0, 9.0, 10.0, 29.0, 14.0, 28.0, 23.0, 27.0, 31.0, 30.0, 28.0, 43.0, 36.0, 40.0, 44.0, 39.0, 32.0, 37.0, 37.0, 36.0, 41.0, 36.0, 43.0, 29.0, 35.0, 26.0, 22.0, 23.0, 20.0, 20.0, 11.0, 12.0, 10.0, 10.0, 9.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.536258697509766, -37.338226318359375, -36.14019012451172, -34.94215774536133, -33.74412155151367, -32.54608917236328, -31.348052978515625, -30.150020599365234, -28.951984405517578, -27.753950119018555, -26.55591583251953, -25.357881546020508, -24.159847259521484, -22.96181297302246, -21.763778686523438, -20.565746307373047, -19.367712020874023, -18.169677734375, -16.971643447875977, -15.773609161376953, -14.57557487487793, -13.377540588378906, -12.1795072555542, -10.981472969055176, -9.783438682556152, -8.585404396057129, -7.3873701095581055, -6.18933629989624, -4.991302013397217, -3.7932677268981934, -2.595233917236328, -1.3971996307373047, -0.19916534423828125, 0.9988688230514526, 2.1969029903411865, 3.394937038421631, 4.592971324920654, 5.791005611419678, 6.989039421081543, 8.187073707580566, 9.38510799407959, 10.583142280578613, 11.781176567077637, 12.979209899902344, 14.177244186401367, 15.37527847290039, 16.573312759399414, 17.771347045898438, 18.96938133239746, 20.167415618896484, 21.365449905395508, 22.56348419189453, 23.761518478393555, 24.959552764892578, 26.15758514404297, 27.355621337890625, 28.553653717041016, 29.75168800354004, 30.949722290039062, 32.14775466918945, 33.34579086303711, 34.5438232421875, 35.741859436035156, 36.93989181518555, 38.1379280090332]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 0.0, 3.0, 6.0, 6.0, 5.0, 10.0, 8.0, 12.0, 17.0, 22.0, 18.0, 31.0, 27.0, 39.0, 43.0, 45.0, 52.0, 41.0, 46.0, 46.0, 44.0, 55.0, 51.0, 53.0, 41.0, 30.0, 44.0, 32.0, 38.0, 31.0, 16.0, 13.0, 14.0, 10.0, 11.0, 11.0, 6.0, 9.0, 2.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.7119140625, -5.544921875, -5.3779296875, -5.2109375, -5.0439453125, -4.876953125, -4.7099609375, -4.54296875, -4.3759765625, -4.208984375, -4.0419921875, -3.875, -3.7080078125, -3.541015625, -3.3740234375, -3.20703125, -3.0400390625, -2.873046875, -2.7060546875, -2.5390625, -2.3720703125, -2.205078125, -2.0380859375, -1.87109375, -1.7041015625, -1.537109375, -1.3701171875, -1.203125, -1.0361328125, -0.869140625, -0.7021484375, -0.53515625, -0.3681640625, -0.201171875, -0.0341796875, 0.1328125, 0.2998046875, 0.466796875, 0.6337890625, 0.80078125, 0.9677734375, 1.134765625, 1.3017578125, 1.46875, 1.6357421875, 1.802734375, 1.9697265625, 2.13671875, 2.3037109375, 2.470703125, 2.6376953125, 2.8046875, 2.9716796875, 3.138671875, 3.3056640625, 3.47265625, 3.6396484375, 3.806640625, 3.9736328125, 4.140625, 4.3076171875, 4.474609375, 4.6416015625, 4.80859375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 5.0, 9.0, 15.0, 24.0, 33.0, 40.0, 48.0, 82.0, 89.0, 146.0, 220.0, 315.0, 529.0, 824.0, 1345.0, 2402.0, 4760.0, 10016.0, 21870.0, 49230.0, 105545.0, 192061.0, 251052.0, 199562.0, 110549.0, 52206.0, 23455.0, 10611.0, 5026.0, 2672.0, 1465.0, 817.0, 503.0, 307.0, 181.0, 164.0, 112.0, 65.0, 53.0, 40.0, 20.0, 29.0, 15.0, 11.0, 4.0, 10.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.353118896484375, -2.27850341796875, -2.203887939453125, -2.1292724609375, -2.054656982421875, -1.98004150390625, -1.905426025390625, -1.830810546875, -1.756195068359375, -1.68157958984375, -1.606964111328125, -1.5323486328125, -1.457733154296875, -1.38311767578125, -1.308502197265625, -1.23388671875, -1.159271240234375, -1.08465576171875, -1.010040283203125, -0.9354248046875, -0.860809326171875, -0.78619384765625, -0.711578369140625, -0.636962890625, -0.562347412109375, -0.48773193359375, -0.413116455078125, -0.3385009765625, -0.263885498046875, -0.18927001953125, -0.114654541015625, -0.0400390625, 0.034576416015625, 0.10919189453125, 0.183807373046875, 0.2584228515625, 0.333038330078125, 0.40765380859375, 0.482269287109375, 0.556884765625, 0.631500244140625, 0.70611572265625, 0.780731201171875, 0.8553466796875, 0.929962158203125, 1.00457763671875, 1.079193115234375, 1.15380859375, 1.228424072265625, 1.30303955078125, 1.377655029296875, 1.4522705078125, 1.526885986328125, 1.60150146484375, 1.676116943359375, 1.750732421875, 1.825347900390625, 1.89996337890625, 1.974578857421875, 2.0491943359375, 2.123809814453125, 2.19842529296875, 2.273040771484375, 2.34765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 8.0, 0.0, 5.0, 5.0, 9.0, 14.0, 18.0, 16.0, 17.0, 38.0, 30.0, 29.0, 38.0, 39.0, 45.0, 47.0, 33.0, 41.0, 42.0, 1074.0, 42.0, 54.0, 45.0, 38.0, 33.0, 33.0, 36.0, 39.0, 27.0, 26.0, 22.0, 24.0, 10.0, 12.0, 12.0, 7.0, 1.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.358795166015625, -3.23907470703125, -3.119354248046875, -2.9996337890625, -2.879913330078125, -2.76019287109375, -2.640472412109375, -2.520751953125, -2.401031494140625, -2.28131103515625, -2.161590576171875, -2.0418701171875, -1.922149658203125, -1.80242919921875, -1.682708740234375, -1.56298828125, -1.443267822265625, -1.32354736328125, -1.203826904296875, -1.0841064453125, -0.964385986328125, -0.84466552734375, -0.724945068359375, -0.605224609375, -0.485504150390625, -0.36578369140625, -0.246063232421875, -0.1263427734375, -0.006622314453125, 0.11309814453125, 0.232818603515625, 0.3525390625, 0.472259521484375, 0.59197998046875, 0.711700439453125, 0.8314208984375, 0.951141357421875, 1.07086181640625, 1.190582275390625, 1.310302734375, 1.430023193359375, 1.54974365234375, 1.669464111328125, 1.7891845703125, 1.908905029296875, 2.02862548828125, 2.148345947265625, 2.26806640625, 2.387786865234375, 2.50750732421875, 2.627227783203125, 2.7469482421875, 2.866668701171875, 2.98638916015625, 3.106109619140625, 3.225830078125, 3.345550537109375, 3.46527099609375, 3.584991455078125, 3.7047119140625, 3.824432373046875, 3.94415283203125, 4.063873291015625, 4.18359375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 6.0, 9.0, 10.0, 23.0, 26.0, 33.0, 41.0, 57.0, 78.0, 131.0, 200.0, 244.0, 441.0, 677.0, 1093.0, 1769.0, 2725.0, 4627.0, 7720.0, 12981.0, 22742.0, 48832.0, 1894272.0, 44900.0, 21892.0, 12339.0, 7412.0, 4469.0, 2747.0, 1669.0, 1064.0, 652.0, 409.0, 267.0, 162.0, 127.0, 88.0, 57.0, 42.0, 23.0, 16.0, 16.0, 15.0, 4.0, 8.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -2.567169189453125, -2.48004150390625, -2.392913818359375, -2.3057861328125, -2.218658447265625, -2.13153076171875, -2.044403076171875, -1.957275390625, -1.870147705078125, -1.78302001953125, -1.695892333984375, -1.6087646484375, -1.521636962890625, -1.43450927734375, -1.347381591796875, -1.26025390625, -1.173126220703125, -1.08599853515625, -0.998870849609375, -0.9117431640625, -0.824615478515625, -0.73748779296875, -0.650360107421875, -0.563232421875, -0.476104736328125, -0.38897705078125, -0.301849365234375, -0.2147216796875, -0.127593994140625, -0.04046630859375, 0.046661376953125, 0.1337890625, 0.220916748046875, 0.30804443359375, 0.395172119140625, 0.4822998046875, 0.569427490234375, 0.65655517578125, 0.743682861328125, 0.830810546875, 0.917938232421875, 1.00506591796875, 1.092193603515625, 1.1793212890625, 1.266448974609375, 1.35357666015625, 1.440704345703125, 1.52783203125, 1.614959716796875, 1.70208740234375, 1.789215087890625, 1.8763427734375, 1.963470458984375, 2.05059814453125, 2.137725830078125, 2.224853515625, 2.311981201171875, 2.39910888671875, 2.486236572265625, 2.5733642578125, 2.660491943359375, 2.74761962890625, 2.834747314453125, 2.921875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 3.0, 12.0, 12.0, 13.0, 15.0, 9.0, 24.0, 22.0, 28.0, 30.0, 33.0, 30.0, 35.0, 39.0, 43.0, 41.0, 70.0, 70.0, 59.0, 51.0, 47.0, 25.0, 33.0, 37.0, 23.0, 24.0, 20.0, 22.0, 15.0, 21.0, 19.0, 13.0, 11.0, 7.0, 4.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.078369140625, -0.07621002197265625, -0.0740509033203125, -0.07189178466796875, -0.069732666015625, -0.06757354736328125, -0.0654144287109375, -0.06325531005859375, -0.06109619140625, -0.05893707275390625, -0.0567779541015625, -0.05461883544921875, -0.052459716796875, -0.05030059814453125, -0.0481414794921875, -0.04598236083984375, -0.0438232421875, -0.04166412353515625, -0.0395050048828125, -0.03734588623046875, -0.035186767578125, -0.03302764892578125, -0.0308685302734375, -0.02870941162109375, -0.02655029296875, -0.02439117431640625, -0.0222320556640625, -0.02007293701171875, -0.017913818359375, -0.01575469970703125, -0.0135955810546875, -0.01143646240234375, -0.00927734375, -0.00711822509765625, -0.0049591064453125, -0.00279998779296875, -0.000640869140625, 0.00151824951171875, 0.0036773681640625, 0.00583648681640625, 0.00799560546875, 0.01015472412109375, 0.0123138427734375, 0.01447296142578125, 0.016632080078125, 0.01879119873046875, 0.0209503173828125, 0.02310943603515625, 0.0252685546875, 0.02742767333984375, 0.0295867919921875, 0.03174591064453125, 0.033905029296875, 0.03606414794921875, 0.0382232666015625, 0.04038238525390625, 0.04254150390625, 0.04470062255859375, 0.0468597412109375, 0.04901885986328125, 0.051177978515625, 0.05333709716796875, 0.0554962158203125, 0.05765533447265625, 0.059814453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 11.0, 11.0, 14.0, 24.0, 20.0, 34.0, 35.0, 70.0, 72.0, 122.0, 189.0, 245.0, 427.0, 1966.0, 109510.0, 909360.0, 24435.0, 904.0, 343.0, 215.0, 164.0, 117.0, 66.0, 47.0, 38.0, 23.0, 18.0, 8.0, 12.0, 8.0, 11.0, 8.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.265625, -1.2193145751953125, -1.173004150390625, -1.1266937255859375, -1.08038330078125, -1.0340728759765625, -0.987762451171875, -0.9414520263671875, -0.8951416015625, -0.8488311767578125, -0.802520751953125, -0.7562103271484375, -0.70989990234375, -0.6635894775390625, -0.617279052734375, -0.5709686279296875, -0.524658203125, -0.4783477783203125, -0.432037353515625, -0.3857269287109375, -0.33941650390625, -0.2931060791015625, -0.246795654296875, -0.2004852294921875, -0.1541748046875, -0.1078643798828125, -0.061553955078125, -0.0152435302734375, 0.03106689453125, 0.0773773193359375, 0.123687744140625, 0.1699981689453125, 0.21630859375, 0.2626190185546875, 0.308929443359375, 0.3552398681640625, 0.40155029296875, 0.4478607177734375, 0.494171142578125, 0.5404815673828125, 0.5867919921875, 0.6331024169921875, 0.679412841796875, 0.7257232666015625, 0.77203369140625, 0.8183441162109375, 0.864654541015625, 0.9109649658203125, 0.957275390625, 1.0035858154296875, 1.049896240234375, 1.0962066650390625, 1.14251708984375, 1.1888275146484375, 1.235137939453125, 1.2814483642578125, 1.3277587890625, 1.3740692138671875, 1.420379638671875, 1.4666900634765625, 1.51300048828125, 1.5593109130859375, 1.605621337890625, 1.6519317626953125, 1.6982421875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 16.0, 43.0, 136.0, 541.0, 229.0, 43.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.236189603805542, -3.1709463596343994, -3.105703115463257, -3.0404598712921143, -2.9752166271209717, -2.909973382949829, -2.8447301387786865, -2.779486894607544, -2.7142436504364014, -2.649000406265259, -2.583757162094116, -2.5185139179229736, -2.453270673751831, -2.3880274295806885, -2.322784185409546, -2.2575409412384033, -2.1922974586486816, -2.127054214477539, -2.0618109703063965, -1.996567726135254, -1.9313244819641113, -1.8660812377929688, -1.8008379936218262, -1.7355947494506836, -1.670351505279541, -1.6051082611083984, -1.5398650169372559, -1.4746217727661133, -1.4093785285949707, -1.3441352844238281, -1.2788920402526855, -1.213648796081543, -1.1484057903289795, -1.083162546157837, -1.0179193019866943, -0.9526760578155518, -0.8874328136444092, -0.8221895694732666, -0.7569462656974792, -0.6917030215263367, -0.6264597177505493, -0.5612164735794067, -0.49597322940826416, -0.4307299554347992, -0.3654867112636566, -0.30024346709251404, -0.23500019311904907, -0.1697569489479065, -0.10451370477676392, -0.03927045315504074, 0.025972798466682434, 0.0912160575389862, 0.15645930171012878, 0.22170254588127136, 0.28694581985473633, 0.3521890640258789, 0.4174323081970215, 0.48267555236816406, 0.5479187965393066, 0.6131620407104492, 0.6784052848815918, 0.7436485290527344, 0.8088918328285217, 0.8741350769996643, 0.9393783211708069]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 7.0, 8.0, 15.0, 15.0, 17.0, 22.0, 23.0, 25.0, 38.0, 27.0, 44.0, 38.0, 46.0, 42.0, 39.0, 42.0, 38.0, 63.0, 49.0, 44.0, 39.0, 38.0, 48.0, 35.0, 29.0, 28.0, 26.0, 29.0, 19.0, 16.0, 11.0, 12.0, 7.0, 5.0, 3.0, 9.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30739933252334595, -0.2982025742530823, -0.2890058159828186, -0.27980905771255493, -0.27061229944229126, -0.2614155411720276, -0.2522187829017639, -0.24302205443382263, -0.23382529616355896, -0.2246285378932953, -0.21543177962303162, -0.20623502135276794, -0.19703827798366547, -0.1878415197134018, -0.17864476144313812, -0.16944801807403564, -0.16025124490261078, -0.1510544866323471, -0.14185772836208344, -0.13266098499298096, -0.12346422672271729, -0.11426746845245361, -0.10507071018218994, -0.09587395936250687, -0.0866772010922432, -0.07748044282197952, -0.06828369200229645, -0.059086933732032776, -0.0498901791870594, -0.04069342464208603, -0.03149666637182236, -0.022299915552139282, -0.01310315728187561, -0.003906401805579662, 0.005290353670716286, 0.014487110078334808, 0.023683864623308182, 0.032880619168281555, 0.04207737743854523, 0.0512741282582283, 0.060470886528491974, 0.06966764479875565, 0.07886439561843872, 0.08806115388870239, 0.09725791215896606, 0.10645466297864914, 0.11565142124891281, 0.12484817206859589, 0.13404493033885956, 0.14324168860912323, 0.1524384468793869, 0.16163519024848938, 0.17083194851875305, 0.18002870678901672, 0.1892254650592804, 0.19842222332954407, 0.20761898159980774, 0.2168157398700714, 0.22601249814033508, 0.23520925641059875, 0.24440599977970123, 0.2536027431488037, 0.2627995014190674, 0.27199625968933105, 0.2811930179595947]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 2.0, 11.0, 12.0, 21.0, 20.0, 10.0, 17.0, 23.0, 34.0, 25.0, 51.0, 39.0, 36.0, 40.0, 46.0, 48.0, 48.0, 50.0, 51.0, 49.0, 42.0, 34.0, 32.0, 42.0, 26.0, 20.0, 30.0, 23.0, 19.0, 12.0, 11.0, 12.0, 7.0, 13.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.33050537109375, -4.1766357421875, -4.02276611328125, -3.868896484375, -3.71502685546875, -3.5611572265625, -3.40728759765625, -3.25341796875, -3.09954833984375, -2.9456787109375, -2.79180908203125, -2.637939453125, -2.48406982421875, -2.3302001953125, -2.17633056640625, -2.0224609375, -1.86859130859375, -1.7147216796875, -1.56085205078125, -1.406982421875, -1.25311279296875, -1.0992431640625, -0.94537353515625, -0.79150390625, -0.63763427734375, -0.4837646484375, -0.32989501953125, -0.176025390625, -0.02215576171875, 0.1317138671875, 0.28558349609375, 0.439453125, 0.59332275390625, 0.7471923828125, 0.90106201171875, 1.054931640625, 1.20880126953125, 1.3626708984375, 1.51654052734375, 1.67041015625, 1.82427978515625, 1.9781494140625, 2.13201904296875, 2.285888671875, 2.43975830078125, 2.5936279296875, 2.74749755859375, 2.9013671875, 3.05523681640625, 3.2091064453125, 3.36297607421875, 3.516845703125, 3.67071533203125, 3.8245849609375, 3.97845458984375, 4.13232421875, 4.28619384765625, 4.4400634765625, 4.59393310546875, 4.747802734375, 4.90167236328125, 5.0555419921875, 5.20941162109375, 5.36328125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 22.0, 18.0, 19.0, 33.0, 45.0, 53.0, 91.0, 162.0, 209.0, 360.0, 609.0, 1129.0, 1975.0, 3693.0, 7341.0, 15126.0, 34632.0, 88830.0, 264864.0, 379396.0, 152075.0, 53500.0, 22451.0, 10463.0, 5204.0, 2674.0, 1416.0, 799.0, 438.0, 285.0, 197.0, 117.0, 78.0, 51.0, 48.0, 35.0, 25.0, 20.0, 9.0, 9.0, 10.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.16796875, -5.9766845703125, -5.785400390625, -5.5941162109375, -5.40283203125, -5.2115478515625, -5.020263671875, -4.8289794921875, -4.6376953125, -4.4464111328125, -4.255126953125, -4.0638427734375, -3.87255859375, -3.6812744140625, -3.489990234375, -3.2987060546875, -3.107421875, -2.9161376953125, -2.724853515625, -2.5335693359375, -2.34228515625, -2.1510009765625, -1.959716796875, -1.7684326171875, -1.5771484375, -1.3858642578125, -1.194580078125, -1.0032958984375, -0.81201171875, -0.6207275390625, -0.429443359375, -0.2381591796875, -0.046875, 0.1444091796875, 0.335693359375, 0.5269775390625, 0.71826171875, 0.9095458984375, 1.100830078125, 1.2921142578125, 1.4833984375, 1.6746826171875, 1.865966796875, 2.0572509765625, 2.24853515625, 2.4398193359375, 2.631103515625, 2.8223876953125, 3.013671875, 3.2049560546875, 3.396240234375, 3.5875244140625, 3.77880859375, 3.9700927734375, 4.161376953125, 4.3526611328125, 4.5439453125, 4.7352294921875, 4.926513671875, 5.1177978515625, 5.30908203125, 5.5003662109375, 5.691650390625, 5.8829345703125, 6.07421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 9.0, 2.0, 7.0, 9.0, 13.0, 11.0, 20.0, 17.0, 15.0, 27.0, 23.0, 33.0, 33.0, 40.0, 40.0, 58.0, 54.0, 129.0, 214.0, 1418.0, 249.0, 145.0, 73.0, 64.0, 47.0, 42.0, 42.0, 36.0, 30.0, 28.0, 21.0, 18.0, 21.0, 10.0, 9.0, 10.0, 8.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.577392578125, -15.01416015625, -14.450927734375, -13.8876953125, -13.324462890625, -12.76123046875, -12.197998046875, -11.634765625, -11.071533203125, -10.50830078125, -9.945068359375, -9.3818359375, -8.818603515625, -8.25537109375, -7.692138671875, -7.12890625, -6.565673828125, -6.00244140625, -5.439208984375, -4.8759765625, -4.312744140625, -3.74951171875, -3.186279296875, -2.623046875, -2.059814453125, -1.49658203125, -0.933349609375, -0.3701171875, 0.193115234375, 0.75634765625, 1.319580078125, 1.8828125, 2.446044921875, 3.00927734375, 3.572509765625, 4.1357421875, 4.698974609375, 5.26220703125, 5.825439453125, 6.388671875, 6.951904296875, 7.51513671875, 8.078369140625, 8.6416015625, 9.204833984375, 9.76806640625, 10.331298828125, 10.89453125, 11.457763671875, 12.02099609375, 12.584228515625, 13.1474609375, 13.710693359375, 14.27392578125, 14.837158203125, 15.400390625, 15.963623046875, 16.52685546875, 17.090087890625, 17.6533203125, 18.216552734375, 18.77978515625, 19.343017578125, 19.90625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 9.0, 14.0, 15.0, 19.0, 23.0, 37.0, 31.0, 57.0, 76.0, 131.0, 228.0, 433.0, 984.0, 2513.0, 8819.0, 60784.0, 1567072.0, 1434072.0, 57354.0, 8690.0, 2384.0, 853.0, 424.0, 207.0, 124.0, 75.0, 57.0, 38.0, 28.0, 25.0, 23.0, 15.0, 16.0, 14.0, 11.0, 4.0, 6.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.484375, -22.7724609375, -22.060546875, -21.3486328125, -20.63671875, -19.9248046875, -19.212890625, -18.5009765625, -17.7890625, -17.0771484375, -16.365234375, -15.6533203125, -14.94140625, -14.2294921875, -13.517578125, -12.8056640625, -12.09375, -11.3818359375, -10.669921875, -9.9580078125, -9.24609375, -8.5341796875, -7.822265625, -7.1103515625, -6.3984375, -5.6865234375, -4.974609375, -4.2626953125, -3.55078125, -2.8388671875, -2.126953125, -1.4150390625, -0.703125, 0.0087890625, 0.720703125, 1.4326171875, 2.14453125, 2.8564453125, 3.568359375, 4.2802734375, 4.9921875, 5.7041015625, 6.416015625, 7.1279296875, 7.83984375, 8.5517578125, 9.263671875, 9.9755859375, 10.6875, 11.3994140625, 12.111328125, 12.8232421875, 13.53515625, 14.2470703125, 14.958984375, 15.6708984375, 16.3828125, 17.0947265625, 17.806640625, 18.5185546875, 19.23046875, 19.9423828125, 20.654296875, 21.3662109375, 22.078125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 13.0, 46.0, 79.0, 214.0, 253.0, 216.0, 125.0, 40.0, 18.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.325801849365234, -18.867883682250977, -16.40996551513672, -13.952045440673828, -11.49412727355957, -9.036209106445312, -6.578289985656738, -4.120370864868164, -1.6624526977539062, 0.7954659461975098, 3.253384590148926, 5.711303234100342, 8.169221878051758, 10.627140045166016, 13.08505916595459, 15.542978286743164, 18.000896453857422, 20.45881462097168, 22.916732788085938, 25.374652862548828, 27.832571029663086, 30.290489196777344, 32.748409271240234, 35.206329345703125, 37.66424560546875, 40.12216567993164, 42.580081939697266, 45.038002014160156, 47.49591827392578, 49.95383834838867, 52.41175842285156, 54.86967468261719, 57.32759094238281, 59.7855110168457, 62.24342727661133, 64.70134735107422, 67.15926361083984, 69.6171875, 72.07510375976562, 74.53302001953125, 76.99093627929688, 79.4488525390625, 81.90677642822266, 84.36469268798828, 86.8226089477539, 89.28053283691406, 91.73844909667969, 94.19636535644531, 96.65428924560547, 99.1122055053711, 101.57012939453125, 104.02804565429688, 106.4859619140625, 108.94387817382812, 111.40180206298828, 113.8597183227539, 116.31764221191406, 118.77555847167969, 121.23348236083984, 123.69139862060547, 126.1493148803711, 128.60723876953125, 131.06515502929688, 133.5230712890625, 135.98098754882812]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 16.0, 6.0, 17.0, 15.0, 20.0, 15.0, 35.0, 21.0, 32.0, 26.0, 35.0, 40.0, 42.0, 42.0, 36.0, 39.0, 34.0, 38.0, 40.0, 33.0, 38.0, 47.0, 27.0, 24.0, 28.0, 25.0, 27.0, 22.0, 21.0, 24.0, 36.0, 11.0, 12.0, 3.0, 6.0, 6.0, 12.0, 8.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.223636627197266, -51.58935546875, -49.955078125, -48.320796966552734, -46.68651580810547, -45.0522346496582, -43.41795349121094, -41.78367614746094, -40.14939498901367, -38.515113830566406, -36.880836486816406, -35.24655532836914, -33.612274169921875, -31.97799301147461, -30.343713760375977, -28.709434509277344, -27.075153350830078, -25.440872192382812, -23.80659294128418, -22.172313690185547, -20.53803253173828, -18.903751373291016, -17.269472122192383, -15.635191917419434, -14.000911712646484, -12.366631507873535, -10.732351303100586, -9.098071098327637, -7.4637908935546875, -5.829510688781738, -4.195230484008789, -2.56095027923584, -0.9266700744628906, 0.7076101303100586, 2.341890335083008, 3.976170539855957, 5.610450744628906, 7.2447309494018555, 8.879011154174805, 10.513291358947754, 12.147571563720703, 13.781851768493652, 15.416131973266602, 17.050411224365234, 18.6846923828125, 20.318973541259766, 21.9532527923584, 23.58753204345703, 25.221813201904297, 26.856094360351562, 28.490373611450195, 30.124652862548828, 31.758934020996094, 33.39321517944336, 35.027496337890625, 36.661773681640625, 38.29605484008789, 39.930335998535156, 41.564613342285156, 43.19889450073242, 44.83317565917969, 46.46745681762695, 48.10173797607422, 49.73601531982422, 51.370296478271484]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 1.0, 2.0, 5.0, 9.0, 12.0, 9.0, 10.0, 15.0, 9.0, 16.0, 18.0, 28.0, 27.0, 28.0, 31.0, 43.0, 46.0, 31.0, 31.0, 36.0, 42.0, 49.0, 42.0, 37.0, 38.0, 37.0, 32.0, 38.0, 34.0, 38.0, 34.0, 21.0, 26.0, 20.0, 12.0, 17.0, 11.0, 11.0, 6.0, 8.0, 5.0, 8.0, 3.0, 8.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.4453125, -4.30218505859375, -4.1590576171875, -4.01593017578125, -3.872802734375, -3.72967529296875, -3.5865478515625, -3.44342041015625, -3.30029296875, -3.15716552734375, -3.0140380859375, -2.87091064453125, -2.727783203125, -2.58465576171875, -2.4415283203125, -2.29840087890625, -2.1552734375, -2.01214599609375, -1.8690185546875, -1.72589111328125, -1.582763671875, -1.43963623046875, -1.2965087890625, -1.15338134765625, -1.01025390625, -0.86712646484375, -0.7239990234375, -0.58087158203125, -0.437744140625, -0.29461669921875, -0.1514892578125, -0.00836181640625, 0.134765625, 0.27789306640625, 0.4210205078125, 0.56414794921875, 0.707275390625, 0.85040283203125, 0.9935302734375, 1.13665771484375, 1.27978515625, 1.42291259765625, 1.5660400390625, 1.70916748046875, 1.852294921875, 1.99542236328125, 2.1385498046875, 2.28167724609375, 2.4248046875, 2.56793212890625, 2.7110595703125, 2.85418701171875, 2.997314453125, 3.14044189453125, 3.2835693359375, 3.42669677734375, 3.56982421875, 3.71295166015625, 3.8560791015625, 3.99920654296875, 4.142333984375, 4.28546142578125, 4.4285888671875, 4.57171630859375, 4.71484375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 14.0, 19.0, 29.0, 25.0, 51.0, 69.0, 93.0, 122.0, 222.0, 327.0, 537.0, 868.0, 1632.0, 3089.0, 7105.0, 19179.0, 62455.0, 250995.0, 1068053.0, 1928173.0, 638698.0, 148582.0, 40099.0, 13114.0, 5196.0, 2368.0, 1206.0, 664.0, 402.0, 261.0, 173.0, 123.0, 95.0, 67.0, 49.0, 31.0, 20.0, 19.0, 11.0, 8.0, 12.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9453125, -8.6502685546875, -8.355224609375, -8.0601806640625, -7.76513671875, -7.4700927734375, -7.175048828125, -6.8800048828125, -6.5849609375, -6.2899169921875, -5.994873046875, -5.6998291015625, -5.40478515625, -5.1097412109375, -4.814697265625, -4.5196533203125, -4.224609375, -3.9295654296875, -3.634521484375, -3.3394775390625, -3.04443359375, -2.7493896484375, -2.454345703125, -2.1593017578125, -1.8642578125, -1.5692138671875, -1.274169921875, -0.9791259765625, -0.68408203125, -0.3890380859375, -0.093994140625, 0.2010498046875, 0.49609375, 0.7911376953125, 1.086181640625, 1.3812255859375, 1.67626953125, 1.9713134765625, 2.266357421875, 2.5614013671875, 2.8564453125, 3.1514892578125, 3.446533203125, 3.7415771484375, 4.03662109375, 4.3316650390625, 4.626708984375, 4.9217529296875, 5.216796875, 5.5118408203125, 5.806884765625, 6.1019287109375, 6.39697265625, 6.6920166015625, 6.987060546875, 7.2821044921875, 7.5771484375, 7.8721923828125, 8.167236328125, 8.4622802734375, 8.75732421875, 9.0523681640625, 9.347412109375, 9.6424560546875, 9.9375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 10.0, 9.0, 4.0, 13.0, 20.0, 26.0, 31.0, 52.0, 69.0, 89.0, 125.0, 174.0, 196.0, 286.0, 335.0, 396.0, 418.0, 354.0, 350.0, 260.0, 174.0, 169.0, 138.0, 84.0, 83.0, 52.0, 39.0, 22.0, 23.0, 18.0, 10.0, 6.0, 4.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.28125, -10.9219970703125, -10.562744140625, -10.2034912109375, -9.84423828125, -9.4849853515625, -9.125732421875, -8.7664794921875, -8.4072265625, -8.0479736328125, -7.688720703125, -7.3294677734375, -6.97021484375, -6.6109619140625, -6.251708984375, -5.8924560546875, -5.533203125, -5.1739501953125, -4.814697265625, -4.4554443359375, -4.09619140625, -3.7369384765625, -3.377685546875, -3.0184326171875, -2.6591796875, -2.2999267578125, -1.940673828125, -1.5814208984375, -1.22216796875, -0.8629150390625, -0.503662109375, -0.1444091796875, 0.21484375, 0.5740966796875, 0.933349609375, 1.2926025390625, 1.65185546875, 2.0111083984375, 2.370361328125, 2.7296142578125, 3.0888671875, 3.4481201171875, 3.807373046875, 4.1666259765625, 4.52587890625, 4.8851318359375, 5.244384765625, 5.6036376953125, 5.962890625, 6.3221435546875, 6.681396484375, 7.0406494140625, 7.39990234375, 7.7591552734375, 8.118408203125, 8.4776611328125, 8.8369140625, 9.1961669921875, 9.555419921875, 9.9146728515625, 10.27392578125, 10.6331787109375, 10.992431640625, 11.3516845703125, 11.7109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 7.0, 9.0, 18.0, 29.0, 33.0, 61.0, 96.0, 155.0, 314.0, 519.0, 903.0, 1752.0, 3784.0, 9285.0, 27118.0, 100107.0, 441238.0, 1656899.0, 1464807.0, 364896.0, 83577.0, 23457.0, 8228.0, 3421.0, 1609.0, 841.0, 469.0, 262.0, 129.0, 108.0, 39.0, 25.0, 17.0, 17.0, 10.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.609375, -15.12060546875, -14.6318359375, -14.14306640625, -13.654296875, -13.16552734375, -12.6767578125, -12.18798828125, -11.69921875, -11.21044921875, -10.7216796875, -10.23291015625, -9.744140625, -9.25537109375, -8.7666015625, -8.27783203125, -7.7890625, -7.30029296875, -6.8115234375, -6.32275390625, -5.833984375, -5.34521484375, -4.8564453125, -4.36767578125, -3.87890625, -3.39013671875, -2.9013671875, -2.41259765625, -1.923828125, -1.43505859375, -0.9462890625, -0.45751953125, 0.03125, 0.52001953125, 1.0087890625, 1.49755859375, 1.986328125, 2.47509765625, 2.9638671875, 3.45263671875, 3.94140625, 4.43017578125, 4.9189453125, 5.40771484375, 5.896484375, 6.38525390625, 6.8740234375, 7.36279296875, 7.8515625, 8.34033203125, 8.8291015625, 9.31787109375, 9.806640625, 10.29541015625, 10.7841796875, 11.27294921875, 11.76171875, 12.25048828125, 12.7392578125, 13.22802734375, 13.716796875, 14.20556640625, 14.6943359375, 15.18310546875, 15.671875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 11.0, 16.0, 22.0, 38.0, 39.0, 60.0, 74.0, 73.0, 83.0, 115.0, 117.0, 82.0, 70.0, 66.0, 57.0, 29.0, 26.0, 16.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.72368621826172, -91.61333465576172, -89.50298309326172, -87.39262390136719, -85.28227233886719, -83.17192077636719, -81.06156921386719, -78.95121765136719, -76.84085845947266, -74.73050689697266, -72.62015533447266, -70.50979614257812, -68.39944458007812, -66.28909301757812, -64.17874145507812, -62.06838607788086, -59.95803451538086, -57.84768295288086, -55.737327575683594, -53.626976013183594, -51.51662063598633, -49.40626907348633, -47.29591369628906, -45.18556213378906, -43.07521057128906, -40.96485900878906, -38.8545036315918, -36.7441520690918, -34.63379669189453, -32.52344512939453, -30.4130916595459, -28.302738189697266, -26.192378997802734, -24.0820255279541, -21.97167205810547, -19.86132049560547, -17.750965118408203, -15.640612602233887, -13.53026008605957, -11.419906616210938, -9.309553146362305, -7.199199676513672, -5.088846683502197, -2.9784936904907227, -0.8681402206420898, 1.242213249206543, 3.3525657653808594, 5.462919235229492, 7.573272705078125, 9.683626174926758, 11.79397964477539, 13.904332160949707, 16.014686584472656, 18.125038146972656, 20.23539161682129, 22.345745086669922, 24.456098556518555, 26.566452026367188, 28.67680549621582, 30.787158966064453, 32.89751052856445, 35.00786590576172, 37.11821746826172, 39.22856903076172, 41.338924407958984]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 1.0, 6.0, 5.0, 5.0, 12.0, 5.0, 12.0, 16.0, 15.0, 22.0, 19.0, 20.0, 24.0, 22.0, 25.0, 46.0, 29.0, 36.0, 24.0, 43.0, 28.0, 43.0, 29.0, 43.0, 39.0, 35.0, 36.0, 33.0, 36.0, 25.0, 34.0, 33.0, 22.0, 22.0, 25.0, 19.0, 13.0, 11.0, 12.0, 17.0, 18.0, 12.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-41.351837158203125, -40.137672424316406, -38.92351150512695, -37.7093505859375, -36.49518585205078, -35.28102111816406, -34.06686019897461, -32.852699279785156, -31.638534545898438, -30.42437171936035, -29.210208892822266, -27.99604606628418, -26.781883239746094, -25.567720413208008, -24.353557586669922, -23.139394760131836, -21.92523193359375, -20.711069107055664, -19.496906280517578, -18.282743453979492, -17.068580627441406, -15.85441780090332, -14.640254974365234, -13.426092147827148, -12.211929321289062, -10.997766494750977, -9.78360366821289, -8.569440841674805, -7.355278015136719, -6.141115188598633, -4.926952362060547, -3.712789535522461, -2.4986228942871094, -1.2844600677490234, -0.0702972412109375, 1.1438655853271484, 2.3580284118652344, 3.5721912384033203, 4.786354064941406, 6.000516891479492, 7.214679718017578, 8.428842544555664, 9.64300537109375, 10.857168197631836, 12.071331024169922, 13.285493850708008, 14.499656677246094, 15.71381950378418, 16.927982330322266, 18.14214515686035, 19.356307983398438, 20.570470809936523, 21.78463363647461, 22.998796463012695, 24.21295928955078, 25.427122116088867, 26.641284942626953, 27.85544776916504, 29.069610595703125, 30.28377342224121, 31.497936248779297, 32.71209716796875, 33.92626190185547, 35.14042663574219, 36.35458755493164]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 8.0, 5.0, 11.0, 12.0, 21.0, 14.0, 17.0, 21.0, 18.0, 36.0, 38.0, 32.0, 30.0, 44.0, 35.0, 47.0, 42.0, 48.0, 39.0, 45.0, 38.0, 50.0, 34.0, 31.0, 34.0, 41.0, 25.0, 26.0, 20.0, 18.0, 25.0, 7.0, 12.0, 15.0, 11.0, 4.0, 4.0, 8.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.54296875, -4.3870849609375, -4.231201171875, -4.0753173828125, -3.91943359375, -3.7635498046875, -3.607666015625, -3.4517822265625, -3.2958984375, -3.1400146484375, -2.984130859375, -2.8282470703125, -2.67236328125, -2.5164794921875, -2.360595703125, -2.2047119140625, -2.048828125, -1.8929443359375, -1.737060546875, -1.5811767578125, -1.42529296875, -1.2694091796875, -1.113525390625, -0.9576416015625, -0.8017578125, -0.6458740234375, -0.489990234375, -0.3341064453125, -0.17822265625, -0.0223388671875, 0.133544921875, 0.2894287109375, 0.4453125, 0.6011962890625, 0.757080078125, 0.9129638671875, 1.06884765625, 1.2247314453125, 1.380615234375, 1.5364990234375, 1.6923828125, 1.8482666015625, 2.004150390625, 2.1600341796875, 2.31591796875, 2.4718017578125, 2.627685546875, 2.7835693359375, 2.939453125, 3.0953369140625, 3.251220703125, 3.4071044921875, 3.56298828125, 3.7188720703125, 3.874755859375, 4.0306396484375, 4.1865234375, 4.3424072265625, 4.498291015625, 4.6541748046875, 4.81005859375, 4.9659423828125, 5.121826171875, 5.2777099609375, 5.43359375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 12.0, 12.0, 15.0, 38.0, 37.0, 75.0, 94.0, 190.0, 290.0, 479.0, 903.0, 1682.0, 3130.0, 6667.0, 14172.0, 30666.0, 64021.0, 123719.0, 202227.0, 234828.0, 174362.0, 98601.0, 48646.0, 22840.0, 10381.0, 4957.0, 2400.0, 1271.0, 755.0, 416.0, 247.0, 150.0, 84.0, 66.0, 35.0, 29.0, 27.0, 10.0, 8.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.97515869140625, -1.9053955078125, -1.83563232421875, -1.765869140625, -1.69610595703125, -1.6263427734375, -1.55657958984375, -1.48681640625, -1.41705322265625, -1.3472900390625, -1.27752685546875, -1.207763671875, -1.13800048828125, -1.0682373046875, -0.99847412109375, -0.9287109375, -0.85894775390625, -0.7891845703125, -0.71942138671875, -0.649658203125, -0.57989501953125, -0.5101318359375, -0.44036865234375, -0.37060546875, -0.30084228515625, -0.2310791015625, -0.16131591796875, -0.091552734375, -0.02178955078125, 0.0479736328125, 0.11773681640625, 0.1875, 0.25726318359375, 0.3270263671875, 0.39678955078125, 0.466552734375, 0.53631591796875, 0.6060791015625, 0.67584228515625, 0.74560546875, 0.81536865234375, 0.8851318359375, 0.95489501953125, 1.024658203125, 1.09442138671875, 1.1641845703125, 1.23394775390625, 1.3037109375, 1.37347412109375, 1.4432373046875, 1.51300048828125, 1.582763671875, 1.65252685546875, 1.7222900390625, 1.79205322265625, 1.86181640625, 1.93157958984375, 2.0013427734375, 2.07110595703125, 2.140869140625, 2.21063232421875, 2.2803955078125, 2.35015869140625, 2.419921875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0, 9.0, 8.0, 11.0, 5.0, 14.0, 13.0, 15.0, 24.0, 23.0, 22.0, 24.0, 24.0, 35.0, 25.0, 37.0, 25.0, 34.0, 37.0, 21.0, 35.0, 34.0, 1062.0, 51.0, 35.0, 39.0, 35.0, 22.0, 21.0, 31.0, 31.0, 26.0, 27.0, 20.0, 22.0, 17.0, 17.0, 16.0, 14.0, 8.0, 8.0, 4.0, 10.0, 8.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.19140625, -3.087127685546875, -2.98284912109375, -2.878570556640625, -2.7742919921875, -2.670013427734375, -2.56573486328125, -2.461456298828125, -2.357177734375, -2.252899169921875, -2.14862060546875, -2.044342041015625, -1.9400634765625, -1.835784912109375, -1.73150634765625, -1.627227783203125, -1.52294921875, -1.418670654296875, -1.31439208984375, -1.210113525390625, -1.1058349609375, -1.001556396484375, -0.89727783203125, -0.792999267578125, -0.688720703125, -0.584442138671875, -0.48016357421875, -0.375885009765625, -0.2716064453125, -0.167327880859375, -0.06304931640625, 0.041229248046875, 0.1455078125, 0.249786376953125, 0.35406494140625, 0.458343505859375, 0.5626220703125, 0.666900634765625, 0.77117919921875, 0.875457763671875, 0.979736328125, 1.084014892578125, 1.18829345703125, 1.292572021484375, 1.3968505859375, 1.501129150390625, 1.60540771484375, 1.709686279296875, 1.81396484375, 1.918243408203125, 2.02252197265625, 2.126800537109375, 2.2310791015625, 2.335357666015625, 2.43963623046875, 2.543914794921875, 2.648193359375, 2.752471923828125, 2.85675048828125, 2.961029052734375, 3.0653076171875, 3.169586181640625, 3.27386474609375, 3.378143310546875, 3.482421875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 9.0, 9.0, 17.0, 14.0, 19.0, 34.0, 41.0, 60.0, 109.0, 137.0, 177.0, 295.0, 469.0, 800.0, 1239.0, 1993.0, 3491.0, 5972.0, 10178.0, 18060.0, 34319.0, 1840323.0, 111952.0, 29156.0, 15562.0, 9125.0, 5358.0, 3190.0, 1868.0, 1122.0, 687.0, 429.0, 307.0, 191.0, 140.0, 88.0, 50.0, 41.0, 27.0, 27.0, 17.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.76171875, -2.67510986328125, -2.5885009765625, -2.50189208984375, -2.415283203125, -2.32867431640625, -2.2420654296875, -2.15545654296875, -2.06884765625, -1.98223876953125, -1.8956298828125, -1.80902099609375, -1.722412109375, -1.63580322265625, -1.5491943359375, -1.46258544921875, -1.3759765625, -1.28936767578125, -1.2027587890625, -1.11614990234375, -1.029541015625, -0.94293212890625, -0.8563232421875, -0.76971435546875, -0.68310546875, -0.59649658203125, -0.5098876953125, -0.42327880859375, -0.336669921875, -0.25006103515625, -0.1634521484375, -0.07684326171875, 0.009765625, 0.09637451171875, 0.1829833984375, 0.26959228515625, 0.356201171875, 0.44281005859375, 0.5294189453125, 0.61602783203125, 0.70263671875, 0.78924560546875, 0.8758544921875, 0.96246337890625, 1.049072265625, 1.13568115234375, 1.2222900390625, 1.30889892578125, 1.3955078125, 1.48211669921875, 1.5687255859375, 1.65533447265625, 1.741943359375, 1.82855224609375, 1.9151611328125, 2.00177001953125, 2.08837890625, 2.17498779296875, 2.2615966796875, 2.34820556640625, 2.434814453125, 2.52142333984375, 2.6080322265625, 2.69464111328125, 2.78125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 7.0, 3.0, 6.0, 6.0, 9.0, 13.0, 13.0, 22.0, 31.0, 25.0, 38.0, 37.0, 46.0, 60.0, 65.0, 55.0, 62.0, 67.0, 66.0, 63.0, 56.0, 43.0, 33.0, 38.0, 33.0, 22.0, 20.0, 10.0, 12.0, 9.0, 12.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07440185546875, -0.07213973999023438, -0.06987762451171875, -0.06761550903320312, -0.0653533935546875, -0.06309127807617188, -0.06082916259765625, -0.058567047119140625, -0.056304931640625, -0.054042816162109375, -0.05178070068359375, -0.049518585205078125, -0.0472564697265625, -0.044994354248046875, -0.04273223876953125, -0.040470123291015625, -0.0382080078125, -0.035945892333984375, -0.03368377685546875, -0.031421661376953125, -0.0291595458984375, -0.026897430419921875, -0.02463531494140625, -0.022373199462890625, -0.020111083984375, -0.017848968505859375, -0.01558685302734375, -0.013324737548828125, -0.0110626220703125, -0.008800506591796875, -0.00653839111328125, -0.004276275634765625, -0.00201416015625, 0.000247955322265625, 0.00251007080078125, 0.004772186279296875, 0.0070343017578125, 0.009296417236328125, 0.01155853271484375, 0.013820648193359375, 0.016082763671875, 0.018344879150390625, 0.02060699462890625, 0.022869110107421875, 0.0251312255859375, 0.027393341064453125, 0.02965545654296875, 0.031917572021484375, 0.0341796875, 0.036441802978515625, 0.03870391845703125, 0.040966033935546875, 0.0432281494140625, 0.045490264892578125, 0.04775238037109375, 0.050014495849609375, 0.052276611328125, 0.054538726806640625, 0.05680084228515625, 0.059062957763671875, 0.0613250732421875, 0.06358718872070312, 0.06584930419921875, 0.06811141967773438, 0.07037353515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 3.0, 13.0, 15.0, 16.0, 17.0, 29.0, 33.0, 51.0, 76.0, 91.0, 135.0, 199.0, 388.0, 1555.0, 19837.0, 481975.0, 520400.0, 21034.0, 1657.0, 374.0, 207.0, 115.0, 78.0, 57.0, 45.0, 38.0, 30.0, 18.0, 16.0, 6.0, 10.0, 8.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4453125, -1.4028167724609375, -1.360321044921875, -1.3178253173828125, -1.27532958984375, -1.2328338623046875, -1.190338134765625, -1.1478424072265625, -1.1053466796875, -1.0628509521484375, -1.020355224609375, -0.9778594970703125, -0.93536376953125, -0.8928680419921875, -0.850372314453125, -0.8078765869140625, -0.765380859375, -0.7228851318359375, -0.680389404296875, -0.6378936767578125, -0.59539794921875, -0.5529022216796875, -0.510406494140625, -0.4679107666015625, -0.4254150390625, -0.3829193115234375, -0.340423583984375, -0.2979278564453125, -0.25543212890625, -0.2129364013671875, -0.170440673828125, -0.1279449462890625, -0.08544921875, -0.0429534912109375, -0.000457763671875, 0.0420379638671875, 0.08453369140625, 0.1270294189453125, 0.169525146484375, 0.2120208740234375, 0.2545166015625, 0.2970123291015625, 0.339508056640625, 0.3820037841796875, 0.42449951171875, 0.4669952392578125, 0.509490966796875, 0.5519866943359375, 0.594482421875, 0.6369781494140625, 0.679473876953125, 0.7219696044921875, 0.76446533203125, 0.8069610595703125, 0.849456787109375, 0.8919525146484375, 0.9344482421875, 0.9769439697265625, 1.019439697265625, 1.0619354248046875, 1.10443115234375, 1.1469268798828125, 1.189422607421875, 1.2319183349609375, 1.2744140625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 6.0, 7.0, 5.0, 7.0, 14.0, 25.0, 36.0, 40.0, 68.0, 99.0, 148.0, 186.0, 130.0, 81.0, 48.0, 33.0, 16.0, 18.0, 8.0, 6.0, 9.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9378912448883057, -0.9179753661155701, -0.8980594873428345, -0.8781436681747437, -0.8582277894020081, -0.8383119106292725, -0.8183960914611816, -0.798480212688446, -0.7785643339157104, -0.7586484551429749, -0.7387325763702393, -0.7188167572021484, -0.6989008784294128, -0.6789849996566772, -0.6590691804885864, -0.6391533017158508, -0.6192374229431152, -0.5993215441703796, -0.579405665397644, -0.5594898462295532, -0.5395739674568176, -0.519658088684082, -0.4997422397136688, -0.4798263907432556, -0.45991051197052, -0.4399946331977844, -0.4200787842273712, -0.400162935256958, -0.3802470564842224, -0.3603311777114868, -0.3404153287410736, -0.3204994797706604, -0.3005836308002472, -0.280667781829834, -0.2607519030570984, -0.240836039185524, -0.22092017531394958, -0.20100431144237518, -0.18108844757080078, -0.16117258369922638, -0.14125671982765198, -0.12134085595607758, -0.10142499208450317, -0.08150912821292877, -0.06159326434135437, -0.04167740046977997, -0.021761536598205566, -0.0018456727266311646, 0.018070191144943237, 0.03798605501651764, 0.05790191888809204, 0.07781778275966644, 0.09773364663124084, 0.11764951050281525, 0.13756537437438965, 0.15748123824596405, 0.17739710211753845, 0.19731296598911285, 0.21722882986068726, 0.23714469373226166, 0.25706055760383606, 0.27697640657424927, 0.29689228534698486, 0.31680816411972046, 0.33672401309013367]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 16.0, 19.0, 16.0, 17.0, 23.0, 22.0, 14.0, 23.0, 23.0, 33.0, 38.0, 32.0, 35.0, 37.0, 35.0, 49.0, 40.0, 56.0, 48.0, 36.0, 33.0, 31.0, 36.0, 31.0, 25.0, 25.0, 36.0, 18.0, 19.0, 24.0, 16.0, 12.0, 13.0, 13.0, 9.0, 10.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.09872967004776001, -0.09589646756649017, -0.09306326508522034, -0.0902300626039505, -0.08739686012268066, -0.08456365764141083, -0.08173045516014099, -0.07889725267887115, -0.07606405019760132, -0.07323084771633148, -0.07039764523506165, -0.06756444275379181, -0.06473124027252197, -0.061898037791252136, -0.0590648353099823, -0.05623163282871246, -0.05339843034744263, -0.05056522786617279, -0.047732025384902954, -0.04489882290363312, -0.04206562042236328, -0.039232417941093445, -0.03639921545982361, -0.03356601297855377, -0.030732810497283936, -0.0278996080160141, -0.025066405534744263, -0.022233203053474426, -0.01940000057220459, -0.016566798090934753, -0.013733595609664917, -0.01090039312839508, -0.008067190647125244, -0.005233988165855408, -0.0024007856845855713, 0.00043241679668426514, 0.0032656192779541016, 0.006098821759223938, 0.008932024240493774, 0.01176522672176361, 0.014598429203033447, 0.017431631684303284, 0.02026483416557312, 0.023098036646842957, 0.025931239128112793, 0.02876444160938263, 0.031597644090652466, 0.0344308465719223, 0.03726404905319214, 0.040097251534461975, 0.04293045401573181, 0.04576365649700165, 0.048596858978271484, 0.05143006145954132, 0.05426326394081116, 0.057096466422080994, 0.05992966890335083, 0.06276287138462067, 0.0655960738658905, 0.06842927634716034, 0.07126247882843018, 0.07409568130970001, 0.07692888379096985, 0.07976208627223969, 0.08259528875350952]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 12.0, 13.0, 11.0, 12.0, 16.0, 15.0, 26.0, 33.0, 25.0, 32.0, 40.0, 32.0, 37.0, 55.0, 62.0, 50.0, 38.0, 47.0, 44.0, 47.0, 56.0, 39.0, 34.0, 34.0, 25.0, 24.0, 20.0, 18.0, 18.0, 15.0, 6.0, 16.0, 9.0, 4.0, 5.0, 3.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.5, -5.3310546875, -5.162109375, -4.9931640625, -4.82421875, -4.6552734375, -4.486328125, -4.3173828125, -4.1484375, -3.9794921875, -3.810546875, -3.6416015625, -3.47265625, -3.3037109375, -3.134765625, -2.9658203125, -2.796875, -2.6279296875, -2.458984375, -2.2900390625, -2.12109375, -1.9521484375, -1.783203125, -1.6142578125, -1.4453125, -1.2763671875, -1.107421875, -0.9384765625, -0.76953125, -0.6005859375, -0.431640625, -0.2626953125, -0.09375, 0.0751953125, 0.244140625, 0.4130859375, 0.58203125, 0.7509765625, 0.919921875, 1.0888671875, 1.2578125, 1.4267578125, 1.595703125, 1.7646484375, 1.93359375, 2.1025390625, 2.271484375, 2.4404296875, 2.609375, 2.7783203125, 2.947265625, 3.1162109375, 3.28515625, 3.4541015625, 3.623046875, 3.7919921875, 3.9609375, 4.1298828125, 4.298828125, 4.4677734375, 4.63671875, 4.8056640625, 4.974609375, 5.1435546875, 5.3125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 10.0, 6.0, 13.0, 8.0, 19.0, 21.0, 25.0, 38.0, 56.0, 75.0, 140.0, 234.0, 373.0, 625.0, 969.0, 1609.0, 2789.0, 4593.0, 8353.0, 16117.0, 32157.0, 66775.0, 143954.0, 297192.0, 249097.0, 113506.0, 53535.0, 26266.0, 13133.0, 6937.0, 3984.0, 2299.0, 1407.0, 835.0, 506.0, 320.0, 199.0, 128.0, 80.0, 52.0, 32.0, 21.0, 14.0, 13.0, 13.0, 8.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -4.979736328125, -4.80712890625, -4.634521484375, -4.4619140625, -4.289306640625, -4.11669921875, -3.944091796875, -3.771484375, -3.598876953125, -3.42626953125, -3.253662109375, -3.0810546875, -2.908447265625, -2.73583984375, -2.563232421875, -2.390625, -2.218017578125, -2.04541015625, -1.872802734375, -1.7001953125, -1.527587890625, -1.35498046875, -1.182373046875, -1.009765625, -0.837158203125, -0.66455078125, -0.491943359375, -0.3193359375, -0.146728515625, 0.02587890625, 0.198486328125, 0.37109375, 0.543701171875, 0.71630859375, 0.888916015625, 1.0615234375, 1.234130859375, 1.40673828125, 1.579345703125, 1.751953125, 1.924560546875, 2.09716796875, 2.269775390625, 2.4423828125, 2.614990234375, 2.78759765625, 2.960205078125, 3.1328125, 3.305419921875, 3.47802734375, 3.650634765625, 3.8232421875, 3.995849609375, 4.16845703125, 4.341064453125, 4.513671875, 4.686279296875, 4.85888671875, 5.031494140625, 5.2041015625, 5.376708984375, 5.54931640625, 5.721923828125, 5.89453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 5.0, 4.0, 7.0, 11.0, 6.0, 11.0, 16.0, 13.0, 20.0, 31.0, 32.0, 27.0, 45.0, 41.0, 51.0, 65.0, 104.0, 209.0, 1418.0, 292.0, 156.0, 87.0, 66.0, 56.0, 54.0, 42.0, 27.0, 35.0, 24.0, 20.0, 16.0, 15.0, 15.0, 9.0, 8.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.953125, -21.322509765625, -20.69189453125, -20.061279296875, -19.4306640625, -18.800048828125, -18.16943359375, -17.538818359375, -16.908203125, -16.277587890625, -15.64697265625, -15.016357421875, -14.3857421875, -13.755126953125, -13.12451171875, -12.493896484375, -11.86328125, -11.232666015625, -10.60205078125, -9.971435546875, -9.3408203125, -8.710205078125, -8.07958984375, -7.448974609375, -6.818359375, -6.187744140625, -5.55712890625, -4.926513671875, -4.2958984375, -3.665283203125, -3.03466796875, -2.404052734375, -1.7734375, -1.142822265625, -0.51220703125, 0.118408203125, 0.7490234375, 1.379638671875, 2.01025390625, 2.640869140625, 3.271484375, 3.902099609375, 4.53271484375, 5.163330078125, 5.7939453125, 6.424560546875, 7.05517578125, 7.685791015625, 8.31640625, 8.947021484375, 9.57763671875, 10.208251953125, 10.8388671875, 11.469482421875, 12.10009765625, 12.730712890625, 13.361328125, 13.991943359375, 14.62255859375, 15.253173828125, 15.8837890625, 16.514404296875, 17.14501953125, 17.775634765625, 18.40625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 3.0, 5.0, 4.0, 11.0, 14.0, 17.0, 28.0, 28.0, 35.0, 52.0, 55.0, 80.0, 114.0, 191.0, 313.0, 763.0, 3323.0, 29837.0, 1230721.0, 1836112.0, 38213.0, 3919.0, 833.0, 352.0, 181.0, 146.0, 81.0, 71.0, 51.0, 32.0, 24.0, 16.0, 13.0, 20.0, 8.0, 12.0, 7.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.734375, -27.778076171875, -26.82177734375, -25.865478515625, -24.9091796875, -23.952880859375, -22.99658203125, -22.040283203125, -21.083984375, -20.127685546875, -19.17138671875, -18.215087890625, -17.2587890625, -16.302490234375, -15.34619140625, -14.389892578125, -13.43359375, -12.477294921875, -11.52099609375, -10.564697265625, -9.6083984375, -8.652099609375, -7.69580078125, -6.739501953125, -5.783203125, -4.826904296875, -3.87060546875, -2.914306640625, -1.9580078125, -1.001708984375, -0.04541015625, 0.910888671875, 1.8671875, 2.823486328125, 3.77978515625, 4.736083984375, 5.6923828125, 6.648681640625, 7.60498046875, 8.561279296875, 9.517578125, 10.473876953125, 11.43017578125, 12.386474609375, 13.3427734375, 14.299072265625, 15.25537109375, 16.211669921875, 17.16796875, 18.124267578125, 19.08056640625, 20.036865234375, 20.9931640625, 21.949462890625, 22.90576171875, 23.862060546875, 24.818359375, 25.774658203125, 26.73095703125, 27.687255859375, 28.6435546875, 29.599853515625, 30.55615234375, 31.512451171875, 32.46875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 39.0, 145.0, 283.0, 356.0, 137.0, 47.0, 6.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-199.8175048828125, -196.18507385253906, -192.55264282226562, -188.9202117919922, -185.2877655029297, -181.65533447265625, -178.0229034423828, -174.39047241210938, -170.75804138183594, -167.1256103515625, -163.49317932128906, -159.86074829101562, -156.22830200195312, -152.5958709716797, -148.96343994140625, -145.3310089111328, -141.69857788085938, -138.06614685058594, -134.4337158203125, -130.80128479003906, -127.1688461303711, -123.53640747070312, -119.90397644042969, -116.27154541015625, -112.63910675048828, -109.00667572021484, -105.37423706054688, -101.74180603027344, -98.109375, -94.47694396972656, -90.8445053100586, -87.21207427978516, -83.57965087890625, -79.94721984863281, -76.31478118896484, -72.6823501586914, -69.04991912841797, -65.41748046875, -61.78504943847656, -58.152618408203125, -54.520179748535156, -50.88774490356445, -47.255313873291016, -43.62287902832031, -39.990447998046875, -36.35801315307617, -32.72557830810547, -29.09314727783203, -25.460716247558594, -21.828283309936523, -18.195850372314453, -14.563416481018066, -10.930983543395996, -7.298549652099609, -3.666116714477539, -0.03368377685546875, 3.5987491607666016, 7.231182098388672, 10.863615036010742, 14.496048927307129, 18.128482818603516, 21.760915756225586, 25.393348693847656, 29.025781631469727, 32.6582145690918]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 11.0, 8.0, 8.0, 10.0, 18.0, 16.0, 22.0, 18.0, 19.0, 29.0, 25.0, 37.0, 35.0, 26.0, 37.0, 33.0, 35.0, 48.0, 40.0, 50.0, 43.0, 35.0, 45.0, 43.0, 37.0, 40.0, 43.0, 30.0, 14.0, 26.0, 23.0, 16.0, 17.0, 18.0, 6.0, 6.0, 8.0, 5.0, 6.0, 1.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.201210021972656, -43.50514602661133, -41.80908203125, -40.11301803588867, -38.416954040527344, -36.72088623046875, -35.02482223510742, -33.328758239746094, -31.632694244384766, -29.936630249023438, -28.24056625366211, -26.54450035095215, -24.84843635559082, -23.152372360229492, -21.45630645751953, -19.760242462158203, -18.064178466796875, -16.368114471435547, -14.672049522399902, -12.975984573364258, -11.27992057800293, -9.583856582641602, -7.887791633605957, -6.1917266845703125, -4.495662689208984, -2.799598217010498, -1.1035337448120117, 0.5925307273864746, 2.288595199584961, 3.984659194946289, 5.680724143981934, 7.376789093017578, 9.07284927368164, 10.768913269042969, 12.464978218078613, 14.161043167114258, 15.857107162475586, 17.553171157836914, 19.249237060546875, 20.945301055908203, 22.64136505126953, 24.33742904663086, 26.033493041992188, 27.72955894470215, 29.425622940063477, 31.121686935424805, 32.817752838134766, 34.513816833496094, 36.20988082885742, 37.90594482421875, 39.60200881958008, 41.298072814941406, 42.994140625, 44.69020080566406, 46.386268615722656, 48.082332611083984, 49.77839660644531, 51.47446060180664, 53.17052459716797, 54.8665885925293, 56.562652587890625, 58.25872039794922, 59.95478439331055, 61.650848388671875, 63.3469123840332]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 8.0, 16.0, 17.0, 22.0, 17.0, 21.0, 22.0, 35.0, 27.0, 31.0, 32.0, 30.0, 37.0, 38.0, 43.0, 49.0, 36.0, 47.0, 49.0, 35.0, 43.0, 26.0, 26.0, 36.0, 25.0, 32.0, 17.0, 31.0, 19.0, 24.0, 18.0, 15.0, 9.0, 9.0, 6.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-5.015625, -4.85748291015625, -4.6993408203125, -4.54119873046875, -4.383056640625, -4.22491455078125, -4.0667724609375, -3.90863037109375, -3.75048828125, -3.59234619140625, -3.4342041015625, -3.27606201171875, -3.117919921875, -2.95977783203125, -2.8016357421875, -2.64349365234375, -2.4853515625, -2.32720947265625, -2.1690673828125, -2.01092529296875, -1.852783203125, -1.69464111328125, -1.5364990234375, -1.37835693359375, -1.22021484375, -1.06207275390625, -0.9039306640625, -0.74578857421875, -0.587646484375, -0.42950439453125, -0.2713623046875, -0.11322021484375, 0.044921875, 0.20306396484375, 0.3612060546875, 0.51934814453125, 0.677490234375, 0.83563232421875, 0.9937744140625, 1.15191650390625, 1.31005859375, 1.46820068359375, 1.6263427734375, 1.78448486328125, 1.942626953125, 2.10076904296875, 2.2589111328125, 2.41705322265625, 2.5751953125, 2.73333740234375, 2.8914794921875, 3.04962158203125, 3.207763671875, 3.36590576171875, 3.5240478515625, 3.68218994140625, 3.84033203125, 3.99847412109375, 4.1566162109375, 4.31475830078125, 4.472900390625, 4.63104248046875, 4.7891845703125, 4.94732666015625, 5.10546875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 5.0, 12.0, 13.0, 22.0, 23.0, 38.0, 46.0, 57.0, 87.0, 137.0, 216.0, 313.0, 500.0, 966.0, 1797.0, 3975.0, 10474.0, 33370.0, 127966.0, 562870.0, 1869856.0, 1203738.0, 279275.0, 66857.0, 19369.0, 6648.0, 2664.0, 1300.0, 635.0, 361.0, 208.0, 160.0, 88.0, 62.0, 39.0, 27.0, 23.0, 22.0, 14.0, 13.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-11.5390625, -11.2164306640625, -10.893798828125, -10.5711669921875, -10.24853515625, -9.9259033203125, -9.603271484375, -9.2806396484375, -8.9580078125, -8.6353759765625, -8.312744140625, -7.9901123046875, -7.66748046875, -7.3448486328125, -7.022216796875, -6.6995849609375, -6.376953125, -6.0543212890625, -5.731689453125, -5.4090576171875, -5.08642578125, -4.7637939453125, -4.441162109375, -4.1185302734375, -3.7958984375, -3.4732666015625, -3.150634765625, -2.8280029296875, -2.50537109375, -2.1827392578125, -1.860107421875, -1.5374755859375, -1.21484375, -0.8922119140625, -0.569580078125, -0.2469482421875, 0.07568359375, 0.3983154296875, 0.720947265625, 1.0435791015625, 1.3662109375, 1.6888427734375, 2.011474609375, 2.3341064453125, 2.65673828125, 2.9793701171875, 3.302001953125, 3.6246337890625, 3.947265625, 4.2698974609375, 4.592529296875, 4.9151611328125, 5.23779296875, 5.5604248046875, 5.883056640625, 6.2056884765625, 6.5283203125, 6.8509521484375, 7.173583984375, 7.4962158203125, 7.81884765625, 8.1414794921875, 8.464111328125, 8.7867431640625, 9.109375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 7.0, 17.0, 12.0, 23.0, 29.0, 45.0, 55.0, 88.0, 98.0, 125.0, 171.0, 221.0, 266.0, 318.0, 371.0, 380.0, 388.0, 317.0, 256.0, 207.0, 162.0, 124.0, 82.0, 72.0, 54.0, 41.0, 31.0, 26.0, 23.0, 7.0, 12.0, 9.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.6953125, -13.329345703125, -12.96337890625, -12.597412109375, -12.2314453125, -11.865478515625, -11.49951171875, -11.133544921875, -10.767578125, -10.401611328125, -10.03564453125, -9.669677734375, -9.3037109375, -8.937744140625, -8.57177734375, -8.205810546875, -7.83984375, -7.473876953125, -7.10791015625, -6.741943359375, -6.3759765625, -6.010009765625, -5.64404296875, -5.278076171875, -4.912109375, -4.546142578125, -4.18017578125, -3.814208984375, -3.4482421875, -3.082275390625, -2.71630859375, -2.350341796875, -1.984375, -1.618408203125, -1.25244140625, -0.886474609375, -0.5205078125, -0.154541015625, 0.21142578125, 0.577392578125, 0.943359375, 1.309326171875, 1.67529296875, 2.041259765625, 2.4072265625, 2.773193359375, 3.13916015625, 3.505126953125, 3.87109375, 4.237060546875, 4.60302734375, 4.968994140625, 5.3349609375, 5.700927734375, 6.06689453125, 6.432861328125, 6.798828125, 7.164794921875, 7.53076171875, 7.896728515625, 8.2626953125, 8.628662109375, 8.99462890625, 9.360595703125, 9.7265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 4.0, 15.0, 22.0, 18.0, 39.0, 73.0, 106.0, 161.0, 241.0, 385.0, 689.0, 1223.0, 2465.0, 5137.0, 11893.0, 31549.0, 94139.0, 303513.0, 934479.0, 1626106.0, 801240.0, 254839.0, 78965.0, 27226.0, 10371.0, 4540.0, 2179.0, 1149.0, 574.0, 355.0, 201.0, 114.0, 80.0, 52.0, 39.0, 33.0, 16.0, 15.0, 12.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -10.012451171875, -9.61865234375, -9.224853515625, -8.8310546875, -8.437255859375, -8.04345703125, -7.649658203125, -7.255859375, -6.862060546875, -6.46826171875, -6.074462890625, -5.6806640625, -5.286865234375, -4.89306640625, -4.499267578125, -4.10546875, -3.711669921875, -3.31787109375, -2.924072265625, -2.5302734375, -2.136474609375, -1.74267578125, -1.348876953125, -0.955078125, -0.561279296875, -0.16748046875, 0.226318359375, 0.6201171875, 1.013916015625, 1.40771484375, 1.801513671875, 2.1953125, 2.589111328125, 2.98291015625, 3.376708984375, 3.7705078125, 4.164306640625, 4.55810546875, 4.951904296875, 5.345703125, 5.739501953125, 6.13330078125, 6.527099609375, 6.9208984375, 7.314697265625, 7.70849609375, 8.102294921875, 8.49609375, 8.889892578125, 9.28369140625, 9.677490234375, 10.0712890625, 10.465087890625, 10.85888671875, 11.252685546875, 11.646484375, 12.040283203125, 12.43408203125, 12.827880859375, 13.2216796875, 13.615478515625, 14.00927734375, 14.403076171875, 14.796875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 11.0, 14.0, 33.0, 65.0, 92.0, 138.0, 138.0, 151.0, 127.0, 91.0, 64.0, 37.0, 20.0, 13.0, 7.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.08476257324219, -68.97450256347656, -65.86424255371094, -62.75397491455078, -59.643714904785156, -56.53345489501953, -53.42319107055664, -50.31292724609375, -47.202667236328125, -44.0924072265625, -40.98214340209961, -37.87187957763672, -34.761619567871094, -31.651357650756836, -28.541095733642578, -25.43083381652832, -22.320571899414062, -19.210309982299805, -16.100048065185547, -12.989786148071289, -9.879524230957031, -6.769262313842773, -3.6590003967285156, -0.5487384796142578, 2.5615234375, 5.671785354614258, 8.782047271728516, 11.892309188842773, 15.002571105957031, 18.11283302307129, 21.223094940185547, 24.333356857299805, 27.44361114501953, 30.55387306213379, 33.66413497924805, 36.77439880371094, 39.88465881347656, 42.99491882324219, 46.10518264770508, 49.21544647216797, 52.325706481933594, 55.43596649169922, 58.54623031616211, 61.656494140625, 64.76675415039062, 67.87701416015625, 70.98727416992188, 74.09754180908203, 77.20780181884766, 80.31806182861328, 83.42832946777344, 86.53858947753906, 89.64884948730469, 92.75910949707031, 95.86936950683594, 98.9796371459961, 102.08989715576172, 105.20015716552734, 108.3104248046875, 111.42068481445312, 114.53094482421875, 117.64120483398438, 120.75146484375, 123.86173248291016, 126.97199249267578]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 8.0, 12.0, 9.0, 8.0, 19.0, 27.0, 22.0, 25.0, 28.0, 28.0, 41.0, 33.0, 34.0, 43.0, 38.0, 35.0, 37.0, 40.0, 41.0, 44.0, 47.0, 43.0, 37.0, 32.0, 32.0, 28.0, 21.0, 23.0, 18.0, 18.0, 20.0, 22.0, 7.0, 10.0, 11.0, 6.0, 7.0, 6.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-47.998748779296875, -46.64862823486328, -45.29850769042969, -43.94838333129883, -42.598262786865234, -41.24814224243164, -39.89801788330078, -38.54789733886719, -37.197776794433594, -35.84765625, -34.497535705566406, -33.14741134643555, -31.797290802001953, -30.44717025756836, -29.097047805786133, -27.746925354003906, -26.396804809570312, -25.04668426513672, -23.696561813354492, -22.346439361572266, -20.996318817138672, -19.646198272705078, -18.29607582092285, -16.945953369140625, -15.595832824707031, -14.245711326599121, -12.895589828491211, -11.5454683303833, -10.19534683227539, -8.84522533416748, -7.49510383605957, -6.14498233795166, -4.794857025146484, -3.444735527038574, -2.094614028930664, -0.7444925308227539, 0.6056289672851562, 1.9557504653930664, 3.3058719635009766, 4.655993461608887, 6.006114959716797, 7.356236457824707, 8.706357955932617, 10.056479454040527, 11.406600952148438, 12.756722450256348, 14.106843948364258, 15.456965446472168, 16.807086944580078, 18.157207489013672, 19.5073299407959, 20.857452392578125, 22.20757293701172, 23.557693481445312, 24.90781593322754, 26.257938385009766, 27.60805892944336, 28.958179473876953, 30.30830192565918, 31.658424377441406, 33.008544921875, 34.358665466308594, 35.70878601074219, 37.05891036987305, 38.40903091430664]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 8.0, 17.0, 22.0, 16.0, 12.0, 18.0, 27.0, 30.0, 37.0, 33.0, 45.0, 41.0, 41.0, 45.0, 40.0, 34.0, 57.0, 49.0, 39.0, 35.0, 36.0, 35.0, 33.0, 34.0, 22.0, 34.0, 24.0, 17.0, 11.0, 12.0, 14.0, 16.0, 9.0, 6.0, 7.0, 6.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.62890625, -5.45916748046875, -5.2894287109375, -5.11968994140625, -4.949951171875, -4.78021240234375, -4.6104736328125, -4.44073486328125, -4.27099609375, -4.10125732421875, -3.9315185546875, -3.76177978515625, -3.592041015625, -3.42230224609375, -3.2525634765625, -3.08282470703125, -2.9130859375, -2.74334716796875, -2.5736083984375, -2.40386962890625, -2.234130859375, -2.06439208984375, -1.8946533203125, -1.72491455078125, -1.55517578125, -1.38543701171875, -1.2156982421875, -1.04595947265625, -0.876220703125, -0.70648193359375, -0.5367431640625, -0.36700439453125, -0.197265625, -0.02752685546875, 0.1422119140625, 0.31195068359375, 0.481689453125, 0.65142822265625, 0.8211669921875, 0.99090576171875, 1.16064453125, 1.33038330078125, 1.5001220703125, 1.66986083984375, 1.839599609375, 2.00933837890625, 2.1790771484375, 2.34881591796875, 2.5185546875, 2.68829345703125, 2.8580322265625, 3.02777099609375, 3.197509765625, 3.36724853515625, 3.5369873046875, 3.70672607421875, 3.87646484375, 4.04620361328125, 4.2159423828125, 4.38568115234375, 4.555419921875, 4.72515869140625, 4.8948974609375, 5.06463623046875, 5.234375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 5.0, 11.0, 25.0, 29.0, 42.0, 69.0, 104.0, 166.0, 238.0, 373.0, 630.0, 1078.0, 1851.0, 3128.0, 5622.0, 9970.0, 17948.0, 32377.0, 55094.0, 89097.0, 129652.0, 163103.0, 166033.0, 136211.0, 95253.0, 59836.0, 35060.0, 19928.0, 10983.0, 6129.0, 3460.0, 2014.0, 1170.0, 683.0, 413.0, 270.0, 173.0, 111.0, 67.0, 42.0, 41.0, 17.0, 14.0, 6.0, 7.0, 4.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-1.734375, -1.68194580078125, -1.6295166015625, -1.57708740234375, -1.524658203125, -1.47222900390625, -1.4197998046875, -1.36737060546875, -1.31494140625, -1.26251220703125, -1.2100830078125, -1.15765380859375, -1.105224609375, -1.05279541015625, -1.0003662109375, -0.94793701171875, -0.8955078125, -0.84307861328125, -0.7906494140625, -0.73822021484375, -0.685791015625, -0.63336181640625, -0.5809326171875, -0.52850341796875, -0.47607421875, -0.42364501953125, -0.3712158203125, -0.31878662109375, -0.266357421875, -0.21392822265625, -0.1614990234375, -0.10906982421875, -0.056640625, -0.00421142578125, 0.0482177734375, 0.10064697265625, 0.153076171875, 0.20550537109375, 0.2579345703125, 0.31036376953125, 0.36279296875, 0.41522216796875, 0.4676513671875, 0.52008056640625, 0.572509765625, 0.62493896484375, 0.6773681640625, 0.72979736328125, 0.7822265625, 0.83465576171875, 0.8870849609375, 0.93951416015625, 0.991943359375, 1.04437255859375, 1.0968017578125, 1.14923095703125, 1.20166015625, 1.25408935546875, 1.3065185546875, 1.35894775390625, 1.411376953125, 1.46380615234375, 1.5162353515625, 1.56866455078125, 1.62109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 6.0, 9.0, 8.0, 9.0, 13.0, 21.0, 20.0, 13.0, 21.0, 21.0, 32.0, 28.0, 25.0, 32.0, 24.0, 35.0, 32.0, 41.0, 26.0, 37.0, 1075.0, 45.0, 34.0, 30.0, 31.0, 33.0, 27.0, 25.0, 33.0, 21.0, 25.0, 18.0, 22.0, 23.0, 16.0, 16.0, 13.0, 13.0, 9.0, 5.0, 6.0, 12.0, 11.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-3.71875, -3.604095458984375, -3.48944091796875, -3.374786376953125, -3.2601318359375, -3.145477294921875, -3.03082275390625, -2.916168212890625, -2.801513671875, -2.686859130859375, -2.57220458984375, -2.457550048828125, -2.3428955078125, -2.228240966796875, -2.11358642578125, -1.998931884765625, -1.88427734375, -1.769622802734375, -1.65496826171875, -1.540313720703125, -1.4256591796875, -1.311004638671875, -1.19635009765625, -1.081695556640625, -0.967041015625, -0.852386474609375, -0.73773193359375, -0.623077392578125, -0.5084228515625, -0.393768310546875, -0.27911376953125, -0.164459228515625, -0.0498046875, 0.064849853515625, 0.17950439453125, 0.294158935546875, 0.4088134765625, 0.523468017578125, 0.63812255859375, 0.752777099609375, 0.867431640625, 0.982086181640625, 1.09674072265625, 1.211395263671875, 1.3260498046875, 1.440704345703125, 1.55535888671875, 1.670013427734375, 1.78466796875, 1.899322509765625, 2.01397705078125, 2.128631591796875, 2.2432861328125, 2.357940673828125, 2.47259521484375, 2.587249755859375, 2.701904296875, 2.816558837890625, 2.93121337890625, 3.045867919921875, 3.1605224609375, 3.275177001953125, 3.38983154296875, 3.504486083984375, 3.619140625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 5.0, 7.0, 13.0, 14.0, 18.0, 25.0, 42.0, 65.0, 76.0, 126.0, 205.0, 292.0, 442.0, 729.0, 1071.0, 1747.0, 2786.0, 4576.0, 7055.0, 11294.0, 18495.0, 31114.0, 478820.0, 1458151.0, 31209.0, 18277.0, 11236.0, 7154.0, 4359.0, 2819.0, 1765.0, 1136.0, 707.0, 451.0, 291.0, 176.0, 110.0, 85.0, 63.0, 41.0, 26.0, 22.0, 9.0, 14.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.529296875, -2.452667236328125, -2.37603759765625, -2.299407958984375, -2.2227783203125, -2.146148681640625, -2.06951904296875, -1.992889404296875, -1.916259765625, -1.839630126953125, -1.76300048828125, -1.686370849609375, -1.6097412109375, -1.533111572265625, -1.45648193359375, -1.379852294921875, -1.30322265625, -1.226593017578125, -1.14996337890625, -1.073333740234375, -0.9967041015625, -0.920074462890625, -0.84344482421875, -0.766815185546875, -0.690185546875, -0.613555908203125, -0.53692626953125, -0.460296630859375, -0.3836669921875, -0.307037353515625, -0.23040771484375, -0.153778076171875, -0.0771484375, -0.000518798828125, 0.07611083984375, 0.152740478515625, 0.2293701171875, 0.305999755859375, 0.38262939453125, 0.459259033203125, 0.535888671875, 0.612518310546875, 0.68914794921875, 0.765777587890625, 0.8424072265625, 0.919036865234375, 0.99566650390625, 1.072296142578125, 1.14892578125, 1.225555419921875, 1.30218505859375, 1.378814697265625, 1.4554443359375, 1.532073974609375, 1.60870361328125, 1.685333251953125, 1.761962890625, 1.838592529296875, 1.91522216796875, 1.991851806640625, 2.0684814453125, 2.145111083984375, 2.22174072265625, 2.298370361328125, 2.375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 9.0, 13.0, 16.0, 12.0, 10.0, 25.0, 21.0, 24.0, 34.0, 41.0, 48.0, 53.0, 66.0, 86.0, 104.0, 82.0, 65.0, 50.0, 26.0, 32.0, 35.0, 21.0, 16.0, 14.0, 14.0, 14.0, 11.0, 14.0, 11.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0771484375, -0.07475566864013672, -0.07236289978027344, -0.06997013092041016, -0.06757736206054688, -0.0651845932006836, -0.06279182434082031, -0.06039905548095703, -0.05800628662109375, -0.05561351776123047, -0.05322074890136719, -0.050827980041503906, -0.048435211181640625, -0.046042442321777344, -0.04364967346191406, -0.04125690460205078, -0.0388641357421875, -0.03647136688232422, -0.03407859802246094, -0.031685829162597656, -0.029293060302734375, -0.026900291442871094, -0.024507522583007812, -0.02211475372314453, -0.01972198486328125, -0.01732921600341797, -0.014936447143554688, -0.012543678283691406, -0.010150909423828125, -0.007758140563964844, -0.0053653717041015625, -0.0029726028442382812, -0.000579833984375, 0.0018129348754882812, 0.0042057037353515625, 0.006598472595214844, 0.008991241455078125, 0.011384010314941406, 0.013776779174804688, 0.01616954803466797, 0.01856231689453125, 0.02095508575439453, 0.023347854614257812, 0.025740623474121094, 0.028133392333984375, 0.030526161193847656, 0.03291893005371094, 0.03531169891357422, 0.0377044677734375, 0.04009723663330078, 0.04249000549316406, 0.044882774353027344, 0.047275543212890625, 0.049668312072753906, 0.05206108093261719, 0.05445384979248047, 0.05684661865234375, 0.05923938751220703, 0.06163215637207031, 0.0640249252319336, 0.06641769409179688, 0.06881046295166016, 0.07120323181152344, 0.07359600067138672, 0.07598876953125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 3.0, 5.0, 16.0, 9.0, 10.0, 21.0, 14.0, 27.0, 22.0, 46.0, 54.0, 69.0, 129.0, 208.0, 307.0, 690.0, 8879.0, 606189.0, 423606.0, 6704.0, 550.0, 322.0, 196.0, 118.0, 96.0, 66.0, 45.0, 24.0, 33.0, 19.0, 14.0, 10.0, 15.0, 7.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2830963134765625, -1.242950439453125, -1.2028045654296875, -1.16265869140625, -1.1225128173828125, -1.082366943359375, -1.0422210693359375, -1.0020751953125, -0.9619293212890625, -0.921783447265625, -0.8816375732421875, -0.84149169921875, -0.8013458251953125, -0.761199951171875, -0.7210540771484375, -0.680908203125, -0.6407623291015625, -0.600616455078125, -0.5604705810546875, -0.52032470703125, -0.4801788330078125, -0.440032958984375, -0.3998870849609375, -0.3597412109375, -0.3195953369140625, -0.279449462890625, -0.2393035888671875, -0.19915771484375, -0.1590118408203125, -0.118865966796875, -0.0787200927734375, -0.03857421875, 0.0015716552734375, 0.041717529296875, 0.0818634033203125, 0.12200927734375, 0.1621551513671875, 0.202301025390625, 0.2424468994140625, 0.2825927734375, 0.3227386474609375, 0.362884521484375, 0.4030303955078125, 0.44317626953125, 0.4833221435546875, 0.523468017578125, 0.5636138916015625, 0.603759765625, 0.6439056396484375, 0.684051513671875, 0.7241973876953125, 0.76434326171875, 0.8044891357421875, 0.844635009765625, 0.8847808837890625, 0.9249267578125, 0.9650726318359375, 1.005218505859375, 1.0453643798828125, 1.08551025390625, 1.1256561279296875, 1.165802001953125, 1.2059478759765625, 1.24609375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 19.0, 64.0, 186.0, 491.0, 167.0, 50.0, 23.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.980623483657837, -1.943557620048523, -1.9064918756484985, -1.8694260120391846, -1.8323602676391602, -1.7952944040298462, -1.7582285404205322, -1.7211627960205078, -1.6840969324111938, -1.6470310688018799, -1.6099653244018555, -1.5728994607925415, -1.535833716392517, -1.4987678527832031, -1.4617021083831787, -1.4246362447738647, -1.3875703811645508, -1.3505045175552368, -1.3134387731552124, -1.2763729095458984, -1.239307165145874, -1.20224130153656, -1.165175437927246, -1.1281096935272217, -1.0910439491271973, -1.0539780855178833, -1.0169123411178589, -0.9798464775085449, -0.9427806735038757, -0.9057148694992065, -0.8686490654945374, -0.8315832614898682, -0.7945172786712646, -0.7574514746665955, -0.7203856706619263, -0.6833198070526123, -0.6462540030479431, -0.6091881990432739, -0.5721223950386047, -0.5350565910339355, -0.49799078702926636, -0.46092498302459717, -0.4238591492176056, -0.3867933452129364, -0.3497275114059448, -0.31266170740127563, -0.27559590339660645, -0.23853006958961487, -0.20146426558494568, -0.1643984466791153, -0.1273326277732849, -0.09026682376861572, -0.05320100486278534, -0.016135185956954956, 0.020930618047714233, 0.05799645185470581, 0.095062255859375, 0.13212807476520538, 0.16919389367103577, 0.20625969767570496, 0.24332551658153534, 0.2803913354873657, 0.3174571394920349, 0.3545229732990265, 0.3915887773036957]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 12.0, 6.0, 14.0, 15.0, 16.0, 17.0, 15.0, 23.0, 20.0, 25.0, 25.0, 34.0, 46.0, 41.0, 37.0, 36.0, 38.0, 52.0, 51.0, 48.0, 38.0, 52.0, 34.0, 30.0, 36.0, 28.0, 33.0, 23.0, 31.0, 19.0, 21.0, 11.0, 15.0, 6.0, 10.0, 7.0, 3.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12902522087097168, -0.12495608627796173, -0.12088695168495178, -0.11681781709194183, -0.11274868249893188, -0.10867954790592194, -0.10461040586233139, -0.10054127126932144, -0.09647213667631149, -0.09240300208330154, -0.0883338674902916, -0.08426473289728165, -0.0801955908536911, -0.07612645626068115, -0.0720573216676712, -0.06798818707466125, -0.0639190524816513, -0.05984991788864136, -0.05578078329563141, -0.05171164497733116, -0.04764251038432121, -0.043573375791311264, -0.03950423747301102, -0.03543510288000107, -0.03136596828699112, -0.02729683369398117, -0.023227697238326073, -0.019158560782670975, -0.015089426189661026, -0.011020291596651077, -0.006951155140995979, -0.0028820186853408813, 0.0011871159076690674, 0.005256251432001591, 0.009325386956334114, 0.013394522480666637, 0.01746365800499916, 0.02153279259800911, 0.025601929053664207, 0.029671065509319305, 0.033740200102329254, 0.0378093346953392, 0.04187846928834915, 0.0459476076066494, 0.05001674219965935, 0.054085876792669296, 0.05815501511096954, 0.06222414970397949, 0.06629328429698944, 0.07036241888999939, 0.07443155348300934, 0.07850068807601929, 0.08256982266902924, 0.08663895726203918, 0.09070809930562973, 0.09477723389863968, 0.09884636849164963, 0.10291550308465958, 0.10698463767766953, 0.11105377227067947, 0.11512291431427002, 0.11919204890727997, 0.12326118350028992, 0.12733031809329987, 0.13139945268630981]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 4.0, 6.0, 5.0, 10.0, 6.0, 12.0, 13.0, 20.0, 24.0, 19.0, 26.0, 31.0, 40.0, 32.0, 38.0, 38.0, 61.0, 56.0, 32.0, 34.0, 43.0, 43.0, 35.0, 46.0, 45.0, 28.0, 32.0, 32.0, 36.0, 24.0, 24.0, 15.0, 16.0, 15.0, 10.0, 11.0, 6.0, 10.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.73046875, -5.5557861328125, -5.381103515625, -5.2064208984375, -5.03173828125, -4.8570556640625, -4.682373046875, -4.5076904296875, -4.3330078125, -4.1583251953125, -3.983642578125, -3.8089599609375, -3.63427734375, -3.4595947265625, -3.284912109375, -3.1102294921875, -2.935546875, -2.7608642578125, -2.586181640625, -2.4114990234375, -2.23681640625, -2.0621337890625, -1.887451171875, -1.7127685546875, -1.5380859375, -1.3634033203125, -1.188720703125, -1.0140380859375, -0.83935546875, -0.6646728515625, -0.489990234375, -0.3153076171875, -0.140625, 0.0340576171875, 0.208740234375, 0.3834228515625, 0.55810546875, 0.7327880859375, 0.907470703125, 1.0821533203125, 1.2568359375, 1.4315185546875, 1.606201171875, 1.7808837890625, 1.95556640625, 2.1302490234375, 2.304931640625, 2.4796142578125, 2.654296875, 2.8289794921875, 3.003662109375, 3.1783447265625, 3.35302734375, 3.5277099609375, 3.702392578125, 3.8770751953125, 4.0517578125, 4.2264404296875, 4.401123046875, 4.5758056640625, 4.75048828125, 4.9251708984375, 5.099853515625, 5.2745361328125, 5.44921875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 8.0, 5.0, 10.0, 17.0, 18.0, 30.0, 53.0, 84.0, 117.0, 185.0, 285.0, 455.0, 714.0, 1226.0, 2090.0, 3491.0, 6248.0, 10836.0, 20642.0, 42554.0, 99086.0, 237029.0, 318347.0, 168468.0, 68909.0, 31374.0, 15621.0, 8630.0, 4859.0, 2903.0, 1661.0, 938.0, 579.0, 377.0, 235.0, 140.0, 85.0, 72.0, 52.0, 22.0, 26.0, 23.0, 15.0, 9.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-7.59765625, -7.38238525390625, -7.1671142578125, -6.95184326171875, -6.736572265625, -6.52130126953125, -6.3060302734375, -6.09075927734375, -5.87548828125, -5.66021728515625, -5.4449462890625, -5.22967529296875, -5.014404296875, -4.79913330078125, -4.5838623046875, -4.36859130859375, -4.1533203125, -3.93804931640625, -3.7227783203125, -3.50750732421875, -3.292236328125, -3.07696533203125, -2.8616943359375, -2.64642333984375, -2.43115234375, -2.21588134765625, -2.0006103515625, -1.78533935546875, -1.570068359375, -1.35479736328125, -1.1395263671875, -0.92425537109375, -0.708984375, -0.49371337890625, -0.2784423828125, -0.06317138671875, 0.152099609375, 0.36737060546875, 0.5826416015625, 0.79791259765625, 1.01318359375, 1.22845458984375, 1.4437255859375, 1.65899658203125, 1.874267578125, 2.08953857421875, 2.3048095703125, 2.52008056640625, 2.7353515625, 2.95062255859375, 3.1658935546875, 3.38116455078125, 3.596435546875, 3.81170654296875, 4.0269775390625, 4.24224853515625, 4.45751953125, 4.67279052734375, 4.8880615234375, 5.10333251953125, 5.318603515625, 5.53387451171875, 5.7491455078125, 5.96441650390625, 6.1796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 8.0, 4.0, 10.0, 7.0, 13.0, 14.0, 19.0, 10.0, 21.0, 21.0, 18.0, 26.0, 19.0, 21.0, 32.0, 41.0, 40.0, 72.0, 80.0, 134.0, 262.0, 1386.0, 222.0, 116.0, 81.0, 59.0, 28.0, 42.0, 32.0, 29.0, 20.0, 17.0, 22.0, 24.0, 18.0, 15.0, 7.0, 8.0, 10.0, 10.0, 2.0, 6.0, 5.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-19.09375, -18.520751953125, -17.94775390625, -17.374755859375, -16.8017578125, -16.228759765625, -15.65576171875, -15.082763671875, -14.509765625, -13.936767578125, -13.36376953125, -12.790771484375, -12.2177734375, -11.644775390625, -11.07177734375, -10.498779296875, -9.92578125, -9.352783203125, -8.77978515625, -8.206787109375, -7.6337890625, -7.060791015625, -6.48779296875, -5.914794921875, -5.341796875, -4.768798828125, -4.19580078125, -3.622802734375, -3.0498046875, -2.476806640625, -1.90380859375, -1.330810546875, -0.7578125, -0.184814453125, 0.38818359375, 0.961181640625, 1.5341796875, 2.107177734375, 2.68017578125, 3.253173828125, 3.826171875, 4.399169921875, 4.97216796875, 5.545166015625, 6.1181640625, 6.691162109375, 7.26416015625, 7.837158203125, 8.41015625, 8.983154296875, 9.55615234375, 10.129150390625, 10.7021484375, 11.275146484375, 11.84814453125, 12.421142578125, 12.994140625, 13.567138671875, 14.14013671875, 14.713134765625, 15.2861328125, 15.859130859375, 16.43212890625, 17.005126953125, 17.578125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 9.0, 2.0, 3.0, 6.0, 4.0, 13.0, 10.0, 15.0, 11.0, 18.0, 22.0, 27.0, 36.0, 31.0, 46.0, 69.0, 107.0, 121.0, 201.0, 300.0, 727.0, 2171.0, 16888.0, 445208.0, 2593132.0, 77916.0, 6076.0, 1167.0, 457.0, 224.0, 155.0, 114.0, 82.0, 60.0, 58.0, 36.0, 39.0, 32.0, 22.0, 12.0, 8.0, 17.0, 10.0, 11.0, 5.0, 5.0, 9.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0], "bins": [-32.15625, -31.159912109375, -30.16357421875, -29.167236328125, -28.1708984375, -27.174560546875, -26.17822265625, -25.181884765625, -24.185546875, -23.189208984375, -22.19287109375, -21.196533203125, -20.2001953125, -19.203857421875, -18.20751953125, -17.211181640625, -16.21484375, -15.218505859375, -14.22216796875, -13.225830078125, -12.2294921875, -11.233154296875, -10.23681640625, -9.240478515625, -8.244140625, -7.247802734375, -6.25146484375, -5.255126953125, -4.2587890625, -3.262451171875, -2.26611328125, -1.269775390625, -0.2734375, 0.722900390625, 1.71923828125, 2.715576171875, 3.7119140625, 4.708251953125, 5.70458984375, 6.700927734375, 7.697265625, 8.693603515625, 9.68994140625, 10.686279296875, 11.6826171875, 12.678955078125, 13.67529296875, 14.671630859375, 15.66796875, 16.664306640625, 17.66064453125, 18.656982421875, 19.6533203125, 20.649658203125, 21.64599609375, 22.642333984375, 23.638671875, 24.635009765625, 25.63134765625, 26.627685546875, 27.6240234375, 28.620361328125, 29.61669921875, 30.613037109375, 31.609375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 145.0, 833.0, 37.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.55602264404297, -27.90342903137207, -16.250835418701172, -4.598243713378906, 7.054351806640625, 18.706947326660156, 30.359535217285156, 42.01213073730469, 53.66472625732422, 65.31732177734375, 76.96990966796875, 88.62250518798828, 100.27510070800781, 111.92769622802734, 123.58028411865234, 135.23287963867188, 146.88546752929688, 158.53805541992188, 170.19065856933594, 181.84324645996094, 193.495849609375, 205.1484375, 216.801025390625, 228.45361328125, 240.10623168945312, 251.75881958007812, 263.4114074707031, 275.06402587890625, 286.71661376953125, 298.36920166015625, 310.02178955078125, 321.67437744140625, 333.32696533203125, 344.97955322265625, 356.63214111328125, 368.28472900390625, 379.9373474121094, 391.5899353027344, 403.2425231933594, 414.8951110839844, 426.5477294921875, 438.2003173828125, 449.8529052734375, 461.5054931640625, 473.1581115722656, 484.8106994628906, 496.4632873535156, 508.1158752441406, 519.7684326171875, 531.4210205078125, 543.0736083984375, 554.7261962890625, 566.3787841796875, 578.0313720703125, 589.6839599609375, 601.3366088867188, 612.9891967773438, 624.6417846679688, 636.2943725585938, 647.9469604492188, 659.5995483398438, 671.252197265625, 682.90478515625, 694.557373046875, 706.2099609375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 9.0, 6.0, 9.0, 7.0, 11.0, 15.0, 10.0, 20.0, 23.0, 32.0, 23.0, 47.0, 53.0, 44.0, 38.0, 55.0, 47.0, 36.0, 43.0, 46.0, 45.0, 46.0, 40.0, 31.0, 35.0, 26.0, 35.0, 26.0, 26.0, 21.0, 20.0, 17.0, 9.0, 15.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.60420227050781, -45.8996696472168, -44.19514083862305, -42.49060821533203, -40.78607940673828, -39.081546783447266, -37.37701416015625, -35.6724853515625, -33.96795654296875, -32.263423919677734, -30.558895111083984, -28.85436248779297, -27.14983367919922, -25.445301055908203, -23.74077033996582, -22.036239624023438, -20.331707000732422, -18.62717628479004, -16.922645568847656, -15.218113899230957, -13.513583183288574, -11.809052467346191, -10.104520797729492, -8.39999008178711, -6.695459365844727, -4.990928649902344, -3.2863974571228027, -1.5818662643432617, 0.1226644515991211, 1.827195167541504, 3.531726837158203, 5.236257553100586, 6.940792083740234, 8.645322799682617, 10.349853515625, 12.0543851852417, 13.758915901184082, 15.463446617126465, 17.167978286743164, 18.872509002685547, 20.57703971862793, 22.281570434570312, 23.986101150512695, 25.690631866455078, 27.395164489746094, 29.099693298339844, 30.80422592163086, 32.508758544921875, 34.213287353515625, 35.91781997680664, 37.62234878540039, 39.326881408691406, 41.031410217285156, 42.73594284057617, 44.44047546386719, 46.14500427246094, 47.84953308105469, 49.5540657043457, 51.25859451293945, 52.96312713623047, 54.66765594482422, 56.372188568115234, 58.07672119140625, 59.78125, 61.485782623291016]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 7.0, 11.0, 8.0, 13.0, 17.0, 15.0, 17.0, 20.0, 21.0, 20.0, 25.0, 29.0, 31.0, 39.0, 47.0, 37.0, 30.0, 37.0, 37.0, 36.0, 37.0, 34.0, 55.0, 42.0, 40.0, 29.0, 26.0, 30.0, 28.0, 29.0, 23.0, 12.0, 12.0, 13.0, 17.0, 7.0, 11.0, 8.0, 10.0, 4.0, 4.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-5.32421875, -5.1605224609375, -4.996826171875, -4.8331298828125, -4.66943359375, -4.5057373046875, -4.342041015625, -4.1783447265625, -4.0146484375, -3.8509521484375, -3.687255859375, -3.5235595703125, -3.35986328125, -3.1961669921875, -3.032470703125, -2.8687744140625, -2.705078125, -2.5413818359375, -2.377685546875, -2.2139892578125, -2.05029296875, -1.8865966796875, -1.722900390625, -1.5592041015625, -1.3955078125, -1.2318115234375, -1.068115234375, -0.9044189453125, -0.74072265625, -0.5770263671875, -0.413330078125, -0.2496337890625, -0.0859375, 0.0777587890625, 0.241455078125, 0.4051513671875, 0.56884765625, 0.7325439453125, 0.896240234375, 1.0599365234375, 1.2236328125, 1.3873291015625, 1.551025390625, 1.7147216796875, 1.87841796875, 2.0421142578125, 2.205810546875, 2.3695068359375, 2.533203125, 2.6968994140625, 2.860595703125, 3.0242919921875, 3.18798828125, 3.3516845703125, 3.515380859375, 3.6790771484375, 3.8427734375, 4.0064697265625, 4.170166015625, 4.3338623046875, 4.49755859375, 4.6612548828125, 4.824951171875, 4.9886474609375, 5.15234375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 5.0, 8.0, 11.0, 12.0, 16.0, 22.0, 26.0, 28.0, 45.0, 82.0, 93.0, 213.0, 433.0, 889.0, 2336.0, 8600.0, 51839.0, 468238.0, 2563402.0, 975083.0, 102349.0, 14739.0, 3326.0, 1193.0, 528.0, 270.0, 145.0, 112.0, 54.0, 34.0, 25.0, 13.0, 20.0, 20.0, 15.0, 8.0, 7.0, 4.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.055419921875, -15.54833984375, -15.041259765625, -14.5341796875, -14.027099609375, -13.52001953125, -13.012939453125, -12.505859375, -11.998779296875, -11.49169921875, -10.984619140625, -10.4775390625, -9.970458984375, -9.46337890625, -8.956298828125, -8.44921875, -7.942138671875, -7.43505859375, -6.927978515625, -6.4208984375, -5.913818359375, -5.40673828125, -4.899658203125, -4.392578125, -3.885498046875, -3.37841796875, -2.871337890625, -2.3642578125, -1.857177734375, -1.35009765625, -0.843017578125, -0.3359375, 0.171142578125, 0.67822265625, 1.185302734375, 1.6923828125, 2.199462890625, 2.70654296875, 3.213623046875, 3.720703125, 4.227783203125, 4.73486328125, 5.241943359375, 5.7490234375, 6.256103515625, 6.76318359375, 7.270263671875, 7.77734375, 8.284423828125, 8.79150390625, 9.298583984375, 9.8056640625, 10.312744140625, 10.81982421875, 11.326904296875, 11.833984375, 12.341064453125, 12.84814453125, 13.355224609375, 13.8623046875, 14.369384765625, 14.87646484375, 15.383544921875, 15.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 14.0, 12.0, 14.0, 35.0, 40.0, 55.0, 89.0, 137.0, 173.0, 203.0, 314.0, 451.0, 468.0, 473.0, 399.0, 327.0, 268.0, 189.0, 123.0, 81.0, 61.0, 33.0, 33.0, 22.0, 12.0, 14.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.3546142578125, -14.888916015625, -14.4232177734375, -13.95751953125, -13.4918212890625, -13.026123046875, -12.5604248046875, -12.0947265625, -11.6290283203125, -11.163330078125, -10.6976318359375, -10.23193359375, -9.7662353515625, -9.300537109375, -8.8348388671875, -8.369140625, -7.9034423828125, -7.437744140625, -6.9720458984375, -6.50634765625, -6.0406494140625, -5.574951171875, -5.1092529296875, -4.6435546875, -4.1778564453125, -3.712158203125, -3.2464599609375, -2.78076171875, -2.3150634765625, -1.849365234375, -1.3836669921875, -0.91796875, -0.4522705078125, 0.013427734375, 0.4791259765625, 0.94482421875, 1.4105224609375, 1.876220703125, 2.3419189453125, 2.8076171875, 3.2733154296875, 3.739013671875, 4.2047119140625, 4.67041015625, 5.1361083984375, 5.601806640625, 6.0675048828125, 6.533203125, 6.9989013671875, 7.464599609375, 7.9302978515625, 8.39599609375, 8.8616943359375, 9.327392578125, 9.7930908203125, 10.2587890625, 10.7244873046875, 11.190185546875, 11.6558837890625, 12.12158203125, 12.5872802734375, 13.052978515625, 13.5186767578125, 13.984375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 18.0, 18.0, 6.0, 16.0, 24.0, 37.0, 51.0, 83.0, 121.0, 227.0, 424.0, 1201.0, 7004.0, 118922.0, 2639918.0, 1371740.0, 48992.0, 3868.0, 802.0, 329.0, 170.0, 102.0, 71.0, 44.0, 26.0, 21.0, 9.0, 15.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.76611328125, -30.6259765625, -29.48583984375, -28.345703125, -27.20556640625, -26.0654296875, -24.92529296875, -23.78515625, -22.64501953125, -21.5048828125, -20.36474609375, -19.224609375, -18.08447265625, -16.9443359375, -15.80419921875, -14.6640625, -13.52392578125, -12.3837890625, -11.24365234375, -10.103515625, -8.96337890625, -7.8232421875, -6.68310546875, -5.54296875, -4.40283203125, -3.2626953125, -2.12255859375, -0.982421875, 0.15771484375, 1.2978515625, 2.43798828125, 3.578125, 4.71826171875, 5.8583984375, 6.99853515625, 8.138671875, 9.27880859375, 10.4189453125, 11.55908203125, 12.69921875, 13.83935546875, 14.9794921875, 16.11962890625, 17.259765625, 18.39990234375, 19.5400390625, 20.68017578125, 21.8203125, 22.96044921875, 24.1005859375, 25.24072265625, 26.380859375, 27.52099609375, 28.6611328125, 29.80126953125, 30.94140625, 32.08154296875, 33.2216796875, 34.36181640625, 35.501953125, 36.64208984375, 37.7822265625, 38.92236328125, 40.0625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 9.0, 18.0, 39.0, 86.0, 143.0, 173.0, 186.0, 151.0, 105.0, 65.0, 27.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-91.1556625366211, -87.20409393310547, -83.25251770019531, -79.30094909667969, -75.34938049316406, -71.3978042602539, -67.44623565673828, -63.49466323852539, -59.5430908203125, -55.59151840209961, -51.63994598388672, -47.688377380371094, -43.7368049621582, -39.78523254394531, -35.83366394042969, -31.882091522216797, -27.930519104003906, -23.978946685791016, -20.027376174926758, -16.0758056640625, -12.12423324584961, -8.172660827636719, -4.221090316772461, -0.2695198059082031, 3.6820526123046875, 7.633624076843262, 11.585195541381836, 15.53676700592041, 19.488338470458984, 23.439910888671875, 27.391481399536133, 31.34305191040039, 35.29461669921875, 39.24618911743164, 43.19776153564453, 47.149330139160156, 51.10090255737305, 55.05247497558594, 59.00404357910156, 62.95561599731445, 66.90718841552734, 70.85875701904297, 74.81033325195312, 78.76190185546875, 82.71347045898438, 86.66504669189453, 90.61661529541016, 94.56819152832031, 98.51976013183594, 102.47132873535156, 106.42290496826172, 110.37447357177734, 114.3260498046875, 118.27761840820312, 122.22918701171875, 126.18075561523438, 130.13232421875, 134.08389282226562, 138.03546142578125, 141.98704528808594, 145.93861389160156, 149.8901824951172, 153.8417510986328, 157.79331970214844, 161.74490356445312]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 8.0, 6.0, 8.0, 25.0, 16.0, 25.0, 19.0, 21.0, 27.0, 26.0, 42.0, 26.0, 31.0, 30.0, 28.0, 41.0, 36.0, 35.0, 45.0, 38.0, 35.0, 37.0, 37.0, 40.0, 33.0, 34.0, 37.0, 25.0, 16.0, 22.0, 19.0, 17.0, 14.0, 15.0, 11.0, 11.0, 4.0, 6.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.70191192626953, -37.41788101196289, -36.133846282958984, -34.849815368652344, -33.56578063964844, -32.2817497253418, -30.997716903686523, -29.71368408203125, -28.429651260375977, -27.145618438720703, -25.86158561706543, -24.577552795410156, -23.293521881103516, -22.00948715209961, -20.72545623779297, -19.441423416137695, -18.157390594482422, -16.87335777282715, -15.589324951171875, -14.305293083190918, -13.021260261535645, -11.737227439880371, -10.453195571899414, -9.16916275024414, -7.885129928588867, -6.601097106933594, -5.3170647621154785, -4.033032417297363, -2.74899959564209, -1.4649667739868164, -0.18093442916870117, 1.103097915649414, 2.387126922607422, 3.671159505844116, 4.9551920890808105, 6.239224433898926, 7.523257255554199, 8.807290077209473, 10.09132194519043, 11.375354766845703, 12.659387588500977, 13.94342041015625, 15.227453231811523, 16.511486053466797, 17.795516967773438, 19.079551696777344, 20.363582611083984, 21.647615432739258, 22.93164825439453, 24.215681076049805, 25.499713897705078, 26.78374671936035, 28.067779541015625, 29.351810455322266, 30.63584327697754, 31.919876098632812, 33.20391082763672, 34.48794174194336, 35.771976470947266, 37.056007385253906, 38.34004211425781, 39.62407302856445, 40.90810775756836, 42.192138671875, 43.47616958618164]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 2.0, 11.0, 3.0, 13.0, 13.0, 16.0, 15.0, 21.0, 22.0, 37.0, 26.0, 30.0, 41.0, 35.0, 53.0, 53.0, 58.0, 44.0, 35.0, 52.0, 39.0, 44.0, 37.0, 36.0, 42.0, 40.0, 36.0, 28.0, 26.0, 21.0, 8.0, 18.0, 10.0, 8.0, 8.0, 1.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.1314697265625, -5.934814453125, -5.7381591796875, -5.54150390625, -5.3448486328125, -5.148193359375, -4.9515380859375, -4.7548828125, -4.5582275390625, -4.361572265625, -4.1649169921875, -3.96826171875, -3.7716064453125, -3.574951171875, -3.3782958984375, -3.181640625, -2.9849853515625, -2.788330078125, -2.5916748046875, -2.39501953125, -2.1983642578125, -2.001708984375, -1.8050537109375, -1.6083984375, -1.4117431640625, -1.215087890625, -1.0184326171875, -0.82177734375, -0.6251220703125, -0.428466796875, -0.2318115234375, -0.03515625, 0.1614990234375, 0.358154296875, 0.5548095703125, 0.75146484375, 0.9481201171875, 1.144775390625, 1.3414306640625, 1.5380859375, 1.7347412109375, 1.931396484375, 2.1280517578125, 2.32470703125, 2.5213623046875, 2.718017578125, 2.9146728515625, 3.111328125, 3.3079833984375, 3.504638671875, 3.7012939453125, 3.89794921875, 4.0946044921875, 4.291259765625, 4.4879150390625, 4.6845703125, 4.8812255859375, 5.077880859375, 5.2745361328125, 5.47119140625, 5.6678466796875, 5.864501953125, 6.0611572265625, 6.2578125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 2.0, 6.0, 8.0, 24.0, 27.0, 45.0, 69.0, 98.0, 159.0, 233.0, 465.0, 753.0, 1315.0, 2172.0, 3842.0, 6434.0, 11103.0, 18598.0, 30804.0, 48455.0, 73931.0, 104002.0, 133026.0, 149012.0, 138109.0, 110469.0, 79155.0, 52800.0, 33645.0, 20554.0, 12232.0, 7119.0, 4147.0, 2291.0, 1379.0, 792.0, 502.0, 289.0, 185.0, 122.0, 66.0, 43.0, 28.0, 15.0, 11.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4775390625, -1.4322052001953125, -1.386871337890625, -1.3415374755859375, -1.29620361328125, -1.2508697509765625, -1.205535888671875, -1.1602020263671875, -1.1148681640625, -1.0695343017578125, -1.024200439453125, -0.9788665771484375, -0.93353271484375, -0.8881988525390625, -0.842864990234375, -0.7975311279296875, -0.752197265625, -0.7068634033203125, -0.661529541015625, -0.6161956787109375, -0.57086181640625, -0.5255279541015625, -0.480194091796875, -0.4348602294921875, -0.3895263671875, -0.3441925048828125, -0.298858642578125, -0.2535247802734375, -0.20819091796875, -0.1628570556640625, -0.117523193359375, -0.0721893310546875, -0.02685546875, 0.0184783935546875, 0.063812255859375, 0.1091461181640625, 0.15447998046875, 0.1998138427734375, 0.245147705078125, 0.2904815673828125, 0.3358154296875, 0.3811492919921875, 0.426483154296875, 0.4718170166015625, 0.51715087890625, 0.5624847412109375, 0.607818603515625, 0.6531524658203125, 0.698486328125, 0.7438201904296875, 0.789154052734375, 0.8344879150390625, 0.87982177734375, 0.9251556396484375, 0.970489501953125, 1.0158233642578125, 1.0611572265625, 1.1064910888671875, 1.151824951171875, 1.1971588134765625, 1.24249267578125, 1.2878265380859375, 1.333160400390625, 1.3784942626953125, 1.423828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 6.0, 1.0, 6.0, 11.0, 7.0, 11.0, 13.0, 20.0, 28.0, 16.0, 24.0, 23.0, 21.0, 25.0, 38.0, 27.0, 32.0, 42.0, 39.0, 32.0, 45.0, 1067.0, 38.0, 35.0, 34.0, 34.0, 31.0, 36.0, 38.0, 31.0, 33.0, 22.0, 28.0, 23.0, 13.0, 19.0, 11.0, 13.0, 11.0, 12.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.04296875, -3.91436767578125, -3.7857666015625, -3.65716552734375, -3.528564453125, -3.39996337890625, -3.2713623046875, -3.14276123046875, -3.01416015625, -2.88555908203125, -2.7569580078125, -2.62835693359375, -2.499755859375, -2.37115478515625, -2.2425537109375, -2.11395263671875, -1.9853515625, -1.85675048828125, -1.7281494140625, -1.59954833984375, -1.470947265625, -1.34234619140625, -1.2137451171875, -1.08514404296875, -0.95654296875, -0.82794189453125, -0.6993408203125, -0.57073974609375, -0.442138671875, -0.31353759765625, -0.1849365234375, -0.05633544921875, 0.072265625, 0.20086669921875, 0.3294677734375, 0.45806884765625, 0.586669921875, 0.71527099609375, 0.8438720703125, 0.97247314453125, 1.10107421875, 1.22967529296875, 1.3582763671875, 1.48687744140625, 1.615478515625, 1.74407958984375, 1.8726806640625, 2.00128173828125, 2.1298828125, 2.25848388671875, 2.3870849609375, 2.51568603515625, 2.644287109375, 2.77288818359375, 2.9014892578125, 3.03009033203125, 3.15869140625, 3.28729248046875, 3.4158935546875, 3.54449462890625, 3.673095703125, 3.80169677734375, 3.9302978515625, 4.05889892578125, 4.1875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 9.0, 8.0, 14.0, 15.0, 19.0, 45.0, 68.0, 80.0, 136.0, 199.0, 341.0, 545.0, 807.0, 1216.0, 1997.0, 3047.0, 4742.0, 7321.0, 11693.0, 18847.0, 31698.0, 964567.0, 966988.0, 31508.0, 18721.0, 11777.0, 7424.0, 4754.0, 3098.0, 1958.0, 1233.0, 784.0, 524.0, 320.0, 221.0, 127.0, 102.0, 60.0, 35.0, 22.0, 23.0, 13.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.359375, -2.28564453125, -2.2119140625, -2.13818359375, -2.064453125, -1.99072265625, -1.9169921875, -1.84326171875, -1.76953125, -1.69580078125, -1.6220703125, -1.54833984375, -1.474609375, -1.40087890625, -1.3271484375, -1.25341796875, -1.1796875, -1.10595703125, -1.0322265625, -0.95849609375, -0.884765625, -0.81103515625, -0.7373046875, -0.66357421875, -0.58984375, -0.51611328125, -0.4423828125, -0.36865234375, -0.294921875, -0.22119140625, -0.1474609375, -0.07373046875, 0.0, 0.07373046875, 0.1474609375, 0.22119140625, 0.294921875, 0.36865234375, 0.4423828125, 0.51611328125, 0.58984375, 0.66357421875, 0.7373046875, 0.81103515625, 0.884765625, 0.95849609375, 1.0322265625, 1.10595703125, 1.1796875, 1.25341796875, 1.3271484375, 1.40087890625, 1.474609375, 1.54833984375, 1.6220703125, 1.69580078125, 1.76953125, 1.84326171875, 1.9169921875, 1.99072265625, 2.064453125, 2.13818359375, 2.2119140625, 2.28564453125, 2.359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 2.0, 14.0, 11.0, 9.0, 15.0, 16.0, 18.0, 35.0, 47.0, 43.0, 45.0, 48.0, 51.0, 79.0, 104.0, 78.0, 65.0, 53.0, 50.0, 34.0, 32.0, 26.0, 22.0, 16.0, 22.0, 8.0, 8.0, 6.0, 4.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.228759765625, -0.22230911254882812, -0.21585845947265625, -0.20940780639648438, -0.2029571533203125, -0.19650650024414062, -0.19005584716796875, -0.18360519409179688, -0.177154541015625, -0.17070388793945312, -0.16425323486328125, -0.15780258178710938, -0.1513519287109375, -0.14490127563476562, -0.13845062255859375, -0.13199996948242188, -0.12554931640625, -0.11909866333007812, -0.11264801025390625, -0.10619735717773438, -0.0997467041015625, -0.09329605102539062, -0.08684539794921875, -0.08039474487304688, -0.073944091796875, -0.06749343872070312, -0.06104278564453125, -0.054592132568359375, -0.0481414794921875, -0.041690826416015625, -0.03524017333984375, -0.028789520263671875, -0.0223388671875, -0.015888214111328125, -0.00943756103515625, -0.002986907958984375, 0.0034637451171875, 0.009914398193359375, 0.01636505126953125, 0.022815704345703125, 0.029266357421875, 0.035717010498046875, 0.04216766357421875, 0.048618316650390625, 0.0550689697265625, 0.061519622802734375, 0.06797027587890625, 0.07442092895507812, 0.08087158203125, 0.08732223510742188, 0.09377288818359375, 0.10022354125976562, 0.1066741943359375, 0.11312484741210938, 0.11957550048828125, 0.12602615356445312, 0.132476806640625, 0.13892745971679688, 0.14537811279296875, 0.15182876586914062, 0.1582794189453125, 0.16473007202148438, 0.17118072509765625, 0.17763137817382812, 0.18408203125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 5.0, 4.0, 6.0, 5.0, 12.0, 18.0, 18.0, 25.0, 38.0, 39.0, 65.0, 107.0, 175.0, 365.0, 1634.0, 1016122.0, 28566.0, 651.0, 243.0, 136.0, 77.0, 54.0, 42.0, 33.0, 20.0, 18.0, 14.0, 9.0, 10.0, 7.0, 7.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9921875, -3.85797119140625, -3.7237548828125, -3.58953857421875, -3.455322265625, -3.32110595703125, -3.1868896484375, -3.05267333984375, -2.91845703125, -2.78424072265625, -2.6500244140625, -2.51580810546875, -2.381591796875, -2.24737548828125, -2.1131591796875, -1.97894287109375, -1.8447265625, -1.71051025390625, -1.5762939453125, -1.44207763671875, -1.307861328125, -1.17364501953125, -1.0394287109375, -0.90521240234375, -0.77099609375, -0.63677978515625, -0.5025634765625, -0.36834716796875, -0.234130859375, -0.09991455078125, 0.0343017578125, 0.16851806640625, 0.302734375, 0.43695068359375, 0.5711669921875, 0.70538330078125, 0.839599609375, 0.97381591796875, 1.1080322265625, 1.24224853515625, 1.37646484375, 1.51068115234375, 1.6448974609375, 1.77911376953125, 1.913330078125, 2.04754638671875, 2.1817626953125, 2.31597900390625, 2.4501953125, 2.58441162109375, 2.7186279296875, 2.85284423828125, 2.987060546875, 3.12127685546875, 3.2554931640625, 3.38970947265625, 3.52392578125, 3.65814208984375, 3.7923583984375, 3.92657470703125, 4.060791015625, 4.19500732421875, 4.3292236328125, 4.46343994140625, 4.59765625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 279.0, 724.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.211994171142578, -11.012153625488281, -10.8123140335083, -10.612473487854004, -10.412632942199707, -10.212793350219727, -10.01295280456543, -9.813112258911133, -9.613272666931152, -9.413432121276855, -9.213592529296875, -9.013751983642578, -8.813911437988281, -8.6140718460083, -8.414231300354004, -8.214390754699707, -8.01455020904541, -7.8147101402282715, -7.614869594573975, -7.415029525756836, -7.215189456939697, -7.0153489112854, -6.815508842468262, -6.615668296813965, -6.415828704833984, -6.215988636016846, -6.016148090362549, -5.81630802154541, -5.6164679527282715, -5.416627407073975, -5.216787338256836, -5.016946792602539, -4.817106246948242, -4.6172661781311035, -4.417425632476807, -4.217585563659668, -4.017745494842529, -3.8179049491882324, -3.6180648803710938, -3.418224573135376, -3.2183847427368164, -3.0185444355010986, -2.81870436668396, -2.618864059448242, -2.4190237522125244, -2.2191834449768066, -2.019343376159668, -1.8195030689239502, -1.6196627616882324, -1.4198225736618042, -1.2199822664260864, -1.0201420783996582, -0.8203018307685852, -0.6204615831375122, -0.420621395111084, -0.2207810878753662, -0.02094089984893799, 0.17889933288097382, 0.3787395656108856, 0.5785797834396362, 0.7784200310707092, 0.9782602787017822, 1.1781004667282104, 1.3779407739639282, 1.5777809619903564]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 5.0, 11.0, 13.0, 6.0, 21.0, 9.0, 30.0, 28.0, 23.0, 26.0, 34.0, 31.0, 35.0, 46.0, 40.0, 42.0, 42.0, 45.0, 51.0, 45.0, 44.0, 46.0, 40.0, 28.0, 31.0, 21.0, 25.0, 31.0, 28.0, 14.0, 19.0, 18.0, 12.0, 16.0, 9.0, 6.0, 7.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7929999828338623, -0.7705682516098022, -0.748136579990387, -0.7257048487663269, -0.7032731175422668, -0.6808413863182068, -0.6584097146987915, -0.6359779834747314, -0.6135462522506714, -0.5911145210266113, -0.568682849407196, -0.546251118183136, -0.5238193869590759, -0.5013876557350159, -0.4789559841156006, -0.4565242528915405, -0.43409255146980286, -0.4116608500480652, -0.3892291188240051, -0.36679741740226746, -0.3443656861782074, -0.3219339847564697, -0.29950225353240967, -0.277070552110672, -0.2546388506889343, -0.23220713436603546, -0.2097754180431366, -0.18734371662139893, -0.16491198539733887, -0.1424802839756012, -0.12004856765270233, -0.09761685132980347, -0.07518512010574341, -0.05275340378284454, -0.030321691185235977, -0.007889978587627411, 0.014541737735271454, 0.03697345405817032, 0.059405162930488586, 0.08183687925338745, 0.10426859557628632, 0.12670031189918518, 0.14913202822208405, 0.1715637445449829, 0.19399544596672058, 0.21642717719078064, 0.2388588786125183, 0.26129060983657837, 0.28372231125831604, 0.3061540126800537, 0.32858574390411377, 0.35101744532585144, 0.3734491765499115, 0.39588087797164917, 0.41831260919570923, 0.4407443106174469, 0.46317601203918457, 0.48560771346092224, 0.5080394148826599, 0.53047114610672, 0.55290287733078, 0.5753346085548401, 0.5977662801742554, 0.6201980113983154, 0.6426297426223755]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 3.0, 6.0, 8.0, 8.0, 17.0, 16.0, 17.0, 26.0, 26.0, 30.0, 38.0, 46.0, 44.0, 56.0, 53.0, 49.0, 57.0, 58.0, 54.0, 48.0, 36.0, 53.0, 41.0, 45.0, 37.0, 27.0, 15.0, 20.0, 14.0, 16.0, 7.0, 3.0, 6.0, 6.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.286865234375, -6.06982421875, -5.852783203125, -5.6357421875, -5.418701171875, -5.20166015625, -4.984619140625, -4.767578125, -4.550537109375, -4.33349609375, -4.116455078125, -3.8994140625, -3.682373046875, -3.46533203125, -3.248291015625, -3.03125, -2.814208984375, -2.59716796875, -2.380126953125, -2.1630859375, -1.946044921875, -1.72900390625, -1.511962890625, -1.294921875, -1.077880859375, -0.86083984375, -0.643798828125, -0.4267578125, -0.209716796875, 0.00732421875, 0.224365234375, 0.44140625, 0.658447265625, 0.87548828125, 1.092529296875, 1.3095703125, 1.526611328125, 1.74365234375, 1.960693359375, 2.177734375, 2.394775390625, 2.61181640625, 2.828857421875, 3.0458984375, 3.262939453125, 3.47998046875, 3.697021484375, 3.9140625, 4.131103515625, 4.34814453125, 4.565185546875, 4.7822265625, 4.999267578125, 5.21630859375, 5.433349609375, 5.650390625, 5.867431640625, 6.08447265625, 6.301513671875, 6.5185546875, 6.735595703125, 6.95263671875, 7.169677734375, 7.38671875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 3.0, 9.0, 10.0, 13.0, 24.0, 26.0, 61.0, 79.0, 108.0, 170.0, 238.0, 394.0, 636.0, 1024.0, 1799.0, 2964.0, 4954.0, 8699.0, 15055.0, 25652.0, 46555.0, 100352.0, 248012.0, 311688.0, 143418.0, 60605.0, 31590.0, 18273.0, 10628.0, 6344.0, 3633.0, 2126.0, 1244.0, 745.0, 503.0, 303.0, 202.0, 140.0, 83.0, 65.0, 41.0, 30.0, 17.0, 10.0, 11.0, 4.0, 7.0, 4.0, 4.0, 0.0, 2.0], "bins": [-6.59375, -6.41156005859375, -6.2293701171875, -6.04718017578125, -5.864990234375, -5.68280029296875, -5.5006103515625, -5.31842041015625, -5.13623046875, -4.95404052734375, -4.7718505859375, -4.58966064453125, -4.407470703125, -4.22528076171875, -4.0430908203125, -3.86090087890625, -3.6787109375, -3.49652099609375, -3.3143310546875, -3.13214111328125, -2.949951171875, -2.76776123046875, -2.5855712890625, -2.40338134765625, -2.22119140625, -2.03900146484375, -1.8568115234375, -1.67462158203125, -1.492431640625, -1.31024169921875, -1.1280517578125, -0.94586181640625, -0.763671875, -0.58148193359375, -0.3992919921875, -0.21710205078125, -0.034912109375, 0.14727783203125, 0.3294677734375, 0.51165771484375, 0.69384765625, 0.87603759765625, 1.0582275390625, 1.24041748046875, 1.422607421875, 1.60479736328125, 1.7869873046875, 1.96917724609375, 2.1513671875, 2.33355712890625, 2.5157470703125, 2.69793701171875, 2.880126953125, 3.06231689453125, 3.2445068359375, 3.42669677734375, 3.60888671875, 3.79107666015625, 3.9732666015625, 4.15545654296875, 4.337646484375, 4.51983642578125, 4.7020263671875, 4.88421630859375, 5.06640625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 6.0, 8.0, 6.0, 10.0, 12.0, 10.0, 20.0, 17.0, 19.0, 19.0, 15.0, 27.0, 30.0, 29.0, 42.0, 41.0, 59.0, 82.0, 155.0, 311.0, 1412.0, 164.0, 116.0, 69.0, 57.0, 42.0, 42.0, 37.0, 23.0, 20.0, 21.0, 32.0, 15.0, 14.0, 12.0, 7.0, 11.0, 12.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.546875, -18.91748046875, -18.2880859375, -17.65869140625, -17.029296875, -16.39990234375, -15.7705078125, -15.14111328125, -14.51171875, -13.88232421875, -13.2529296875, -12.62353515625, -11.994140625, -11.36474609375, -10.7353515625, -10.10595703125, -9.4765625, -8.84716796875, -8.2177734375, -7.58837890625, -6.958984375, -6.32958984375, -5.7001953125, -5.07080078125, -4.44140625, -3.81201171875, -3.1826171875, -2.55322265625, -1.923828125, -1.29443359375, -0.6650390625, -0.03564453125, 0.59375, 1.22314453125, 1.8525390625, 2.48193359375, 3.111328125, 3.74072265625, 4.3701171875, 4.99951171875, 5.62890625, 6.25830078125, 6.8876953125, 7.51708984375, 8.146484375, 8.77587890625, 9.4052734375, 10.03466796875, 10.6640625, 11.29345703125, 11.9228515625, 12.55224609375, 13.181640625, 13.81103515625, 14.4404296875, 15.06982421875, 15.69921875, 16.32861328125, 16.9580078125, 17.58740234375, 18.216796875, 18.84619140625, 19.4755859375, 20.10498046875, 20.734375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 14.0, 7.0, 13.0, 12.0, 20.0, 28.0, 38.0, 41.0, 72.0, 105.0, 155.0, 281.0, 548.0, 1752.0, 28098.0, 2950704.0, 158607.0, 3514.0, 754.0, 359.0, 163.0, 122.0, 88.0, 66.0, 34.0, 30.0, 18.0, 13.0, 12.0, 5.0, 6.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.78125, -45.09130859375, -43.4013671875, -41.71142578125, -40.021484375, -38.33154296875, -36.6416015625, -34.95166015625, -33.26171875, -31.57177734375, -29.8818359375, -28.19189453125, -26.501953125, -24.81201171875, -23.1220703125, -21.43212890625, -19.7421875, -18.05224609375, -16.3623046875, -14.67236328125, -12.982421875, -11.29248046875, -9.6025390625, -7.91259765625, -6.22265625, -4.53271484375, -2.8427734375, -1.15283203125, 0.537109375, 2.22705078125, 3.9169921875, 5.60693359375, 7.296875, 8.98681640625, 10.6767578125, 12.36669921875, 14.056640625, 15.74658203125, 17.4365234375, 19.12646484375, 20.81640625, 22.50634765625, 24.1962890625, 25.88623046875, 27.576171875, 29.26611328125, 30.9560546875, 32.64599609375, 34.3359375, 36.02587890625, 37.7158203125, 39.40576171875, 41.095703125, 42.78564453125, 44.4755859375, 46.16552734375, 47.85546875, 49.54541015625, 51.2353515625, 52.92529296875, 54.615234375, 56.30517578125, 57.9951171875, 59.68505859375, 61.375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 21.0, 139.0, 427.0, 356.0, 68.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.315757751464844, -51.12123107910156, -45.92670822143555, -40.732181549072266, -35.53765869140625, -30.34313201904297, -25.148605346679688, -19.954082489013672, -14.75955581665039, -9.565031051635742, -4.370505332946777, 0.8240203857421875, 6.018545150756836, 11.213069915771484, 16.407596588134766, 21.60211944580078, 26.796646118164062, 31.99117088317871, 37.18569564819336, 42.38022232055664, 47.574745178222656, 52.76927185058594, 57.96379852294922, 63.158321380615234, 68.35284423828125, 73.54737091064453, 78.74189758300781, 83.93641662597656, 89.13094329833984, 94.32546997070312, 99.5199966430664, 104.71452331542969, 109.90904235839844, 115.10356903076172, 120.298095703125, 125.49261474609375, 130.68714904785156, 135.8816680908203, 141.07620239257812, 146.27072143554688, 151.46524047851562, 156.65975952148438, 161.8542938232422, 167.04881286621094, 172.24334716796875, 177.4378662109375, 182.63238525390625, 187.82691955566406, 193.02145385742188, 198.21597290039062, 203.41050720214844, 208.6050262451172, 213.799560546875, 218.99407958984375, 224.1885986328125, 229.3831329345703, 234.57765197753906, 239.7721710205078, 244.96670532226562, 250.16122436523438, 255.3557586669922, 260.55029296875, 265.74481201171875, 270.9393310546875, 276.13385009765625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 4.0, 5.0, 11.0, 15.0, 20.0, 17.0, 18.0, 19.0, 24.0, 17.0, 13.0, 19.0, 22.0, 29.0, 25.0, 43.0, 45.0, 27.0, 34.0, 39.0, 30.0, 28.0, 47.0, 42.0, 41.0, 33.0, 34.0, 24.0, 34.0, 31.0, 22.0, 29.0, 20.0, 22.0, 11.0, 15.0, 9.0, 21.0, 10.0, 6.0, 4.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.62106704711914, -48.974056243896484, -47.32704162597656, -45.680030822753906, -44.03302001953125, -42.386009216308594, -40.73899459838867, -39.091983795166016, -37.444969177246094, -35.79795837402344, -34.150943756103516, -32.50393295288086, -30.856922149658203, -29.209909439086914, -27.562896728515625, -25.91588592529297, -24.268875122070312, -22.621862411499023, -20.974851608276367, -19.327838897705078, -17.680828094482422, -16.033815383911133, -14.386802673339844, -12.739790916442871, -11.092779159545898, -9.445767402648926, -7.798755168914795, -6.151742935180664, -4.504731178283691, -2.8577194213867188, -1.2107067108154297, 0.43630504608154297, 2.08331298828125, 3.7303249835968018, 5.3773369789123535, 7.024349212646484, 8.671360969543457, 10.31837272644043, 11.965385437011719, 13.612397193908691, 15.259408950805664, 16.906421661376953, 18.55343246459961, 20.2004451751709, 21.847457885742188, 23.494468688964844, 25.141481399536133, 26.788494110107422, 28.435504913330078, 30.082517623901367, 31.729528427124023, 33.37654113769531, 35.02355194091797, 36.670562744140625, 38.31757736206055, 39.9645881652832, 41.611602783203125, 43.25861358642578, 44.9056282043457, 46.55263900756836, 48.199649810791016, 49.84666442871094, 51.493675231933594, 53.14068603515625, 54.787696838378906]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 9.0, 16.0, 24.0, 21.0, 17.0, 34.0, 35.0, 42.0, 44.0, 52.0, 54.0, 52.0, 55.0, 52.0, 47.0, 52.0, 48.0, 55.0, 39.0, 35.0, 35.0, 27.0, 33.0, 19.0, 15.0, 16.0, 9.0, 11.0, 6.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.1585693359375, -6.930419921875, -6.7022705078125, -6.47412109375, -6.2459716796875, -6.017822265625, -5.7896728515625, -5.5615234375, -5.3333740234375, -5.105224609375, -4.8770751953125, -4.64892578125, -4.4207763671875, -4.192626953125, -3.9644775390625, -3.736328125, -3.5081787109375, -3.280029296875, -3.0518798828125, -2.82373046875, -2.5955810546875, -2.367431640625, -2.1392822265625, -1.9111328125, -1.6829833984375, -1.454833984375, -1.2266845703125, -0.99853515625, -0.7703857421875, -0.542236328125, -0.3140869140625, -0.0859375, 0.1422119140625, 0.370361328125, 0.5985107421875, 0.82666015625, 1.0548095703125, 1.282958984375, 1.5111083984375, 1.7392578125, 1.9674072265625, 2.195556640625, 2.4237060546875, 2.65185546875, 2.8800048828125, 3.108154296875, 3.3363037109375, 3.564453125, 3.7926025390625, 4.020751953125, 4.2489013671875, 4.47705078125, 4.7052001953125, 4.933349609375, 5.1614990234375, 5.3896484375, 5.6177978515625, 5.845947265625, 6.0740966796875, 6.30224609375, 6.5303955078125, 6.758544921875, 6.9866943359375, 7.21484375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 10.0, 14.0, 15.0, 18.0, 22.0, 36.0, 48.0, 68.0, 101.0, 139.0, 220.0, 365.0, 533.0, 879.0, 1699.0, 3158.0, 7008.0, 16457.0, 42123.0, 112865.0, 315297.0, 809195.0, 1374295.0, 922466.0, 369026.0, 133683.0, 49042.0, 19103.0, 8175.0, 3686.0, 1867.0, 995.0, 586.0, 337.0, 235.0, 140.0, 115.0, 64.0, 47.0, 40.0, 25.0, 19.0, 18.0, 15.0, 9.0, 8.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.1640625, -6.9298095703125, -6.695556640625, -6.4613037109375, -6.22705078125, -5.9927978515625, -5.758544921875, -5.5242919921875, -5.2900390625, -5.0557861328125, -4.821533203125, -4.5872802734375, -4.35302734375, -4.1187744140625, -3.884521484375, -3.6502685546875, -3.416015625, -3.1817626953125, -2.947509765625, -2.7132568359375, -2.47900390625, -2.2447509765625, -2.010498046875, -1.7762451171875, -1.5419921875, -1.3077392578125, -1.073486328125, -0.8392333984375, -0.60498046875, -0.3707275390625, -0.136474609375, 0.0977783203125, 0.33203125, 0.5662841796875, 0.800537109375, 1.0347900390625, 1.26904296875, 1.5032958984375, 1.737548828125, 1.9718017578125, 2.2060546875, 2.4403076171875, 2.674560546875, 2.9088134765625, 3.14306640625, 3.3773193359375, 3.611572265625, 3.8458251953125, 4.080078125, 4.3143310546875, 4.548583984375, 4.7828369140625, 5.01708984375, 5.2513427734375, 5.485595703125, 5.7198486328125, 5.9541015625, 6.1883544921875, 6.422607421875, 6.6568603515625, 6.89111328125, 7.1253662109375, 7.359619140625, 7.5938720703125, 7.828125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 7.0, 5.0, 6.0, 10.0, 14.0, 23.0, 22.0, 27.0, 42.0, 63.0, 81.0, 107.0, 130.0, 157.0, 193.0, 275.0, 341.0, 333.0, 379.0, 373.0, 306.0, 279.0, 221.0, 182.0, 114.0, 90.0, 59.0, 55.0, 38.0, 29.0, 28.0, 21.0, 17.0, 13.0, 9.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.125, -11.751220703125, -11.37744140625, -11.003662109375, -10.6298828125, -10.256103515625, -9.88232421875, -9.508544921875, -9.134765625, -8.760986328125, -8.38720703125, -8.013427734375, -7.6396484375, -7.265869140625, -6.89208984375, -6.518310546875, -6.14453125, -5.770751953125, -5.39697265625, -5.023193359375, -4.6494140625, -4.275634765625, -3.90185546875, -3.528076171875, -3.154296875, -2.780517578125, -2.40673828125, -2.032958984375, -1.6591796875, -1.285400390625, -0.91162109375, -0.537841796875, -0.1640625, 0.209716796875, 0.58349609375, 0.957275390625, 1.3310546875, 1.704833984375, 2.07861328125, 2.452392578125, 2.826171875, 3.199951171875, 3.57373046875, 3.947509765625, 4.3212890625, 4.695068359375, 5.06884765625, 5.442626953125, 5.81640625, 6.190185546875, 6.56396484375, 6.937744140625, 7.3115234375, 7.685302734375, 8.05908203125, 8.432861328125, 8.806640625, 9.180419921875, 9.55419921875, 9.927978515625, 10.3017578125, 10.675537109375, 11.04931640625, 11.423095703125, 11.796875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 4.0, 11.0, 14.0, 15.0, 27.0, 30.0, 35.0, 45.0, 67.0, 81.0, 143.0, 284.0, 596.0, 1763.0, 6182.0, 30011.0, 194744.0, 1309078.0, 2153445.0, 421252.0, 60734.0, 11111.0, 2781.0, 881.0, 340.0, 202.0, 130.0, 89.0, 46.0, 29.0, 29.0, 21.0, 14.0, 3.0, 13.0, 6.0, 4.0, 7.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.609375, -19.94873046875, -19.2880859375, -18.62744140625, -17.966796875, -17.30615234375, -16.6455078125, -15.98486328125, -15.32421875, -14.66357421875, -14.0029296875, -13.34228515625, -12.681640625, -12.02099609375, -11.3603515625, -10.69970703125, -10.0390625, -9.37841796875, -8.7177734375, -8.05712890625, -7.396484375, -6.73583984375, -6.0751953125, -5.41455078125, -4.75390625, -4.09326171875, -3.4326171875, -2.77197265625, -2.111328125, -1.45068359375, -0.7900390625, -0.12939453125, 0.53125, 1.19189453125, 1.8525390625, 2.51318359375, 3.173828125, 3.83447265625, 4.4951171875, 5.15576171875, 5.81640625, 6.47705078125, 7.1376953125, 7.79833984375, 8.458984375, 9.11962890625, 9.7802734375, 10.44091796875, 11.1015625, 11.76220703125, 12.4228515625, 13.08349609375, 13.744140625, 14.40478515625, 15.0654296875, 15.72607421875, 16.38671875, 17.04736328125, 17.7080078125, 18.36865234375, 19.029296875, 19.68994140625, 20.3505859375, 21.01123046875, 21.671875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 8.0, 18.0, 41.0, 53.0, 71.0, 88.0, 116.0, 110.0, 124.0, 93.0, 94.0, 72.0, 45.0, 31.0, 16.0, 13.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.5863037109375, -92.93058013916016, -90.27485656738281, -87.61913299560547, -84.96340942382812, -82.30769348144531, -79.65196228027344, -76.99624633789062, -74.34052276611328, -71.68479919433594, -69.0290756225586, -66.37335205078125, -63.71763229370117, -61.06190872192383, -58.406185150146484, -55.750465393066406, -53.0947380065918, -50.43901443481445, -47.78329086303711, -45.12757110595703, -42.47184753417969, -39.816123962402344, -37.160400390625, -34.504676818847656, -31.848955154418945, -29.1932315826416, -26.53750991821289, -23.881786346435547, -21.226062774658203, -18.570341110229492, -15.914617538452148, -13.258895874023438, -10.603172302246094, -7.947449684143066, -5.291726589202881, -2.6360034942626953, 0.01971912384033203, 2.6754417419433594, 5.331165313720703, 7.986886978149414, 10.642610549926758, 13.298333168029785, 15.954055786132812, 18.609779357910156, 21.2655029296875, 23.92122459411621, 26.576948165893555, 29.232669830322266, 31.88839340209961, 34.54411697387695, 37.1998405456543, 39.855560302734375, 42.51128387451172, 45.16700744628906, 47.822731018066406, 50.47845458984375, 53.134178161621094, 55.78990173339844, 58.44562530517578, 61.101348876953125, 63.7570686340332, 66.41279602050781, 69.06851196289062, 71.72423553466797, 74.37995910644531]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 1.0, 5.0, 6.0, 4.0, 10.0, 11.0, 8.0, 15.0, 17.0, 20.0, 26.0, 24.0, 23.0, 28.0, 19.0, 34.0, 35.0, 25.0, 34.0, 40.0, 39.0, 31.0, 50.0, 34.0, 32.0, 38.0, 24.0, 37.0, 50.0, 27.0, 37.0, 24.0, 18.0, 25.0, 24.0, 16.0, 15.0, 16.0, 10.0, 12.0, 10.0, 11.0, 5.0, 6.0, 5.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0], "bins": [-42.36705017089844, -41.14271545410156, -39.91838455200195, -38.694053649902344, -37.46971893310547, -36.245384216308594, -35.021053314208984, -33.796722412109375, -32.5723876953125, -31.348054885864258, -30.123722076416016, -28.899389266967773, -27.67505645751953, -26.45072364807129, -25.226390838623047, -24.002058029174805, -22.777725219726562, -21.55339241027832, -20.329059600830078, -19.104726791381836, -17.880393981933594, -16.65606117248535, -15.43172836303711, -14.207395553588867, -12.983062744140625, -11.758729934692383, -10.53439712524414, -9.310064315795898, -8.085731506347656, -6.861398696899414, -5.637065887451172, -4.41273307800293, -3.188396453857422, -1.9640636444091797, -0.7397308349609375, 0.4846019744873047, 1.7089347839355469, 2.933267593383789, 4.157600402832031, 5.381933212280273, 6.606266021728516, 7.830598831176758, 9.054931640625, 10.279264450073242, 11.503597259521484, 12.727930068969727, 13.952262878417969, 15.176595687866211, 16.400928497314453, 17.625261306762695, 18.849594116210938, 20.07392692565918, 21.298259735107422, 22.522592544555664, 23.746925354003906, 24.97125816345215, 26.19559097290039, 27.419923782348633, 28.644256591796875, 29.868589401245117, 31.09292221069336, 32.31725311279297, 33.541587829589844, 34.76592254638672, 35.99025344848633]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 4.0, 9.0, 8.0, 5.0, 7.0, 9.0, 11.0, 23.0, 18.0, 20.0, 33.0, 26.0, 32.0, 27.0, 43.0, 47.0, 35.0, 44.0, 42.0, 46.0, 52.0, 49.0, 56.0, 44.0, 38.0, 25.0, 34.0, 36.0, 24.0, 24.0, 21.0, 23.0, 16.0, 15.0, 11.0, 7.0, 8.0, 8.0, 10.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.82421875, -6.6239013671875, -6.423583984375, -6.2232666015625, -6.02294921875, -5.8226318359375, -5.622314453125, -5.4219970703125, -5.2216796875, -5.0213623046875, -4.821044921875, -4.6207275390625, -4.42041015625, -4.2200927734375, -4.019775390625, -3.8194580078125, -3.619140625, -3.4188232421875, -3.218505859375, -3.0181884765625, -2.81787109375, -2.6175537109375, -2.417236328125, -2.2169189453125, -2.0166015625, -1.8162841796875, -1.615966796875, -1.4156494140625, -1.21533203125, -1.0150146484375, -0.814697265625, -0.6143798828125, -0.4140625, -0.2137451171875, -0.013427734375, 0.1868896484375, 0.38720703125, 0.5875244140625, 0.787841796875, 0.9881591796875, 1.1884765625, 1.3887939453125, 1.589111328125, 1.7894287109375, 1.98974609375, 2.1900634765625, 2.390380859375, 2.5906982421875, 2.791015625, 2.9913330078125, 3.191650390625, 3.3919677734375, 3.59228515625, 3.7926025390625, 3.992919921875, 4.1932373046875, 4.3935546875, 4.5938720703125, 4.794189453125, 4.9945068359375, 5.19482421875, 5.3951416015625, 5.595458984375, 5.7957763671875, 5.99609375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 20.0, 18.0, 26.0, 39.0, 83.0, 131.0, 207.0, 334.0, 606.0, 991.0, 1570.0, 2579.0, 4140.0, 6812.0, 10972.0, 17314.0, 27287.0, 41064.0, 59632.0, 82168.0, 104650.0, 121753.0, 128319.0, 116452.0, 97049.0, 73750.0, 52716.0, 35579.0, 23320.0, 15020.0, 9221.0, 5691.0, 3517.0, 2192.0, 1315.0, 804.0, 490.0, 315.0, 166.0, 89.0, 68.0, 36.0, 15.0, 8.0, 9.0, 7.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.280548095703125, -1.23687744140625, -1.193206787109375, -1.1495361328125, -1.105865478515625, -1.06219482421875, -1.018524169921875, -0.974853515625, -0.931182861328125, -0.88751220703125, -0.843841552734375, -0.8001708984375, -0.756500244140625, -0.71282958984375, -0.669158935546875, -0.62548828125, -0.581817626953125, -0.53814697265625, -0.494476318359375, -0.4508056640625, -0.407135009765625, -0.36346435546875, -0.319793701171875, -0.276123046875, -0.232452392578125, -0.18878173828125, -0.145111083984375, -0.1014404296875, -0.057769775390625, -0.01409912109375, 0.029571533203125, 0.0732421875, 0.116912841796875, 0.16058349609375, 0.204254150390625, 0.2479248046875, 0.291595458984375, 0.33526611328125, 0.378936767578125, 0.422607421875, 0.466278076171875, 0.50994873046875, 0.553619384765625, 0.5972900390625, 0.640960693359375, 0.68463134765625, 0.728302001953125, 0.77197265625, 0.815643310546875, 0.85931396484375, 0.902984619140625, 0.9466552734375, 0.990325927734375, 1.03399658203125, 1.077667236328125, 1.121337890625, 1.165008544921875, 1.20867919921875, 1.252349853515625, 1.2960205078125, 1.339691162109375, 1.38336181640625, 1.427032470703125, 1.470703125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 8.0, 5.0, 8.0, 10.0, 20.0, 11.0, 11.0, 30.0, 29.0, 25.0, 37.0, 33.0, 21.0, 29.0, 31.0, 37.0, 38.0, 43.0, 36.0, 1069.0, 48.0, 42.0, 50.0, 46.0, 27.0, 26.0, 26.0, 29.0, 33.0, 26.0, 24.0, 12.0, 17.0, 20.0, 16.0, 16.0, 9.0, 8.0, 3.0, 5.0, 3.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.31951904296875, -4.1624755859375, -4.00543212890625, -3.848388671875, -3.69134521484375, -3.5343017578125, -3.37725830078125, -3.22021484375, -3.06317138671875, -2.9061279296875, -2.74908447265625, -2.592041015625, -2.43499755859375, -2.2779541015625, -2.12091064453125, -1.9638671875, -1.80682373046875, -1.6497802734375, -1.49273681640625, -1.335693359375, -1.17864990234375, -1.0216064453125, -0.86456298828125, -0.70751953125, -0.55047607421875, -0.3934326171875, -0.23638916015625, -0.079345703125, 0.07769775390625, 0.2347412109375, 0.39178466796875, 0.548828125, 0.70587158203125, 0.8629150390625, 1.01995849609375, 1.177001953125, 1.33404541015625, 1.4910888671875, 1.64813232421875, 1.80517578125, 1.96221923828125, 2.1192626953125, 2.27630615234375, 2.433349609375, 2.59039306640625, 2.7474365234375, 2.90447998046875, 3.0615234375, 3.21856689453125, 3.3756103515625, 3.53265380859375, 3.689697265625, 3.84674072265625, 4.0037841796875, 4.16082763671875, 4.31787109375, 4.47491455078125, 4.6319580078125, 4.78900146484375, 4.946044921875, 5.10308837890625, 5.2601318359375, 5.41717529296875, 5.57421875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 11.0, 6.0, 17.0, 23.0, 48.0, 64.0, 92.0, 137.0, 214.0, 302.0, 437.0, 686.0, 973.0, 1506.0, 2267.0, 3549.0, 5095.0, 7807.0, 11430.0, 17602.0, 27890.0, 81128.0, 1841470.0, 33984.0, 20452.0, 13229.0, 9005.0, 5937.0, 3937.0, 2649.0, 1650.0, 1221.0, 765.0, 471.0, 332.0, 228.0, 160.0, 105.0, 74.0, 42.0, 35.0, 22.0, 18.0, 15.0, 13.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3671875, -2.291259765625, -2.21533203125, -2.139404296875, -2.0634765625, -1.987548828125, -1.91162109375, -1.835693359375, -1.759765625, -1.683837890625, -1.60791015625, -1.531982421875, -1.4560546875, -1.380126953125, -1.30419921875, -1.228271484375, -1.15234375, -1.076416015625, -1.00048828125, -0.924560546875, -0.8486328125, -0.772705078125, -0.69677734375, -0.620849609375, -0.544921875, -0.468994140625, -0.39306640625, -0.317138671875, -0.2412109375, -0.165283203125, -0.08935546875, -0.013427734375, 0.0625, 0.138427734375, 0.21435546875, 0.290283203125, 0.3662109375, 0.442138671875, 0.51806640625, 0.593994140625, 0.669921875, 0.745849609375, 0.82177734375, 0.897705078125, 0.9736328125, 1.049560546875, 1.12548828125, 1.201416015625, 1.27734375, 1.353271484375, 1.42919921875, 1.505126953125, 1.5810546875, 1.656982421875, 1.73291015625, 1.808837890625, 1.884765625, 1.960693359375, 2.03662109375, 2.112548828125, 2.1884765625, 2.264404296875, 2.34033203125, 2.416259765625, 2.4921875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 6.0, 7.0, 13.0, 7.0, 13.0, 18.0, 11.0, 23.0, 13.0, 25.0, 24.0, 37.0, 37.0, 40.0, 55.0, 54.0, 78.0, 75.0, 73.0, 48.0, 55.0, 30.0, 32.0, 29.0, 20.0, 23.0, 24.0, 19.0, 17.0, 13.0, 13.0, 15.0, 7.0, 11.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.0645303726196289, -0.06228828430175781, -0.06004619598388672, -0.057804107666015625, -0.05556201934814453, -0.05331993103027344, -0.051077842712402344, -0.04883575439453125, -0.046593666076660156, -0.04435157775878906, -0.04210948944091797, -0.039867401123046875, -0.03762531280517578, -0.03538322448730469, -0.033141136169433594, -0.0308990478515625, -0.028656959533691406, -0.026414871215820312, -0.02417278289794922, -0.021930694580078125, -0.01968860626220703, -0.017446517944335938, -0.015204429626464844, -0.01296234130859375, -0.010720252990722656, -0.008478164672851562, -0.006236076354980469, -0.003993988037109375, -0.0017518997192382812, 0.0004901885986328125, 0.0027322769165039062, 0.004974365234375, 0.007216453552246094, 0.009458541870117188, 0.011700630187988281, 0.013942718505859375, 0.01618480682373047, 0.018426895141601562, 0.020668983459472656, 0.02291107177734375, 0.025153160095214844, 0.027395248413085938, 0.02963733673095703, 0.031879425048828125, 0.03412151336669922, 0.03636360168457031, 0.038605690002441406, 0.0408477783203125, 0.043089866638183594, 0.04533195495605469, 0.04757404327392578, 0.049816131591796875, 0.05205821990966797, 0.05430030822753906, 0.056542396545410156, 0.05878448486328125, 0.061026573181152344, 0.06326866149902344, 0.06551074981689453, 0.06775283813476562, 0.06999492645263672, 0.07223701477050781, 0.0744791030883789, 0.07672119140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 9.0, 10.0, 8.0, 10.0, 10.0, 14.0, 15.0, 11.0, 14.0, 19.0, 24.0, 35.0, 40.0, 50.0, 82.0, 130.0, 274.0, 702.0, 9677.0, 910654.0, 123809.0, 1993.0, 421.0, 169.0, 104.0, 70.0, 39.0, 22.0, 18.0, 15.0, 25.0, 9.0, 11.0, 8.0, 8.0, 8.0, 11.0, 4.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4951171875, -1.449493408203125, -1.40386962890625, -1.358245849609375, -1.3126220703125, -1.266998291015625, -1.22137451171875, -1.175750732421875, -1.130126953125, -1.084503173828125, -1.03887939453125, -0.993255615234375, -0.9476318359375, -0.902008056640625, -0.85638427734375, -0.810760498046875, -0.76513671875, -0.719512939453125, -0.67388916015625, -0.628265380859375, -0.5826416015625, -0.537017822265625, -0.49139404296875, -0.445770263671875, -0.400146484375, -0.354522705078125, -0.30889892578125, -0.263275146484375, -0.2176513671875, -0.172027587890625, -0.12640380859375, -0.080780029296875, -0.03515625, 0.010467529296875, 0.05609130859375, 0.101715087890625, 0.1473388671875, 0.192962646484375, 0.23858642578125, 0.284210205078125, 0.329833984375, 0.375457763671875, 0.42108154296875, 0.466705322265625, 0.5123291015625, 0.557952880859375, 0.60357666015625, 0.649200439453125, 0.69482421875, 0.740447998046875, 0.78607177734375, 0.831695556640625, 0.8773193359375, 0.922943115234375, 0.96856689453125, 1.014190673828125, 1.059814453125, 1.105438232421875, 1.15106201171875, 1.196685791015625, 1.2423095703125, 1.287933349609375, 1.33355712890625, 1.379180908203125, 1.4248046875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 47.0, 447.0, 450.0, 47.0, 10.0, 4.0, 3.0, 0.0, 1.0], "bins": [-3.770216703414917, -3.7040605545043945, -3.637904405593872, -3.5717480182647705, -3.505591869354248, -3.4394357204437256, -3.373279571533203, -3.3071234226226807, -3.240967273712158, -3.1748111248016357, -3.1086549758911133, -3.0424985885620117, -2.9763424396514893, -2.910186290740967, -2.8440301418304443, -2.777873992919922, -2.7117176055908203, -2.645561456680298, -2.5794053077697754, -2.513248920440674, -2.4470927715301514, -2.380936622619629, -2.3147804737091064, -2.248624324798584, -2.1824679374694824, -2.11631178855896, -2.0501556396484375, -1.9839993715286255, -1.9178431034088135, -1.851686954498291, -1.7855308055877686, -1.719374656677246, -1.6532185077667236, -1.5870623588562012, -1.5209060907363892, -1.4547499418258667, -1.3885936737060547, -1.3224375247955322, -1.2562813758850098, -1.1901252269744873, -1.1239690780639648, -1.0578129291534424, -0.9916566610336304, -0.9255005121231079, -0.8593443036079407, -0.7931880950927734, -0.727031946182251, -0.6608757376670837, -0.5947194695472717, -0.5285632610321045, -0.46240708231925964, -0.3962509036064148, -0.33009469509124756, -0.2639384865760803, -0.19778230786323547, -0.13162612915039062, -0.06546992063522339, 0.0006862729787826538, 0.0668424665927887, 0.13299866020679474, 0.19915485382080078, 0.265311062335968, 0.33146724104881287, 0.3976234197616577, 0.46377962827682495]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 8.0, 9.0, 10.0, 15.0, 27.0, 16.0, 30.0, 37.0, 36.0, 38.0, 32.0, 34.0, 47.0, 41.0, 47.0, 49.0, 53.0, 45.0, 42.0, 45.0, 44.0, 41.0, 34.0, 27.0, 34.0, 34.0, 26.0, 19.0, 12.0, 20.0, 11.0, 6.0, 9.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.29440778493881226, -0.28588932752609253, -0.2773708701133728, -0.2688524127006531, -0.26033395528793335, -0.2518154978752136, -0.2432970255613327, -0.23477856814861298, -0.22626009583473206, -0.21774163842201233, -0.2092231810092926, -0.20070472359657288, -0.19218625128269196, -0.18366779386997223, -0.1751493364572525, -0.16663087904453278, -0.15811242163181305, -0.14959396421909332, -0.1410755068063736, -0.13255703449249268, -0.12403857707977295, -0.11552011966705322, -0.1070016622543335, -0.09848320484161377, -0.08996473997831345, -0.08144628256559372, -0.0729278177022934, -0.06440936028957367, -0.055890899151563644, -0.04737243801355362, -0.03885398060083389, -0.030335519462823868, -0.021817058324813843, -0.013298598118126392, -0.004780137911438942, 0.003738321363925934, 0.012256782501935959, 0.020775243639945984, 0.02929370105266571, 0.037812162190675735, 0.04633062332868576, 0.054849084466695786, 0.06336754560470581, 0.07188600301742554, 0.08040446043014526, 0.08892292529344559, 0.09744138270616531, 0.10595984756946564, 0.11447830498218536, 0.12299676239490509, 0.13151521980762482, 0.14003369212150574, 0.14855214953422546, 0.1570706069469452, 0.16558906435966492, 0.17410752177238464, 0.18262597918510437, 0.1911444365978241, 0.19966289401054382, 0.20818135142326355, 0.21669982373714447, 0.2252182811498642, 0.23373673856258392, 0.24225519597530365, 0.25077366828918457]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 7.0, 7.0, 6.0, 7.0, 13.0, 10.0, 16.0, 29.0, 29.0, 27.0, 27.0, 31.0, 41.0, 29.0, 38.0, 64.0, 56.0, 53.0, 65.0, 51.0, 34.0, 38.0, 50.0, 34.0, 36.0, 24.0, 32.0, 18.0, 16.0, 16.0, 23.0, 15.0, 9.0, 7.0, 12.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.72265625, -6.51373291015625, -6.3048095703125, -6.09588623046875, -5.886962890625, -5.67803955078125, -5.4691162109375, -5.26019287109375, -5.05126953125, -4.84234619140625, -4.6334228515625, -4.42449951171875, -4.215576171875, -4.00665283203125, -3.7977294921875, -3.58880615234375, -3.3798828125, -3.17095947265625, -2.9620361328125, -2.75311279296875, -2.544189453125, -2.33526611328125, -2.1263427734375, -1.91741943359375, -1.70849609375, -1.49957275390625, -1.2906494140625, -1.08172607421875, -0.872802734375, -0.66387939453125, -0.4549560546875, -0.24603271484375, -0.037109375, 0.17181396484375, 0.3807373046875, 0.58966064453125, 0.798583984375, 1.00750732421875, 1.2164306640625, 1.42535400390625, 1.63427734375, 1.84320068359375, 2.0521240234375, 2.26104736328125, 2.469970703125, 2.67889404296875, 2.8878173828125, 3.09674072265625, 3.3056640625, 3.51458740234375, 3.7235107421875, 3.93243408203125, 4.141357421875, 4.35028076171875, 4.5592041015625, 4.76812744140625, 4.97705078125, 5.18597412109375, 5.3948974609375, 5.60382080078125, 5.812744140625, 6.02166748046875, 6.2305908203125, 6.43951416015625, 6.6484375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 12.0, 9.0, 11.0, 21.0, 31.0, 43.0, 63.0, 84.0, 108.0, 129.0, 218.0, 266.0, 421.0, 601.0, 876.0, 1343.0, 2309.0, 3783.0, 6885.0, 12990.0, 24543.0, 47151.0, 88127.0, 157017.0, 241514.0, 201660.0, 119007.0, 64907.0, 33985.0, 17847.0, 9295.0, 5271.0, 2871.0, 1756.0, 1129.0, 664.0, 479.0, 307.0, 210.0, 169.0, 120.0, 80.0, 77.0, 45.0, 35.0, 28.0, 18.0, 7.0, 10.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.19140625, -5.99005126953125, -5.7886962890625, -5.58734130859375, -5.385986328125, -5.18463134765625, -4.9832763671875, -4.78192138671875, -4.58056640625, -4.37921142578125, -4.1778564453125, -3.97650146484375, -3.775146484375, -3.57379150390625, -3.3724365234375, -3.17108154296875, -2.9697265625, -2.76837158203125, -2.5670166015625, -2.36566162109375, -2.164306640625, -1.96295166015625, -1.7615966796875, -1.56024169921875, -1.35888671875, -1.15753173828125, -0.9561767578125, -0.75482177734375, -0.553466796875, -0.35211181640625, -0.1507568359375, 0.05059814453125, 0.251953125, 0.45330810546875, 0.6546630859375, 0.85601806640625, 1.057373046875, 1.25872802734375, 1.4600830078125, 1.66143798828125, 1.86279296875, 2.06414794921875, 2.2655029296875, 2.46685791015625, 2.668212890625, 2.86956787109375, 3.0709228515625, 3.27227783203125, 3.4736328125, 3.67498779296875, 3.8763427734375, 4.07769775390625, 4.279052734375, 4.48040771484375, 4.6817626953125, 4.88311767578125, 5.08447265625, 5.28582763671875, 5.4871826171875, 5.68853759765625, 5.889892578125, 6.09124755859375, 6.2926025390625, 6.49395751953125, 6.6953125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 8.0, 6.0, 6.0, 10.0, 10.0, 7.0, 24.0, 14.0, 23.0, 18.0, 28.0, 30.0, 37.0, 31.0, 48.0, 63.0, 87.0, 143.0, 201.0, 1351.0, 236.0, 140.0, 99.0, 65.0, 63.0, 43.0, 37.0, 34.0, 25.0, 17.0, 30.0, 21.0, 13.0, 12.0, 8.0, 8.0, 8.0, 8.0, 3.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.453125, -23.74560546875, -23.0380859375, -22.33056640625, -21.623046875, -20.91552734375, -20.2080078125, -19.50048828125, -18.79296875, -18.08544921875, -17.3779296875, -16.67041015625, -15.962890625, -15.25537109375, -14.5478515625, -13.84033203125, -13.1328125, -12.42529296875, -11.7177734375, -11.01025390625, -10.302734375, -9.59521484375, -8.8876953125, -8.18017578125, -7.47265625, -6.76513671875, -6.0576171875, -5.35009765625, -4.642578125, -3.93505859375, -3.2275390625, -2.52001953125, -1.8125, -1.10498046875, -0.3974609375, 0.31005859375, 1.017578125, 1.72509765625, 2.4326171875, 3.14013671875, 3.84765625, 4.55517578125, 5.2626953125, 5.97021484375, 6.677734375, 7.38525390625, 8.0927734375, 8.80029296875, 9.5078125, 10.21533203125, 10.9228515625, 11.63037109375, 12.337890625, 13.04541015625, 13.7529296875, 14.46044921875, 15.16796875, 15.87548828125, 16.5830078125, 17.29052734375, 17.998046875, 18.70556640625, 19.4130859375, 20.12060546875, 20.828125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 11.0, 7.0, 7.0, 10.0, 18.0, 18.0, 17.0, 37.0, 45.0, 61.0, 55.0, 100.0, 138.0, 179.0, 299.0, 459.0, 1158.0, 5464.0, 96899.0, 2768749.0, 259840.0, 8957.0, 1539.0, 558.0, 294.0, 209.0, 138.0, 100.0, 81.0, 49.0, 39.0, 27.0, 31.0, 25.0, 22.0, 17.0, 9.0, 11.0, 6.0, 3.0, 7.0, 2.0, 6.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.75, -43.3779296875, -42.005859375, -40.6337890625, -39.26171875, -37.8896484375, -36.517578125, -35.1455078125, -33.7734375, -32.4013671875, -31.029296875, -29.6572265625, -28.28515625, -26.9130859375, -25.541015625, -24.1689453125, -22.796875, -21.4248046875, -20.052734375, -18.6806640625, -17.30859375, -15.9365234375, -14.564453125, -13.1923828125, -11.8203125, -10.4482421875, -9.076171875, -7.7041015625, -6.33203125, -4.9599609375, -3.587890625, -2.2158203125, -0.84375, 0.5283203125, 1.900390625, 3.2724609375, 4.64453125, 6.0166015625, 7.388671875, 8.7607421875, 10.1328125, 11.5048828125, 12.876953125, 14.2490234375, 15.62109375, 16.9931640625, 18.365234375, 19.7373046875, 21.109375, 22.4814453125, 23.853515625, 25.2255859375, 26.59765625, 27.9697265625, 29.341796875, 30.7138671875, 32.0859375, 33.4580078125, 34.830078125, 36.2021484375, 37.57421875, 38.9462890625, 40.318359375, 41.6904296875, 43.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [6.0, 12.0, 27.0, 88.0, 161.0, 284.0, 240.0, 136.0, 48.0, 14.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.42997169494629, -19.379505157470703, -15.329038619995117, -11.278572082519531, -7.228105545043945, -3.1776390075683594, 0.8728275299072266, 4.9232940673828125, 8.973760604858398, 13.024227142333984, 17.07469367980957, 21.125160217285156, 25.175626754760742, 29.226093292236328, 33.27655792236328, 37.3270263671875, 41.37749481201172, 45.42796325683594, 49.47842788696289, 53.528892517089844, 57.57936096191406, 61.62982940673828, 65.6802978515625, 69.73075866699219, 73.7812271118164, 77.83169555664062, 81.88215637207031, 85.93262481689453, 89.98309326171875, 94.03356170654297, 98.08403015136719, 102.13449096679688, 106.18495178222656, 110.23542022705078, 114.285888671875, 118.33634948730469, 122.3868179321289, 126.43728637695312, 130.4877471923828, 134.53822326660156, 138.58868408203125, 142.63914489746094, 146.6896209716797, 150.74008178710938, 154.79055786132812, 158.8410186767578, 162.8914794921875, 166.94195556640625, 170.99241638183594, 175.04287719726562, 179.09335327148438, 183.14381408691406, 187.19427490234375, 191.2447509765625, 195.2952117919922, 199.34568786621094, 203.39614868164062, 207.4466094970703, 211.49708557128906, 215.54754638671875, 219.5980224609375, 223.6484832763672, 227.69894409179688, 231.74942016601562, 235.7998809814453]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 10.0, 7.0, 10.0, 17.0, 22.0, 13.0, 11.0, 28.0, 29.0, 22.0, 33.0, 37.0, 48.0, 51.0, 29.0, 52.0, 53.0, 38.0, 50.0, 47.0, 47.0, 51.0, 29.0, 40.0, 35.0, 29.0, 25.0, 24.0, 17.0, 20.0, 10.0, 11.0, 8.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.33655548095703, -68.28878784179688, -66.24102020263672, -64.19325256347656, -62.145484924316406, -60.09771728515625, -58.04994583129883, -56.00217819213867, -53.954410552978516, -51.90664291381836, -49.8588752746582, -47.81110763549805, -45.763336181640625, -43.71556854248047, -41.66780090332031, -39.620033264160156, -37.572265625, -35.524497985839844, -33.47673034667969, -31.4289608001709, -29.381193161010742, -27.333425521850586, -25.285655975341797, -23.23788833618164, -21.190120697021484, -19.142353057861328, -17.094585418701172, -15.046815872192383, -12.999048233032227, -10.95128059387207, -8.903512001037598, -6.855743408203125, -4.8079681396484375, -2.760200023651123, -0.7124319076538086, 1.3353362083435059, 3.3831043243408203, 5.430871963500977, 7.478640556335449, 9.526409149169922, 11.574176788330078, 13.621944427490234, 15.669713020324707, 17.71748161315918, 19.765249252319336, 21.813016891479492, 23.86078643798828, 25.908554077148438, 27.956321716308594, 30.00408935546875, 32.051856994628906, 34.09962463378906, 36.14739227294922, 38.195159912109375, 40.2429313659668, 42.29069900512695, 44.33846664428711, 46.386234283447266, 48.43400192260742, 50.48176956176758, 52.529541015625, 54.577308654785156, 56.62507629394531, 58.67284393310547, 60.720611572265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 3.0, 9.0, 8.0, 3.0, 14.0, 25.0, 21.0, 32.0, 26.0, 24.0, 36.0, 35.0, 46.0, 41.0, 52.0, 46.0, 56.0, 74.0, 49.0, 39.0, 45.0, 60.0, 35.0, 26.0, 30.0, 25.0, 31.0, 19.0, 20.0, 11.0, 8.0, 8.0, 8.0, 8.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.97265625, -7.7325439453125, -7.492431640625, -7.2523193359375, -7.01220703125, -6.7720947265625, -6.531982421875, -6.2918701171875, -6.0517578125, -5.8116455078125, -5.571533203125, -5.3314208984375, -5.09130859375, -4.8511962890625, -4.611083984375, -4.3709716796875, -4.130859375, -3.8907470703125, -3.650634765625, -3.4105224609375, -3.17041015625, -2.9302978515625, -2.690185546875, -2.4500732421875, -2.2099609375, -1.9698486328125, -1.729736328125, -1.4896240234375, -1.24951171875, -1.0093994140625, -0.769287109375, -0.5291748046875, -0.2890625, -0.0489501953125, 0.191162109375, 0.4312744140625, 0.67138671875, 0.9114990234375, 1.151611328125, 1.3917236328125, 1.6318359375, 1.8719482421875, 2.112060546875, 2.3521728515625, 2.59228515625, 2.8323974609375, 3.072509765625, 3.3126220703125, 3.552734375, 3.7928466796875, 4.032958984375, 4.2730712890625, 4.51318359375, 4.7532958984375, 4.993408203125, 5.2335205078125, 5.4736328125, 5.7137451171875, 5.953857421875, 6.1939697265625, 6.43408203125, 6.6741943359375, 6.914306640625, 7.1544189453125, 7.39453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 1.0, 5.0, 8.0, 11.0, 6.0, 14.0, 25.0, 27.0, 27.0, 14.0, 39.0, 80.0, 123.0, 233.0, 601.0, 2019.0, 10898.0, 138196.0, 2069301.0, 1845377.0, 115157.0, 9290.0, 1757.0, 522.0, 201.0, 118.0, 63.0, 45.0, 18.0, 19.0, 15.0, 20.0, 9.0, 10.0, 8.0, 11.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.09375, -22.371337890625, -21.64892578125, -20.926513671875, -20.2041015625, -19.481689453125, -18.75927734375, -18.036865234375, -17.314453125, -16.592041015625, -15.86962890625, -15.147216796875, -14.4248046875, -13.702392578125, -12.97998046875, -12.257568359375, -11.53515625, -10.812744140625, -10.09033203125, -9.367919921875, -8.6455078125, -7.923095703125, -7.20068359375, -6.478271484375, -5.755859375, -5.033447265625, -4.31103515625, -3.588623046875, -2.8662109375, -2.143798828125, -1.42138671875, -0.698974609375, 0.0234375, 0.745849609375, 1.46826171875, 2.190673828125, 2.9130859375, 3.635498046875, 4.35791015625, 5.080322265625, 5.802734375, 6.525146484375, 7.24755859375, 7.969970703125, 8.6923828125, 9.414794921875, 10.13720703125, 10.859619140625, 11.58203125, 12.304443359375, 13.02685546875, 13.749267578125, 14.4716796875, 15.194091796875, 15.91650390625, 16.638916015625, 17.361328125, 18.083740234375, 18.80615234375, 19.528564453125, 20.2509765625, 20.973388671875, 21.69580078125, 22.418212890625, 23.140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 11.0, 18.0, 24.0, 31.0, 48.0, 51.0, 91.0, 105.0, 160.0, 198.0, 274.0, 326.0, 409.0, 414.0, 408.0, 376.0, 267.0, 240.0, 150.0, 122.0, 104.0, 70.0, 46.0, 32.0, 24.0, 14.0, 18.0, 11.0, 9.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2734375, -12.82470703125, -12.3759765625, -11.92724609375, -11.478515625, -11.02978515625, -10.5810546875, -10.13232421875, -9.68359375, -9.23486328125, -8.7861328125, -8.33740234375, -7.888671875, -7.43994140625, -6.9912109375, -6.54248046875, -6.09375, -5.64501953125, -5.1962890625, -4.74755859375, -4.298828125, -3.85009765625, -3.4013671875, -2.95263671875, -2.50390625, -2.05517578125, -1.6064453125, -1.15771484375, -0.708984375, -0.26025390625, 0.1884765625, 0.63720703125, 1.0859375, 1.53466796875, 1.9833984375, 2.43212890625, 2.880859375, 3.32958984375, 3.7783203125, 4.22705078125, 4.67578125, 5.12451171875, 5.5732421875, 6.02197265625, 6.470703125, 6.91943359375, 7.3681640625, 7.81689453125, 8.265625, 8.71435546875, 9.1630859375, 9.61181640625, 10.060546875, 10.50927734375, 10.9580078125, 11.40673828125, 11.85546875, 12.30419921875, 12.7529296875, 13.20166015625, 13.650390625, 14.09912109375, 14.5478515625, 14.99658203125, 15.4453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 13.0, 17.0, 20.0, 17.0, 38.0, 44.0, 94.0, 113.0, 183.0, 282.0, 559.0, 1467.0, 7453.0, 74588.0, 1017644.0, 2712176.0, 347426.0, 26478.0, 3722.0, 939.0, 375.0, 216.0, 123.0, 85.0, 61.0, 35.0, 32.0, 20.0, 19.0, 6.0, 9.0, 6.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.25, -32.3583984375, -31.466796875, -30.5751953125, -29.68359375, -28.7919921875, -27.900390625, -27.0087890625, -26.1171875, -25.2255859375, -24.333984375, -23.4423828125, -22.55078125, -21.6591796875, -20.767578125, -19.8759765625, -18.984375, -18.0927734375, -17.201171875, -16.3095703125, -15.41796875, -14.5263671875, -13.634765625, -12.7431640625, -11.8515625, -10.9599609375, -10.068359375, -9.1767578125, -8.28515625, -7.3935546875, -6.501953125, -5.6103515625, -4.71875, -3.8271484375, -2.935546875, -2.0439453125, -1.15234375, -0.2607421875, 0.630859375, 1.5224609375, 2.4140625, 3.3056640625, 4.197265625, 5.0888671875, 5.98046875, 6.8720703125, 7.763671875, 8.6552734375, 9.546875, 10.4384765625, 11.330078125, 12.2216796875, 13.11328125, 14.0048828125, 14.896484375, 15.7880859375, 16.6796875, 17.5712890625, 18.462890625, 19.3544921875, 20.24609375, 21.1376953125, 22.029296875, 22.9208984375, 23.8125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 16.0, 38.0, 68.0, 88.0, 148.0, 166.0, 141.0, 132.0, 82.0, 65.0, 38.0, 15.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.7294464111328, -134.27561950683594, -130.82179260253906, -127.36796569824219, -123.91414642333984, -120.46031951904297, -117.0064926147461, -113.55266571044922, -110.09884643554688, -106.64501953125, -103.19119262695312, -99.73736572265625, -96.2835464477539, -92.82971954345703, -89.37589263916016, -85.92206573486328, -82.4682388305664, -79.01441192626953, -75.56058502197266, -72.10676574707031, -68.65293884277344, -65.19911193847656, -61.74528503417969, -58.29145812988281, -54.8376350402832, -51.38380813598633, -47.92998504638672, -44.476158142089844, -41.02233123779297, -37.56850814819336, -34.114681243896484, -30.660856246948242, -27.20702362060547, -23.753198623657227, -20.299373626708984, -16.84554672241211, -13.391721725463867, -9.937896728515625, -6.48406982421875, -3.030244827270508, 0.4235801696777344, 3.8774056434631348, 7.331231117248535, 10.785057067871094, 14.238882064819336, 17.692707061767578, 21.146533966064453, 24.600358963012695, 28.054183959960938, 31.50800895690918, 34.96183395385742, 38.4156608581543, 41.869483947753906, 45.32331085205078, 48.777137756347656, 52.23096466064453, 55.68478775024414, 59.138614654541016, 62.592437744140625, 66.0462646484375, 69.50009155273438, 72.95391845703125, 76.40774536132812, 79.86156463623047, 83.31539154052734]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 5.0, 3.0, 8.0, 5.0, 8.0, 5.0, 10.0, 10.0, 12.0, 10.0, 16.0, 15.0, 14.0, 13.0, 29.0, 24.0, 35.0, 20.0, 24.0, 36.0, 26.0, 27.0, 47.0, 42.0, 29.0, 29.0, 49.0, 40.0, 29.0, 37.0, 33.0, 36.0, 25.0, 28.0, 27.0, 23.0, 19.0, 22.0, 16.0, 17.0, 19.0, 14.0, 14.0, 8.0, 8.0, 11.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0], "bins": [-40.41389846801758, -39.182533264160156, -37.95116424560547, -36.71979522705078, -35.48843002319336, -34.25706481933594, -33.02569580078125, -31.794328689575195, -30.56296157836914, -29.331594467163086, -28.10022735595703, -26.868860244750977, -25.637493133544922, -24.406126022338867, -23.174758911132812, -21.943391799926758, -20.712024688720703, -19.48065757751465, -18.249290466308594, -17.01792335510254, -15.786556243896484, -14.55518913269043, -13.323822021484375, -12.09245491027832, -10.861087799072266, -9.629720687866211, -8.398353576660156, -7.166986465454102, -5.935619354248047, -4.704252243041992, -3.4728851318359375, -2.241518020629883, -1.0101509094238281, 0.22121620178222656, 1.4525833129882812, 2.683950424194336, 3.9153175354003906, 5.146684646606445, 6.3780517578125, 7.609418869018555, 8.84078598022461, 10.072153091430664, 11.303520202636719, 12.534887313842773, 13.766254425048828, 14.997621536254883, 16.228988647460938, 17.460355758666992, 18.691722869873047, 19.9230899810791, 21.154457092285156, 22.38582420349121, 23.617191314697266, 24.84855842590332, 26.079925537109375, 27.31129264831543, 28.542659759521484, 29.77402687072754, 31.005393981933594, 32.23676300048828, 33.4681282043457, 34.699493408203125, 35.93086242675781, 37.1622314453125, 38.39359664916992]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 10.0, 8.0, 10.0, 8.0, 14.0, 11.0, 20.0, 20.0, 19.0, 17.0, 21.0, 23.0, 51.0, 40.0, 45.0, 46.0, 41.0, 33.0, 49.0, 56.0, 49.0, 47.0, 54.0, 39.0, 31.0, 36.0, 30.0, 14.0, 23.0, 21.0, 23.0, 19.0, 13.0, 14.0, 11.0, 5.0, 11.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-7.31640625, -7.1080322265625, -6.899658203125, -6.6912841796875, -6.48291015625, -6.2745361328125, -6.066162109375, -5.8577880859375, -5.6494140625, -5.4410400390625, -5.232666015625, -5.0242919921875, -4.81591796875, -4.6075439453125, -4.399169921875, -4.1907958984375, -3.982421875, -3.7740478515625, -3.565673828125, -3.3572998046875, -3.14892578125, -2.9405517578125, -2.732177734375, -2.5238037109375, -2.3154296875, -2.1070556640625, -1.898681640625, -1.6903076171875, -1.48193359375, -1.2735595703125, -1.065185546875, -0.8568115234375, -0.6484375, -0.4400634765625, -0.231689453125, -0.0233154296875, 0.18505859375, 0.3934326171875, 0.601806640625, 0.8101806640625, 1.0185546875, 1.2269287109375, 1.435302734375, 1.6436767578125, 1.85205078125, 2.0604248046875, 2.268798828125, 2.4771728515625, 2.685546875, 2.8939208984375, 3.102294921875, 3.3106689453125, 3.51904296875, 3.7274169921875, 3.935791015625, 4.1441650390625, 4.3525390625, 4.5609130859375, 4.769287109375, 4.9776611328125, 5.18603515625, 5.3944091796875, 5.602783203125, 5.8111572265625, 6.01953125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 13.0, 14.0, 33.0, 50.0, 77.0, 101.0, 175.0, 267.0, 432.0, 723.0, 1137.0, 1771.0, 2843.0, 4680.0, 7234.0, 11528.0, 17822.0, 27610.0, 41340.0, 59732.0, 81843.0, 103700.0, 120561.0, 126607.0, 116247.0, 95360.0, 73497.0, 52108.0, 35810.0, 23775.0, 15278.0, 9771.0, 6094.0, 3776.0, 2420.0, 1565.0, 946.0, 567.0, 387.0, 243.0, 140.0, 96.0, 59.0, 45.0, 32.0, 12.0, 11.0, 8.0, 5.0, 4.0, 0.0, 4.0], "bins": [-1.595703125, -1.5505218505859375, -1.505340576171875, -1.4601593017578125, -1.41497802734375, -1.3697967529296875, -1.324615478515625, -1.2794342041015625, -1.2342529296875, -1.1890716552734375, -1.143890380859375, -1.0987091064453125, -1.05352783203125, -1.0083465576171875, -0.963165283203125, -0.9179840087890625, -0.872802734375, -0.8276214599609375, -0.782440185546875, -0.7372589111328125, -0.69207763671875, -0.6468963623046875, -0.601715087890625, -0.5565338134765625, -0.5113525390625, -0.4661712646484375, -0.420989990234375, -0.3758087158203125, -0.33062744140625, -0.2854461669921875, -0.240264892578125, -0.1950836181640625, -0.14990234375, -0.1047210693359375, -0.059539794921875, -0.0143585205078125, 0.03082275390625, 0.0760040283203125, 0.121185302734375, 0.1663665771484375, 0.2115478515625, 0.2567291259765625, 0.301910400390625, 0.3470916748046875, 0.39227294921875, 0.4374542236328125, 0.482635498046875, 0.5278167724609375, 0.572998046875, 0.6181793212890625, 0.663360595703125, 0.7085418701171875, 0.75372314453125, 0.7989044189453125, 0.844085693359375, 0.8892669677734375, 0.9344482421875, 0.9796295166015625, 1.024810791015625, 1.0699920654296875, 1.11517333984375, 1.1603546142578125, 1.205535888671875, 1.2507171630859375, 1.2958984375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 3.0, 10.0, 5.0, 11.0, 9.0, 9.0, 10.0, 18.0, 13.0, 18.0, 23.0, 28.0, 31.0, 32.0, 23.0, 34.0, 38.0, 45.0, 39.0, 33.0, 33.0, 1061.0, 44.0, 48.0, 39.0, 35.0, 27.0, 47.0, 34.0, 35.0, 35.0, 15.0, 17.0, 17.0, 21.0, 9.0, 12.0, 12.0, 6.0, 8.0, 9.0, 5.0, 8.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.8203125, -4.660400390625, -4.50048828125, -4.340576171875, -4.1806640625, -4.020751953125, -3.86083984375, -3.700927734375, -3.541015625, -3.381103515625, -3.22119140625, -3.061279296875, -2.9013671875, -2.741455078125, -2.58154296875, -2.421630859375, -2.26171875, -2.101806640625, -1.94189453125, -1.781982421875, -1.6220703125, -1.462158203125, -1.30224609375, -1.142333984375, -0.982421875, -0.822509765625, -0.66259765625, -0.502685546875, -0.3427734375, -0.182861328125, -0.02294921875, 0.136962890625, 0.296875, 0.456787109375, 0.61669921875, 0.776611328125, 0.9365234375, 1.096435546875, 1.25634765625, 1.416259765625, 1.576171875, 1.736083984375, 1.89599609375, 2.055908203125, 2.2158203125, 2.375732421875, 2.53564453125, 2.695556640625, 2.85546875, 3.015380859375, 3.17529296875, 3.335205078125, 3.4951171875, 3.655029296875, 3.81494140625, 3.974853515625, 4.134765625, 4.294677734375, 4.45458984375, 4.614501953125, 4.7744140625, 4.934326171875, 5.09423828125, 5.254150390625, 5.4140625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 12.0, 17.0, 22.0, 30.0, 30.0, 56.0, 86.0, 133.0, 148.0, 267.0, 393.0, 603.0, 966.0, 1445.0, 2254.0, 3477.0, 5245.0, 8242.0, 12781.0, 20017.0, 33494.0, 1831679.0, 97445.0, 28651.0, 17435.0, 11319.0, 7341.0, 4755.0, 3083.0, 1892.0, 1322.0, 817.0, 556.0, 383.0, 243.0, 161.0, 107.0, 78.0, 41.0, 34.0, 21.0, 19.0, 8.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.543731689453125, -2.45855712890625, -2.373382568359375, -2.2882080078125, -2.203033447265625, -2.11785888671875, -2.032684326171875, -1.947509765625, -1.862335205078125, -1.77716064453125, -1.691986083984375, -1.6068115234375, -1.521636962890625, -1.43646240234375, -1.351287841796875, -1.26611328125, -1.180938720703125, -1.09576416015625, -1.010589599609375, -0.9254150390625, -0.840240478515625, -0.75506591796875, -0.669891357421875, -0.584716796875, -0.499542236328125, -0.41436767578125, -0.329193115234375, -0.2440185546875, -0.158843994140625, -0.07366943359375, 0.011505126953125, 0.0966796875, 0.181854248046875, 0.26702880859375, 0.352203369140625, 0.4373779296875, 0.522552490234375, 0.60772705078125, 0.692901611328125, 0.778076171875, 0.863250732421875, 0.94842529296875, 1.033599853515625, 1.1187744140625, 1.203948974609375, 1.28912353515625, 1.374298095703125, 1.45947265625, 1.544647216796875, 1.62982177734375, 1.714996337890625, 1.8001708984375, 1.885345458984375, 1.97052001953125, 2.055694580078125, 2.140869140625, 2.226043701171875, 2.31121826171875, 2.396392822265625, 2.4815673828125, 2.566741943359375, 2.65191650390625, 2.737091064453125, 2.822265625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 10.0, 16.0, 19.0, 28.0, 36.0, 46.0, 50.0, 50.0, 63.0, 89.0, 103.0, 97.0, 74.0, 63.0, 61.0, 43.0, 23.0, 26.0, 21.0, 15.0, 16.0, 14.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1024169921875, -0.0991973876953125, -0.095977783203125, -0.0927581787109375, -0.08953857421875, -0.0863189697265625, -0.083099365234375, -0.0798797607421875, -0.07666015625, -0.0734405517578125, -0.070220947265625, -0.0670013427734375, -0.06378173828125, -0.0605621337890625, -0.057342529296875, -0.0541229248046875, -0.0509033203125, -0.0476837158203125, -0.044464111328125, -0.0412445068359375, -0.03802490234375, -0.0348052978515625, -0.031585693359375, -0.0283660888671875, -0.025146484375, -0.0219268798828125, -0.018707275390625, -0.0154876708984375, -0.01226806640625, -0.0090484619140625, -0.005828857421875, -0.0026092529296875, 0.0006103515625, 0.0038299560546875, 0.007049560546875, 0.0102691650390625, 0.01348876953125, 0.0167083740234375, 0.019927978515625, 0.0231475830078125, 0.0263671875, 0.0295867919921875, 0.032806396484375, 0.0360260009765625, 0.03924560546875, 0.0424652099609375, 0.045684814453125, 0.0489044189453125, 0.0521240234375, 0.0553436279296875, 0.058563232421875, 0.0617828369140625, 0.06500244140625, 0.0682220458984375, 0.071441650390625, 0.0746612548828125, 0.077880859375, 0.0811004638671875, 0.084320068359375, 0.0875396728515625, 0.09075927734375, 0.0939788818359375, 0.097198486328125, 0.1004180908203125, 0.1036376953125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 12.0, 6.0, 19.0, 17.0, 18.0, 27.0, 32.0, 51.0, 96.0, 173.0, 358.0, 2061.0, 241402.0, 799811.0, 3512.0, 470.0, 159.0, 102.0, 72.0, 49.0, 30.0, 24.0, 16.0, 13.0, 9.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.14202880859375, -2.0731201171875, -2.00421142578125, -1.935302734375, -1.86639404296875, -1.7974853515625, -1.72857666015625, -1.65966796875, -1.59075927734375, -1.5218505859375, -1.45294189453125, -1.384033203125, -1.31512451171875, -1.2462158203125, -1.17730712890625, -1.1083984375, -1.03948974609375, -0.9705810546875, -0.90167236328125, -0.832763671875, -0.76385498046875, -0.6949462890625, -0.62603759765625, -0.55712890625, -0.48822021484375, -0.4193115234375, -0.35040283203125, -0.281494140625, -0.21258544921875, -0.1436767578125, -0.07476806640625, -0.005859375, 0.06304931640625, 0.1319580078125, 0.20086669921875, 0.269775390625, 0.33868408203125, 0.4075927734375, 0.47650146484375, 0.54541015625, 0.61431884765625, 0.6832275390625, 0.75213623046875, 0.821044921875, 0.88995361328125, 0.9588623046875, 1.02777099609375, 1.0966796875, 1.16558837890625, 1.2344970703125, 1.30340576171875, 1.372314453125, 1.44122314453125, 1.5101318359375, 1.57904052734375, 1.64794921875, 1.71685791015625, 1.7857666015625, 1.85467529296875, 1.923583984375, 1.99249267578125, 2.0614013671875, 2.13031005859375, 2.19921875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 18.0, 26.0, 37.0, 89.0, 193.0, 308.0, 170.0, 85.0, 42.0, 14.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0422015190124512, -1.0175701379776, -0.992938756942749, -0.9683074355125427, -0.9436760544776917, -0.9190446734428406, -0.8944133520126343, -0.8697819709777832, -0.8451505899429321, -0.820519208908081, -0.79588782787323, -0.7712565064430237, -0.7466251254081726, -0.7219937443733215, -0.6973624229431152, -0.6727310419082642, -0.6480996608734131, -0.623468279838562, -0.5988368988037109, -0.5742055773735046, -0.5495741963386536, -0.5249428153038025, -0.5003114938735962, -0.4756801128387451, -0.45104873180389404, -0.42641735076904297, -0.4017859995365143, -0.3771546483039856, -0.3525232672691345, -0.32789188623428345, -0.30326053500175476, -0.2786291837692261, -0.2539978623390198, -0.2293664962053299, -0.20473513007164001, -0.18010376393795013, -0.15547239780426025, -0.13084103167057037, -0.1062096655368805, -0.08157829940319061, -0.05694693326950073, -0.03231556713581085, -0.007684201002120972, 0.01694716513156891, 0.04157853126525879, 0.06620989739894867, 0.09084126353263855, 0.11547262966632843, 0.1401039958000183, 0.1647353619337082, 0.18936672806739807, 0.21399809420108795, 0.23862946033477783, 0.2632608413696289, 0.2878921926021576, 0.3125235438346863, 0.33715492486953735, 0.3617863059043884, 0.3864176571369171, 0.4110490083694458, 0.4356803894042969, 0.46031177043914795, 0.48494312167167664, 0.5095744729042053, 0.5342058539390564]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 3.0, 9.0, 8.0, 10.0, 16.0, 22.0, 32.0, 14.0, 28.0, 40.0, 39.0, 48.0, 35.0, 51.0, 48.0, 52.0, 65.0, 45.0, 47.0, 45.0, 32.0, 45.0, 44.0, 37.0, 25.0, 29.0, 23.0, 23.0, 19.0, 18.0, 16.0, 11.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10857278108596802, -0.10550890862941742, -0.10244503617286682, -0.09938116371631622, -0.09631729125976562, -0.09325342625379562, -0.09018955379724503, -0.08712568134069443, -0.08406180888414383, -0.08099793642759323, -0.07793406397104263, -0.07487019151449203, -0.07180632650852203, -0.06874245405197144, -0.06567858159542084, -0.06261470913887024, -0.05955083668231964, -0.05648696422576904, -0.053423091769218445, -0.050359223037958145, -0.04729535058140755, -0.04423147812485695, -0.04116760939359665, -0.03810373693704605, -0.03503986448049545, -0.031975992023944855, -0.028912121430039406, -0.025848250836133957, -0.02278437837958336, -0.01972050592303276, -0.01665663532912731, -0.013592764735221863, -0.010528892278671265, -0.007465020753443241, -0.004401149228215218, -0.001337277702987194, 0.0017265938222408295, 0.004790465347468853, 0.007854336872696877, 0.010918207466602325, 0.013982079923152924, 0.01704595237970352, 0.02010982297360897, 0.02317369356751442, 0.026237566024065018, 0.029301438480615616, 0.032365307211875916, 0.035429179668426514, 0.03849305212497711, 0.04155692458152771, 0.04462079703807831, 0.04768466576933861, 0.050748538225889206, 0.053812410682439804, 0.056876279413700104, 0.0599401518702507, 0.0630040243268013, 0.0660678967833519, 0.0691317692399025, 0.0721956416964531, 0.0752595067024231, 0.0783233791589737, 0.08138725161552429, 0.08445112407207489, 0.08751499652862549]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 10.0, 7.0, 13.0, 16.0, 14.0, 18.0, 15.0, 23.0, 34.0, 33.0, 30.0, 33.0, 40.0, 34.0, 52.0, 39.0, 47.0, 51.0, 52.0, 38.0, 43.0, 37.0, 42.0, 31.0, 36.0, 31.0, 23.0, 19.0, 14.0, 20.0, 19.0, 16.0, 11.0, 5.0, 8.0, 8.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.5234375, -6.3206787109375, -6.117919921875, -5.9151611328125, -5.71240234375, -5.5096435546875, -5.306884765625, -5.1041259765625, -4.9013671875, -4.6986083984375, -4.495849609375, -4.2930908203125, -4.09033203125, -3.8875732421875, -3.684814453125, -3.4820556640625, -3.279296875, -3.0765380859375, -2.873779296875, -2.6710205078125, -2.46826171875, -2.2655029296875, -2.062744140625, -1.8599853515625, -1.6572265625, -1.4544677734375, -1.251708984375, -1.0489501953125, -0.84619140625, -0.6434326171875, -0.440673828125, -0.2379150390625, -0.03515625, 0.1676025390625, 0.370361328125, 0.5731201171875, 0.77587890625, 0.9786376953125, 1.181396484375, 1.3841552734375, 1.5869140625, 1.7896728515625, 1.992431640625, 2.1951904296875, 2.39794921875, 2.6007080078125, 2.803466796875, 3.0062255859375, 3.208984375, 3.4117431640625, 3.614501953125, 3.8172607421875, 4.02001953125, 4.2227783203125, 4.425537109375, 4.6282958984375, 4.8310546875, 5.0338134765625, 5.236572265625, 5.4393310546875, 5.64208984375, 5.8448486328125, 6.047607421875, 6.2503662109375, 6.453125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 5.0, 10.0, 6.0, 15.0, 24.0, 22.0, 43.0, 54.0, 95.0, 153.0, 277.0, 418.0, 710.0, 1336.0, 2274.0, 4109.0, 7314.0, 12637.0, 21930.0, 38000.0, 64379.0, 109765.0, 193162.0, 244518.0, 144681.0, 84560.0, 49591.0, 28952.0, 16937.0, 9613.0, 5713.0, 3111.0, 1726.0, 987.0, 551.0, 338.0, 199.0, 120.0, 74.0, 57.0, 30.0, 18.0, 8.0, 7.0, 10.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.07269287109375, -4.8992919921875, -4.72589111328125, -4.552490234375, -4.37908935546875, -4.2056884765625, -4.03228759765625, -3.85888671875, -3.68548583984375, -3.5120849609375, -3.33868408203125, -3.165283203125, -2.99188232421875, -2.8184814453125, -2.64508056640625, -2.4716796875, -2.29827880859375, -2.1248779296875, -1.95147705078125, -1.778076171875, -1.60467529296875, -1.4312744140625, -1.25787353515625, -1.08447265625, -0.91107177734375, -0.7376708984375, -0.56427001953125, -0.390869140625, -0.21746826171875, -0.0440673828125, 0.12933349609375, 0.302734375, 0.47613525390625, 0.6495361328125, 0.82293701171875, 0.996337890625, 1.16973876953125, 1.3431396484375, 1.51654052734375, 1.68994140625, 1.86334228515625, 2.0367431640625, 2.21014404296875, 2.383544921875, 2.55694580078125, 2.7303466796875, 2.90374755859375, 3.0771484375, 3.25054931640625, 3.4239501953125, 3.59735107421875, 3.770751953125, 3.94415283203125, 4.1175537109375, 4.29095458984375, 4.46435546875, 4.63775634765625, 4.8111572265625, 4.98455810546875, 5.157958984375, 5.33135986328125, 5.5047607421875, 5.67816162109375, 5.8515625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 11.0, 7.0, 20.0, 24.0, 11.0, 22.0, 19.0, 32.0, 35.0, 44.0, 50.0, 55.0, 55.0, 118.0, 211.0, 1420.0, 290.0, 160.0, 85.0, 61.0, 53.0, 34.0, 41.0, 22.0, 36.0, 32.0, 20.0, 18.0, 12.0, 7.0, 9.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.84375, -26.0712890625, -25.298828125, -24.5263671875, -23.75390625, -22.9814453125, -22.208984375, -21.4365234375, -20.6640625, -19.8916015625, -19.119140625, -18.3466796875, -17.57421875, -16.8017578125, -16.029296875, -15.2568359375, -14.484375, -13.7119140625, -12.939453125, -12.1669921875, -11.39453125, -10.6220703125, -9.849609375, -9.0771484375, -8.3046875, -7.5322265625, -6.759765625, -5.9873046875, -5.21484375, -4.4423828125, -3.669921875, -2.8974609375, -2.125, -1.3525390625, -0.580078125, 0.1923828125, 0.96484375, 1.7373046875, 2.509765625, 3.2822265625, 4.0546875, 4.8271484375, 5.599609375, 6.3720703125, 7.14453125, 7.9169921875, 8.689453125, 9.4619140625, 10.234375, 11.0068359375, 11.779296875, 12.5517578125, 13.32421875, 14.0966796875, 14.869140625, 15.6416015625, 16.4140625, 17.1865234375, 17.958984375, 18.7314453125, 19.50390625, 20.2763671875, 21.048828125, 21.8212890625, 22.59375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 4.0, 10.0, 8.0, 16.0, 14.0, 31.0, 36.0, 46.0, 58.0, 83.0, 104.0, 132.0, 225.0, 292.0, 625.0, 2270.0, 76733.0, 2954045.0, 106559.0, 2656.0, 678.0, 316.0, 192.0, 142.0, 93.0, 78.0, 52.0, 46.0, 42.0, 36.0, 25.0, 13.0, 15.0, 2.0, 6.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.40625, -46.87109375, -45.3359375, -43.80078125, -42.265625, -40.73046875, -39.1953125, -37.66015625, -36.125, -34.58984375, -33.0546875, -31.51953125, -29.984375, -28.44921875, -26.9140625, -25.37890625, -23.84375, -22.30859375, -20.7734375, -19.23828125, -17.703125, -16.16796875, -14.6328125, -13.09765625, -11.5625, -10.02734375, -8.4921875, -6.95703125, -5.421875, -3.88671875, -2.3515625, -0.81640625, 0.71875, 2.25390625, 3.7890625, 5.32421875, 6.859375, 8.39453125, 9.9296875, 11.46484375, 13.0, 14.53515625, 16.0703125, 17.60546875, 19.140625, 20.67578125, 22.2109375, 23.74609375, 25.28125, 26.81640625, 28.3515625, 29.88671875, 31.421875, 32.95703125, 34.4921875, 36.02734375, 37.5625, 39.09765625, 40.6328125, 42.16796875, 43.703125, 45.23828125, 46.7734375, 48.30859375, 49.84375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 29.0, 785.0, 203.0, 1.0], "bins": [-833.3871459960938, -819.8749389648438, -806.3626708984375, -792.8504638671875, -779.3382568359375, -765.8259887695312, -752.3137817382812, -738.8015747070312, -725.289306640625, -711.777099609375, -698.2648315429688, -684.7526245117188, -671.2404174804688, -657.7281494140625, -644.2159423828125, -630.7037353515625, -617.1915283203125, -603.6793212890625, -590.1670532226562, -576.6548461914062, -563.1426391601562, -549.63037109375, -536.1181640625, -522.60595703125, -509.09368896484375, -495.5814514160156, -482.0692443847656, -468.5570068359375, -455.0447692871094, -441.53253173828125, -428.02032470703125, -414.5080871582031, -400.995849609375, -387.4836120605469, -373.9714050292969, -360.45916748046875, -346.9469299316406, -333.4346923828125, -319.9224853515625, -306.4102478027344, -292.8980407714844, -279.38580322265625, -265.87359619140625, -252.36135864257812, -238.84912109375, -225.33689880371094, -211.82467651367188, -198.31243896484375, -184.80020141601562, -171.28797912597656, -157.77574157714844, -144.26351928710938, -130.75128173828125, -117.23905944824219, -103.72683715820312, -90.21460723876953, -76.70237731933594, -63.190147399902344, -49.677921295166016, -36.16569519042969, -22.653465270996094, -9.1412353515625, 4.3709869384765625, 17.883216857910156, 31.395444869995117]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 6.0, 14.0, 13.0, 20.0, 12.0, 29.0, 18.0, 34.0, 29.0, 28.0, 35.0, 38.0, 31.0, 32.0, 33.0, 50.0, 36.0, 28.0, 43.0, 41.0, 41.0, 39.0, 35.0, 37.0, 29.0, 29.0, 22.0, 24.0, 20.0, 24.0, 19.0, 17.0, 10.0, 12.0, 6.0, 11.0, 2.0, 7.0, 10.0, 9.0, 4.0, 6.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.7867431640625, -53.9520378112793, -52.11733627319336, -50.282630920410156, -48.44792556762695, -46.61322021484375, -44.77851867675781, -42.94381332397461, -41.109107971191406, -39.2744026184082, -37.439701080322266, -35.60499572753906, -33.77029037475586, -31.93558692932129, -30.10088348388672, -28.266178131103516, -26.431476593017578, -24.596773147583008, -22.762067794799805, -20.927364349365234, -19.09265899658203, -17.25795555114746, -15.42325210571289, -13.588547706604004, -11.753843307495117, -9.91913890838623, -8.084434509277344, -6.249731063842773, -4.415026664733887, -2.580322265625, -0.7456188201904297, 1.089085578918457, 2.9237937927246094, 4.758498191833496, 6.593202114105225, 8.427906036376953, 10.26261043548584, 12.097314834594727, 13.932018280029297, 15.766722679138184, 17.60142707824707, 19.43613052368164, 21.270835876464844, 23.105539321899414, 24.940242767333984, 26.774948120117188, 28.609651565551758, 30.444355010986328, 32.27906036376953, 34.113765716552734, 35.94846725463867, 37.783172607421875, 39.61787796020508, 41.45258331298828, 43.28728485107422, 45.12199020385742, 46.956695556640625, 48.79140090942383, 50.626102447509766, 52.46080780029297, 54.29551315307617, 56.130218505859375, 57.96492004394531, 59.799625396728516, 61.63432693481445]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 14.0, 8.0, 12.0, 13.0, 9.0, 15.0, 20.0, 26.0, 31.0, 33.0, 34.0, 43.0, 45.0, 45.0, 51.0, 53.0, 65.0, 56.0, 52.0, 48.0, 44.0, 38.0, 24.0, 28.0, 22.0, 36.0, 23.0, 19.0, 21.0, 11.0, 15.0, 13.0, 11.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.5546875, -9.30181884765625, -9.0489501953125, -8.79608154296875, -8.543212890625, -8.29034423828125, -8.0374755859375, -7.78460693359375, -7.53173828125, -7.27886962890625, -7.0260009765625, -6.77313232421875, -6.520263671875, -6.26739501953125, -6.0145263671875, -5.76165771484375, -5.5087890625, -5.25592041015625, -5.0030517578125, -4.75018310546875, -4.497314453125, -4.24444580078125, -3.9915771484375, -3.73870849609375, -3.48583984375, -3.23297119140625, -2.9801025390625, -2.72723388671875, -2.474365234375, -2.22149658203125, -1.9686279296875, -1.71575927734375, -1.462890625, -1.21002197265625, -0.9571533203125, -0.70428466796875, -0.451416015625, -0.19854736328125, 0.0543212890625, 0.30718994140625, 0.56005859375, 0.81292724609375, 1.0657958984375, 1.31866455078125, 1.571533203125, 1.82440185546875, 2.0772705078125, 2.33013916015625, 2.5830078125, 2.83587646484375, 3.0887451171875, 3.34161376953125, 3.594482421875, 3.84735107421875, 4.1002197265625, 4.35308837890625, 4.60595703125, 4.85882568359375, 5.1116943359375, 5.36456298828125, 5.617431640625, 5.87030029296875, 6.1231689453125, 6.37603759765625, 6.62890625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 10.0, 12.0, 17.0, 14.0, 15.0, 32.0, 40.0, 49.0, 80.0, 146.0, 420.0, 1047.0, 4100.0, 25296.0, 229364.0, 1728995.0, 1900679.0, 268018.0, 29243.0, 4569.0, 1218.0, 418.0, 162.0, 99.0, 54.0, 48.0, 29.0, 15.0, 15.0, 13.0, 17.0, 3.0, 8.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.884521484375, -19.30029296875, -18.716064453125, -18.1318359375, -17.547607421875, -16.96337890625, -16.379150390625, -15.794921875, -15.210693359375, -14.62646484375, -14.042236328125, -13.4580078125, -12.873779296875, -12.28955078125, -11.705322265625, -11.12109375, -10.536865234375, -9.95263671875, -9.368408203125, -8.7841796875, -8.199951171875, -7.61572265625, -7.031494140625, -6.447265625, -5.863037109375, -5.27880859375, -4.694580078125, -4.1103515625, -3.526123046875, -2.94189453125, -2.357666015625, -1.7734375, -1.189208984375, -0.60498046875, -0.020751953125, 0.5634765625, 1.147705078125, 1.73193359375, 2.316162109375, 2.900390625, 3.484619140625, 4.06884765625, 4.653076171875, 5.2373046875, 5.821533203125, 6.40576171875, 6.989990234375, 7.57421875, 8.158447265625, 8.74267578125, 9.326904296875, 9.9111328125, 10.495361328125, 11.07958984375, 11.663818359375, 12.248046875, 12.832275390625, 13.41650390625, 14.000732421875, 14.5849609375, 15.169189453125, 15.75341796875, 16.337646484375, 16.921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 1.0, 8.0, 7.0, 6.0, 14.0, 10.0, 17.0, 13.0, 23.0, 32.0, 22.0, 54.0, 75.0, 76.0, 95.0, 119.0, 158.0, 211.0, 228.0, 283.0, 315.0, 345.0, 317.0, 286.0, 289.0, 225.0, 178.0, 162.0, 105.0, 98.0, 68.0, 40.0, 39.0, 37.0, 24.0, 20.0, 22.0, 18.0, 10.0, 5.0, 0.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -11.0006103515625, -10.641845703125, -10.2830810546875, -9.92431640625, -9.5655517578125, -9.206787109375, -8.8480224609375, -8.4892578125, -8.1304931640625, -7.771728515625, -7.4129638671875, -7.05419921875, -6.6954345703125, -6.336669921875, -5.9779052734375, -5.619140625, -5.2603759765625, -4.901611328125, -4.5428466796875, -4.18408203125, -3.8253173828125, -3.466552734375, -3.1077880859375, -2.7490234375, -2.3902587890625, -2.031494140625, -1.6727294921875, -1.31396484375, -0.9552001953125, -0.596435546875, -0.2376708984375, 0.12109375, 0.4798583984375, 0.838623046875, 1.1973876953125, 1.55615234375, 1.9149169921875, 2.273681640625, 2.6324462890625, 2.9912109375, 3.3499755859375, 3.708740234375, 4.0675048828125, 4.42626953125, 4.7850341796875, 5.143798828125, 5.5025634765625, 5.861328125, 6.2200927734375, 6.578857421875, 6.9376220703125, 7.29638671875, 7.6551513671875, 8.013916015625, 8.3726806640625, 8.7314453125, 9.0902099609375, 9.448974609375, 9.8077392578125, 10.16650390625, 10.5252685546875, 10.884033203125, 11.2427978515625, 11.6015625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 2.0, 3.0, 3.0, 7.0, 17.0, 13.0, 26.0, 31.0, 27.0, 38.0, 36.0, 70.0, 97.0, 119.0, 192.0, 249.0, 417.0, 1236.0, 11987.0, 313888.0, 3245522.0, 595764.0, 21446.0, 1645.0, 463.0, 256.0, 183.0, 120.0, 76.0, 92.0, 61.0, 34.0, 28.0, 22.0, 21.0, 22.0, 13.0, 10.0, 10.0, 4.0, 10.0, 5.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.53125, -35.375, -34.21875, -33.0625, -31.90625, -30.75, -29.59375, -28.4375, -27.28125, -26.125, -24.96875, -23.8125, -22.65625, -21.5, -20.34375, -19.1875, -18.03125, -16.875, -15.71875, -14.5625, -13.40625, -12.25, -11.09375, -9.9375, -8.78125, -7.625, -6.46875, -5.3125, -4.15625, -3.0, -1.84375, -0.6875, 0.46875, 1.625, 2.78125, 3.9375, 5.09375, 6.25, 7.40625, 8.5625, 9.71875, 10.875, 12.03125, 13.1875, 14.34375, 15.5, 16.65625, 17.8125, 18.96875, 20.125, 21.28125, 22.4375, 23.59375, 24.75, 25.90625, 27.0625, 28.21875, 29.375, 30.53125, 31.6875, 32.84375, 34.0, 35.15625, 36.3125, 37.46875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 20.0, 60.0, 96.0, 184.0, 247.0, 200.0, 136.0, 52.0, 18.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.7595672607422, -233.38858032226562, -228.01760864257812, -222.64662170410156, -217.27565002441406, -211.9046630859375, -206.53369140625, -201.16270446777344, -195.79171752929688, -190.4207305908203, -185.0497589111328, -179.67877197265625, -174.30780029296875, -168.9368133544922, -163.56582641601562, -158.19485473632812, -152.82388305664062, -147.45289611816406, -142.08192443847656, -136.7109375, -131.3399658203125, -125.96897888183594, -120.5979995727539, -115.22702026367188, -109.85603332519531, -104.48505401611328, -99.11407470703125, -93.74308776855469, -88.37210845947266, -83.00112915039062, -77.6301498413086, -72.25917053222656, -66.88819122314453, -61.5172119140625, -56.1462287902832, -50.77524948120117, -45.404266357421875, -40.033287048339844, -34.66230773925781, -29.291324615478516, -23.920345306396484, -18.54936408996582, -13.178383827209473, -7.807403564453125, -2.436422348022461, 2.934558868408203, 8.305538177490234, 13.676521301269531, 19.047500610351562, 24.418481826782227, 29.78946304321289, 35.16044235229492, 40.53142547607422, 45.90240478515625, 51.27338409423828, 56.64436721801758, 62.01534652709961, 67.3863296508789, 72.75730895996094, 78.12828826904297, 83.499267578125, 88.87025451660156, 94.24122619628906, 99.61221313476562, 104.98319244384766]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 3.0, 6.0, 11.0, 13.0, 11.0, 10.0, 17.0, 22.0, 25.0, 26.0, 19.0, 23.0, 29.0, 38.0, 23.0, 24.0, 49.0, 38.0, 39.0, 46.0, 35.0, 42.0, 41.0, 41.0, 44.0, 39.0, 40.0, 26.0, 33.0, 21.0, 19.0, 26.0, 26.0, 15.0, 16.0, 11.0, 9.0, 5.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.995662689208984, -41.5419807434082, -40.08830261230469, -38.634620666503906, -37.180938720703125, -35.72726058959961, -34.27357864379883, -32.81990051269531, -31.36621856689453, -29.912538528442383, -28.4588565826416, -27.005176544189453, -25.551496505737305, -24.097816467285156, -22.644134521484375, -21.190454483032227, -19.736772537231445, -18.283092498779297, -16.829410552978516, -15.375730514526367, -13.922050476074219, -12.468369483947754, -11.014688491821289, -9.56100845336914, -8.107327461242676, -6.653646945953369, -5.1999664306640625, -3.7462854385375977, -2.292604923248291, -0.8389244079589844, 0.6147565841674805, 2.068436622619629, 3.5221176147460938, 4.9757981300354, 6.429478645324707, 7.883159637451172, 9.33683967590332, 10.790520668029785, 12.24420166015625, 13.697881698608398, 15.151562690734863, 16.605243682861328, 18.058923721313477, 19.512603759765625, 20.966285705566406, 22.419965744018555, 23.873645782470703, 25.327327728271484, 26.781007766723633, 28.23468780517578, 29.688369750976562, 31.14204978942871, 32.59572982788086, 34.04941177368164, 35.503089904785156, 36.95677185058594, 38.41045379638672, 39.8641357421875, 41.317813873291016, 42.7714958190918, 44.22517776489258, 45.678855895996094, 47.132537841796875, 48.586219787597656, 50.03989791870117]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 9.0, 9.0, 17.0, 16.0, 25.0, 24.0, 18.0, 17.0, 24.0, 30.0, 29.0, 28.0, 31.0, 41.0, 40.0, 30.0, 39.0, 44.0, 41.0, 52.0, 45.0, 29.0, 42.0, 36.0, 32.0, 28.0, 35.0, 18.0, 25.0, 19.0, 19.0, 20.0, 12.0, 17.0, 11.0, 8.0, 8.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5, -5.29217529296875, -5.0843505859375, -4.87652587890625, -4.668701171875, -4.46087646484375, -4.2530517578125, -4.04522705078125, -3.83740234375, -3.62957763671875, -3.4217529296875, -3.21392822265625, -3.006103515625, -2.79827880859375, -2.5904541015625, -2.38262939453125, -2.1748046875, -1.96697998046875, -1.7591552734375, -1.55133056640625, -1.343505859375, -1.13568115234375, -0.9278564453125, -0.72003173828125, -0.51220703125, -0.30438232421875, -0.0965576171875, 0.11126708984375, 0.319091796875, 0.52691650390625, 0.7347412109375, 0.94256591796875, 1.150390625, 1.35821533203125, 1.5660400390625, 1.77386474609375, 1.981689453125, 2.18951416015625, 2.3973388671875, 2.60516357421875, 2.81298828125, 3.02081298828125, 3.2286376953125, 3.43646240234375, 3.644287109375, 3.85211181640625, 4.0599365234375, 4.26776123046875, 4.4755859375, 4.68341064453125, 4.8912353515625, 5.09906005859375, 5.306884765625, 5.51470947265625, 5.7225341796875, 5.93035888671875, 6.13818359375, 6.34600830078125, 6.5538330078125, 6.76165771484375, 6.969482421875, 7.17730712890625, 7.3851318359375, 7.59295654296875, 7.80078125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 13.0, 17.0, 31.0, 37.0, 67.0, 112.0, 172.0, 219.0, 399.0, 720.0, 983.0, 1671.0, 2770.0, 4450.0, 7293.0, 11828.0, 18599.0, 29126.0, 43975.0, 63734.0, 87480.0, 110746.0, 129059.0, 129731.0, 114781.0, 90950.0, 67856.0, 46967.0, 31624.0, 20226.0, 12626.0, 7798.0, 4703.0, 2900.0, 1843.0, 1102.0, 724.0, 415.0, 291.0, 178.0, 122.0, 66.0, 49.0, 29.0, 21.0, 16.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3028106689453125, -1.260894775390625, -1.2189788818359375, -1.17706298828125, -1.1351470947265625, -1.093231201171875, -1.0513153076171875, -1.0093994140625, -0.9674835205078125, -0.925567626953125, -0.8836517333984375, -0.84173583984375, -0.7998199462890625, -0.757904052734375, -0.7159881591796875, -0.674072265625, -0.6321563720703125, -0.590240478515625, -0.5483245849609375, -0.50640869140625, -0.4644927978515625, -0.422576904296875, -0.3806610107421875, -0.3387451171875, -0.2968292236328125, -0.254913330078125, -0.2129974365234375, -0.17108154296875, -0.1291656494140625, -0.087249755859375, -0.0453338623046875, -0.00341796875, 0.0384979248046875, 0.080413818359375, 0.1223297119140625, 0.16424560546875, 0.2061614990234375, 0.248077392578125, 0.2899932861328125, 0.3319091796875, 0.3738250732421875, 0.415740966796875, 0.4576568603515625, 0.49957275390625, 0.5414886474609375, 0.583404541015625, 0.6253204345703125, 0.667236328125, 0.7091522216796875, 0.751068115234375, 0.7929840087890625, 0.83489990234375, 0.8768157958984375, 0.918731689453125, 0.9606475830078125, 1.0025634765625, 1.0444793701171875, 1.086395263671875, 1.1283111572265625, 1.17022705078125, 1.2121429443359375, 1.254058837890625, 1.2959747314453125, 1.337890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 12.0, 14.0, 11.0, 12.0, 17.0, 10.0, 21.0, 25.0, 20.0, 29.0, 28.0, 35.0, 43.0, 36.0, 38.0, 47.0, 46.0, 1071.0, 49.0, 51.0, 39.0, 51.0, 33.0, 38.0, 35.0, 26.0, 25.0, 24.0, 28.0, 22.0, 13.0, 15.0, 14.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.2091064453125, -5.015869140625, -4.8226318359375, -4.62939453125, -4.4361572265625, -4.242919921875, -4.0496826171875, -3.8564453125, -3.6632080078125, -3.469970703125, -3.2767333984375, -3.08349609375, -2.8902587890625, -2.697021484375, -2.5037841796875, -2.310546875, -2.1173095703125, -1.924072265625, -1.7308349609375, -1.53759765625, -1.3443603515625, -1.151123046875, -0.9578857421875, -0.7646484375, -0.5714111328125, -0.378173828125, -0.1849365234375, 0.00830078125, 0.2015380859375, 0.394775390625, 0.5880126953125, 0.78125, 0.9744873046875, 1.167724609375, 1.3609619140625, 1.55419921875, 1.7474365234375, 1.940673828125, 2.1339111328125, 2.3271484375, 2.5203857421875, 2.713623046875, 2.9068603515625, 3.10009765625, 3.2933349609375, 3.486572265625, 3.6798095703125, 3.873046875, 4.0662841796875, 4.259521484375, 4.4527587890625, 4.64599609375, 4.8392333984375, 5.032470703125, 5.2257080078125, 5.4189453125, 5.6121826171875, 5.805419921875, 5.9986572265625, 6.19189453125, 6.3851318359375, 6.578369140625, 6.7716064453125, 6.96484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 5.0, 8.0, 15.0, 16.0, 17.0, 46.0, 55.0, 72.0, 103.0, 191.0, 260.0, 392.0, 575.0, 939.0, 1416.0, 2091.0, 3198.0, 4941.0, 7538.0, 11745.0, 18466.0, 30538.0, 227191.0, 1701100.0, 31981.0, 19138.0, 12312.0, 7853.0, 5116.0, 3483.0, 2121.0, 1417.0, 930.0, 587.0, 434.0, 268.0, 194.0, 120.0, 72.0, 49.0, 42.0, 36.0, 19.0, 11.0, 7.0, 6.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.59765625, -2.5213623046875, -2.445068359375, -2.3687744140625, -2.29248046875, -2.2161865234375, -2.139892578125, -2.0635986328125, -1.9873046875, -1.9110107421875, -1.834716796875, -1.7584228515625, -1.68212890625, -1.6058349609375, -1.529541015625, -1.4532470703125, -1.376953125, -1.3006591796875, -1.224365234375, -1.1480712890625, -1.07177734375, -0.9954833984375, -0.919189453125, -0.8428955078125, -0.7666015625, -0.6903076171875, -0.614013671875, -0.5377197265625, -0.46142578125, -0.3851318359375, -0.308837890625, -0.2325439453125, -0.15625, -0.0799560546875, -0.003662109375, 0.0726318359375, 0.14892578125, 0.2252197265625, 0.301513671875, 0.3778076171875, 0.4541015625, 0.5303955078125, 0.606689453125, 0.6829833984375, 0.75927734375, 0.8355712890625, 0.911865234375, 0.9881591796875, 1.064453125, 1.1407470703125, 1.217041015625, 1.2933349609375, 1.36962890625, 1.4459228515625, 1.522216796875, 1.5985107421875, 1.6748046875, 1.7510986328125, 1.827392578125, 1.9036865234375, 1.97998046875, 2.0562744140625, 2.132568359375, 2.2088623046875, 2.28515625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 8.0, 11.0, 15.0, 20.0, 14.0, 22.0, 30.0, 36.0, 48.0, 67.0, 96.0, 102.0, 84.0, 73.0, 73.0, 60.0, 53.0, 30.0, 24.0, 26.0, 18.0, 12.0, 17.0, 9.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12744140625, -0.12257003784179688, -0.11769866943359375, -0.11282730102539062, -0.1079559326171875, -0.10308456420898438, -0.09821319580078125, -0.09334182739257812, -0.088470458984375, -0.08359909057617188, -0.07872772216796875, -0.07385635375976562, -0.0689849853515625, -0.06411361694335938, -0.05924224853515625, -0.054370880126953125, -0.04949951171875, -0.044628143310546875, -0.03975677490234375, -0.034885406494140625, -0.0300140380859375, -0.025142669677734375, -0.02027130126953125, -0.015399932861328125, -0.010528564453125, -0.005657196044921875, -0.00078582763671875, 0.004085540771484375, 0.0089569091796875, 0.013828277587890625, 0.01869964599609375, 0.023571014404296875, 0.0284423828125, 0.033313751220703125, 0.03818511962890625, 0.043056488037109375, 0.0479278564453125, 0.052799224853515625, 0.05767059326171875, 0.06254196166992188, 0.067413330078125, 0.07228469848632812, 0.07715606689453125, 0.08202743530273438, 0.0868988037109375, 0.09177017211914062, 0.09664154052734375, 0.10151290893554688, 0.10638427734375, 0.11125564575195312, 0.11612701416015625, 0.12099838256835938, 0.1258697509765625, 0.13074111938476562, 0.13561248779296875, 0.14048385620117188, 0.145355224609375, 0.15022659301757812, 0.15509796142578125, 0.15996932983398438, 0.1648406982421875, 0.16971206665039062, 0.17458343505859375, 0.17945480346679688, 0.184326171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 2.0, 9.0, 17.0, 15.0, 13.0, 23.0, 26.0, 41.0, 53.0, 90.0, 184.0, 468.0, 26286.0, 1019458.0, 1215.0, 285.0, 102.0, 73.0, 36.0, 24.0, 27.0, 18.0, 12.0, 12.0, 13.0, 6.0, 7.0, 4.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.3203125, -4.20733642578125, -4.0943603515625, -3.98138427734375, -3.868408203125, -3.75543212890625, -3.6424560546875, -3.52947998046875, -3.41650390625, -3.30352783203125, -3.1905517578125, -3.07757568359375, -2.964599609375, -2.85162353515625, -2.7386474609375, -2.62567138671875, -2.5126953125, -2.39971923828125, -2.2867431640625, -2.17376708984375, -2.060791015625, -1.94781494140625, -1.8348388671875, -1.72186279296875, -1.60888671875, -1.49591064453125, -1.3829345703125, -1.26995849609375, -1.156982421875, -1.04400634765625, -0.9310302734375, -0.81805419921875, -0.705078125, -0.59210205078125, -0.4791259765625, -0.36614990234375, -0.253173828125, -0.14019775390625, -0.0272216796875, 0.08575439453125, 0.19873046875, 0.31170654296875, 0.4246826171875, 0.53765869140625, 0.650634765625, 0.76361083984375, 0.8765869140625, 0.98956298828125, 1.1025390625, 1.21551513671875, 1.3284912109375, 1.44146728515625, 1.554443359375, 1.66741943359375, 1.7803955078125, 1.89337158203125, 2.00634765625, 2.11932373046875, 2.2322998046875, 2.34527587890625, 2.458251953125, 2.57122802734375, 2.6842041015625, 2.79718017578125, 2.91015625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 14.0, 193.0, 764.0, 43.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.580434799194336, -4.496021270751953, -4.41160774230957, -4.327194690704346, -4.242781162261963, -4.15836763381958, -4.073954105377197, -3.9895408153533936, -3.9051272869110107, -3.820713758468628, -3.736300468444824, -3.6518869400024414, -3.5674736499786377, -3.483060121536255, -3.398646831512451, -3.3142333030700684, -3.2298197746276855, -3.1454062461853027, -3.060992956161499, -2.976579427719116, -2.8921661376953125, -2.8077526092529297, -2.723339080810547, -2.638925790786743, -2.5545125007629395, -2.4700989723205566, -2.385685682296753, -2.30127215385437, -2.2168588638305664, -2.1324453353881836, -2.048031806945801, -1.963618516921997, -1.8792049884796143, -1.794791579246521, -1.7103781700134277, -1.625964641571045, -1.5415512323379517, -1.4571378231048584, -1.3727244138717651, -1.2883110046386719, -1.203897476196289, -1.1194840669631958, -1.0350706577301025, -0.9506571888923645, -0.8662437200546265, -0.7818303108215332, -0.6974169015884399, -0.6130034327507019, -0.5285900235176086, -0.444176584482193, -0.35976314544677734, -0.2753497362136841, -0.19093629717826843, -0.10652285814285278, -0.02210944890975952, 0.062304019927978516, 0.14671742916107178, 0.23113086819648743, 0.3155443072319031, 0.39995771646499634, 0.484371155500412, 0.5687845945358276, 0.6531980037689209, 0.7376114726066589, 0.8220248818397522]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 6.0, 8.0, 3.0, 15.0, 12.0, 22.0, 28.0, 28.0, 12.0, 23.0, 34.0, 38.0, 29.0, 31.0, 48.0, 48.0, 58.0, 41.0, 44.0, 36.0, 50.0, 35.0, 34.0, 30.0, 34.0, 32.0, 33.0, 17.0, 20.0, 18.0, 16.0, 23.0, 20.0, 15.0, 7.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.4646565914154053, -0.4518785774707794, -0.43910056352615356, -0.4263225793838501, -0.41354456543922424, -0.4007665514945984, -0.38798853754997253, -0.3752105236053467, -0.3624325096607208, -0.34965449571609497, -0.3368764817714691, -0.32409846782684326, -0.3113204836845398, -0.29854246973991394, -0.2857644557952881, -0.27298644185066223, -0.2602084279060364, -0.24743041396141052, -0.23465241491794586, -0.22187440097332, -0.20909638702869415, -0.1963183879852295, -0.18354037404060364, -0.17076236009597778, -0.15798437595367432, -0.14520636200904846, -0.1324283629655838, -0.11965034902095795, -0.10687233507633209, -0.09409432858228683, -0.08131632208824158, -0.06853830814361572, -0.05576029419898987, -0.04298228397965431, -0.030204275622963905, -0.0174262672662735, -0.0046482570469379425, 0.008129753172397614, 0.02090775966644287, 0.033685773611068726, 0.04646378010511398, 0.05924179032444954, 0.0720198005437851, 0.08479780703783035, 0.09757581353187561, 0.11035382747650146, 0.12313183397054672, 0.13590985536575317, 0.14868785440921783, 0.1614658683538437, 0.17424386739730835, 0.1870218813419342, 0.19979989528656006, 0.2125779092311859, 0.22535590827465057, 0.23813392221927643, 0.2509119212627411, 0.26368993520736694, 0.2764679491519928, 0.28924596309661865, 0.3020239472389221, 0.314801961183548, 0.32757997512817383, 0.3403579890727997, 0.35313600301742554]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 9.0, 9.0, 12.0, 18.0, 18.0, 18.0, 26.0, 28.0, 27.0, 23.0, 31.0, 37.0, 51.0, 37.0, 44.0, 51.0, 44.0, 59.0, 49.0, 49.0, 40.0, 43.0, 47.0, 31.0, 39.0, 27.0, 29.0, 10.0, 19.0, 10.0, 16.0, 13.0, 10.0, 5.0, 6.0, 6.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.289794921875, -6.04833984375, -5.806884765625, -5.5654296875, -5.323974609375, -5.08251953125, -4.841064453125, -4.599609375, -4.358154296875, -4.11669921875, -3.875244140625, -3.6337890625, -3.392333984375, -3.15087890625, -2.909423828125, -2.66796875, -2.426513671875, -2.18505859375, -1.943603515625, -1.7021484375, -1.460693359375, -1.21923828125, -0.977783203125, -0.736328125, -0.494873046875, -0.25341796875, -0.011962890625, 0.2294921875, 0.470947265625, 0.71240234375, 0.953857421875, 1.1953125, 1.436767578125, 1.67822265625, 1.919677734375, 2.1611328125, 2.402587890625, 2.64404296875, 2.885498046875, 3.126953125, 3.368408203125, 3.60986328125, 3.851318359375, 4.0927734375, 4.334228515625, 4.57568359375, 4.817138671875, 5.05859375, 5.300048828125, 5.54150390625, 5.782958984375, 6.0244140625, 6.265869140625, 6.50732421875, 6.748779296875, 6.990234375, 7.231689453125, 7.47314453125, 7.714599609375, 7.9560546875, 8.197509765625, 8.43896484375, 8.680419921875, 8.921875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 16.0, 11.0, 19.0, 30.0, 56.0, 105.0, 170.0, 321.0, 580.0, 1066.0, 1977.0, 3939.0, 7624.0, 15627.0, 34669.0, 82461.0, 200566.0, 371776.0, 188257.0, 76739.0, 32622.0, 14814.0, 7280.0, 3700.0, 1880.0, 978.0, 567.0, 286.0, 200.0, 91.0, 58.0, 31.0, 22.0, 5.0, 4.0, 6.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -8.00537109375, -7.7138671875, -7.42236328125, -7.130859375, -6.83935546875, -6.5478515625, -6.25634765625, -5.96484375, -5.67333984375, -5.3818359375, -5.09033203125, -4.798828125, -4.50732421875, -4.2158203125, -3.92431640625, -3.6328125, -3.34130859375, -3.0498046875, -2.75830078125, -2.466796875, -2.17529296875, -1.8837890625, -1.59228515625, -1.30078125, -1.00927734375, -0.7177734375, -0.42626953125, -0.134765625, 0.15673828125, 0.4482421875, 0.73974609375, 1.03125, 1.32275390625, 1.6142578125, 1.90576171875, 2.197265625, 2.48876953125, 2.7802734375, 3.07177734375, 3.36328125, 3.65478515625, 3.9462890625, 4.23779296875, 4.529296875, 4.82080078125, 5.1123046875, 5.40380859375, 5.6953125, 5.98681640625, 6.2783203125, 6.56982421875, 6.861328125, 7.15283203125, 7.4443359375, 7.73583984375, 8.02734375, 8.31884765625, 8.6103515625, 8.90185546875, 9.193359375, 9.48486328125, 9.7763671875, 10.06787109375, 10.359375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 8.0, 5.0, 10.0, 10.0, 28.0, 25.0, 30.0, 36.0, 33.0, 40.0, 42.0, 49.0, 83.0, 182.0, 306.0, 1486.0, 204.0, 92.0, 66.0, 45.0, 48.0, 42.0, 34.0, 22.0, 33.0, 20.0, 20.0, 10.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.28125, -25.411376953125, -24.54150390625, -23.671630859375, -22.8017578125, -21.931884765625, -21.06201171875, -20.192138671875, -19.322265625, -18.452392578125, -17.58251953125, -16.712646484375, -15.8427734375, -14.972900390625, -14.10302734375, -13.233154296875, -12.36328125, -11.493408203125, -10.62353515625, -9.753662109375, -8.8837890625, -8.013916015625, -7.14404296875, -6.274169921875, -5.404296875, -4.534423828125, -3.66455078125, -2.794677734375, -1.9248046875, -1.054931640625, -0.18505859375, 0.684814453125, 1.5546875, 2.424560546875, 3.29443359375, 4.164306640625, 5.0341796875, 5.904052734375, 6.77392578125, 7.643798828125, 8.513671875, 9.383544921875, 10.25341796875, 11.123291015625, 11.9931640625, 12.863037109375, 13.73291015625, 14.602783203125, 15.47265625, 16.342529296875, 17.21240234375, 18.082275390625, 18.9521484375, 19.822021484375, 20.69189453125, 21.561767578125, 22.431640625, 23.301513671875, 24.17138671875, 25.041259765625, 25.9111328125, 26.781005859375, 27.65087890625, 28.520751953125, 29.390625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 7.0, 7.0, 8.0, 16.0, 18.0, 20.0, 24.0, 46.0, 62.0, 80.0, 116.0, 166.0, 273.0, 489.0, 1536.0, 62764.0, 3048845.0, 28852.0, 1075.0, 432.0, 272.0, 171.0, 109.0, 91.0, 47.0, 42.0, 34.0, 27.0, 14.0, 17.0, 8.0, 8.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-68.25, -66.078125, -63.90625, -61.734375, -59.5625, -57.390625, -55.21875, -53.046875, -50.875, -48.703125, -46.53125, -44.359375, -42.1875, -40.015625, -37.84375, -35.671875, -33.5, -31.328125, -29.15625, -26.984375, -24.8125, -22.640625, -20.46875, -18.296875, -16.125, -13.953125, -11.78125, -9.609375, -7.4375, -5.265625, -3.09375, -0.921875, 1.25, 3.421875, 5.59375, 7.765625, 9.9375, 12.109375, 14.28125, 16.453125, 18.625, 20.796875, 22.96875, 25.140625, 27.3125, 29.484375, 31.65625, 33.828125, 36.0, 38.171875, 40.34375, 42.515625, 44.6875, 46.859375, 49.03125, 51.203125, 53.375, 55.546875, 57.71875, 59.890625, 62.0625, 64.234375, 66.40625, 68.578125, 70.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 22.0, 23.0, 50.0, 86.0, 120.0, 145.0, 183.0, 140.0, 98.0, 76.0, 34.0, 20.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.95283126831055, -41.10564422607422, -39.258460998535156, -37.41127395629883, -35.5640869140625, -33.71690368652344, -31.86971664428711, -30.02252960205078, -28.175344467163086, -26.32815933227539, -24.480972290039062, -22.633787155151367, -20.786602020263672, -18.939414978027344, -17.09222984313965, -15.245043754577637, -13.397857666015625, -11.550671577453613, -9.703485488891602, -7.856300354003906, -6.0091142654418945, -4.161928176879883, -2.3147430419921875, -0.4675569534301758, 1.379629135131836, 3.2268149852752686, 5.074000835418701, 6.921186447143555, 8.768372535705566, 10.615558624267578, 12.462743759155273, 14.309929847717285, 16.157119750976562, 18.004304885864258, 19.851491928100586, 21.69867706298828, 23.54586410522461, 25.393049240112305, 27.240234375, 29.087421417236328, 30.934606552124023, 32.78179168701172, 34.62897872924805, 36.476165771484375, 38.32334899902344, 40.170536041259766, 42.017723083496094, 43.864906311035156, 45.712093353271484, 47.55928039550781, 49.406463623046875, 51.2536506652832, 53.10083770751953, 54.948020935058594, 56.79520797729492, 58.64239501953125, 60.48957824707031, 62.33676528930664, 64.18395233154297, 66.03113555908203, 67.8783187866211, 69.72550964355469, 71.57269287109375, 73.41987609863281, 75.2670669555664]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 9.0, 7.0, 11.0, 5.0, 10.0, 13.0, 17.0, 22.0, 22.0, 21.0, 24.0, 29.0, 18.0, 42.0, 40.0, 37.0, 43.0, 34.0, 41.0, 35.0, 37.0, 49.0, 39.0, 34.0, 24.0, 31.0, 31.0, 28.0, 32.0, 33.0, 19.0, 28.0, 20.0, 24.0, 12.0, 14.0, 14.0, 10.0, 9.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-51.821075439453125, -50.0968017578125, -48.37252426147461, -46.648250579833984, -44.92397689819336, -43.19969940185547, -41.475425720214844, -39.75115203857422, -38.026878356933594, -36.30260467529297, -34.57832717895508, -32.85405349731445, -31.129779815673828, -29.40550422668457, -27.681228637695312, -25.956954956054688, -24.232677459716797, -22.50840187072754, -20.784128189086914, -19.059852600097656, -17.33557891845703, -15.611303329467773, -13.887027740478516, -12.162753105163574, -10.438478469848633, -8.714203834533691, -6.989928722381592, -5.265653610229492, -3.541378974914551, -1.8171043395996094, -0.09282875061035156, 1.6314458847045898, 3.3557205200195312, 5.079995155334473, 6.804270267486572, 8.528545379638672, 10.252820014953613, 11.977094650268555, 13.701370239257812, 15.425644874572754, 17.149919509887695, 18.874195098876953, 20.598468780517578, 22.322744369506836, 24.047019958496094, 25.77129364013672, 27.495569229125977, 29.219844818115234, 30.94411849975586, 32.668392181396484, 34.392669677734375, 36.116943359375, 37.841217041015625, 39.56549072265625, 41.28976821899414, 43.014041900634766, 44.738319396972656, 46.46259307861328, 48.18687057495117, 49.9111442565918, 51.63541793823242, 53.35969543457031, 55.08396911621094, 56.80824279785156, 58.53251647949219]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 4.0, 12.0, 7.0, 16.0, 14.0, 19.0, 26.0, 14.0, 26.0, 26.0, 34.0, 35.0, 36.0, 46.0, 45.0, 46.0, 38.0, 46.0, 54.0, 40.0, 42.0, 44.0, 38.0, 44.0, 28.0, 38.0, 30.0, 25.0, 18.0, 17.0, 16.0, 14.0, 14.0, 9.0, 7.0, 4.0, 5.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.12109375, -6.87518310546875, -6.6292724609375, -6.38336181640625, -6.137451171875, -5.89154052734375, -5.6456298828125, -5.39971923828125, -5.15380859375, -4.90789794921875, -4.6619873046875, -4.41607666015625, -4.170166015625, -3.92425537109375, -3.6783447265625, -3.43243408203125, -3.1865234375, -2.94061279296875, -2.6947021484375, -2.44879150390625, -2.202880859375, -1.95697021484375, -1.7110595703125, -1.46514892578125, -1.21923828125, -0.97332763671875, -0.7274169921875, -0.48150634765625, -0.235595703125, 0.01031494140625, 0.2562255859375, 0.50213623046875, 0.748046875, 0.99395751953125, 1.2398681640625, 1.48577880859375, 1.731689453125, 1.97760009765625, 2.2235107421875, 2.46942138671875, 2.71533203125, 2.96124267578125, 3.2071533203125, 3.45306396484375, 3.698974609375, 3.94488525390625, 4.1907958984375, 4.43670654296875, 4.6826171875, 4.92852783203125, 5.1744384765625, 5.42034912109375, 5.666259765625, 5.91217041015625, 6.1580810546875, 6.40399169921875, 6.64990234375, 6.89581298828125, 7.1417236328125, 7.38763427734375, 7.633544921875, 7.87945556640625, 8.1253662109375, 8.37127685546875, 8.6171875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 9.0, 8.0, 14.0, 12.0, 20.0, 21.0, 40.0, 42.0, 66.0, 98.0, 150.0, 244.0, 562.0, 1079.0, 2853.0, 8988.0, 32855.0, 130557.0, 509404.0, 1462719.0, 1410724.0, 471614.0, 118694.0, 29993.0, 8349.0, 2749.0, 1067.0, 526.0, 256.0, 173.0, 121.0, 76.0, 56.0, 35.0, 25.0, 25.0, 14.0, 15.0, 10.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.7421875, -12.3778076171875, -12.013427734375, -11.6490478515625, -11.28466796875, -10.9202880859375, -10.555908203125, -10.1915283203125, -9.8271484375, -9.4627685546875, -9.098388671875, -8.7340087890625, -8.36962890625, -8.0052490234375, -7.640869140625, -7.2764892578125, -6.912109375, -6.5477294921875, -6.183349609375, -5.8189697265625, -5.45458984375, -5.0902099609375, -4.725830078125, -4.3614501953125, -3.9970703125, -3.6326904296875, -3.268310546875, -2.9039306640625, -2.53955078125, -2.1751708984375, -1.810791015625, -1.4464111328125, -1.08203125, -0.7176513671875, -0.353271484375, 0.0111083984375, 0.37548828125, 0.7398681640625, 1.104248046875, 1.4686279296875, 1.8330078125, 2.1973876953125, 2.561767578125, 2.9261474609375, 3.29052734375, 3.6549072265625, 4.019287109375, 4.3836669921875, 4.748046875, 5.1124267578125, 5.476806640625, 5.8411865234375, 6.20556640625, 6.5699462890625, 6.934326171875, 7.2987060546875, 7.6630859375, 8.0274658203125, 8.391845703125, 8.7562255859375, 9.12060546875, 9.4849853515625, 9.849365234375, 10.2137451171875, 10.578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 12.0, 26.0, 13.0, 20.0, 34.0, 37.0, 57.0, 79.0, 86.0, 104.0, 124.0, 189.0, 214.0, 252.0, 287.0, 331.0, 336.0, 346.0, 303.0, 230.0, 197.0, 140.0, 132.0, 112.0, 81.0, 61.0, 50.0, 41.0, 42.0, 34.0, 25.0, 10.0, 8.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.8583984375, -9.498046875, -9.1376953125, -8.77734375, -8.4169921875, -8.056640625, -7.6962890625, -7.3359375, -6.9755859375, -6.615234375, -6.2548828125, -5.89453125, -5.5341796875, -5.173828125, -4.8134765625, -4.453125, -4.0927734375, -3.732421875, -3.3720703125, -3.01171875, -2.6513671875, -2.291015625, -1.9306640625, -1.5703125, -1.2099609375, -0.849609375, -0.4892578125, -0.12890625, 0.2314453125, 0.591796875, 0.9521484375, 1.3125, 1.6728515625, 2.033203125, 2.3935546875, 2.75390625, 3.1142578125, 3.474609375, 3.8349609375, 4.1953125, 4.5556640625, 4.916015625, 5.2763671875, 5.63671875, 5.9970703125, 6.357421875, 6.7177734375, 7.078125, 7.4384765625, 7.798828125, 8.1591796875, 8.51953125, 8.8798828125, 9.240234375, 9.6005859375, 9.9609375, 10.3212890625, 10.681640625, 11.0419921875, 11.40234375, 11.7626953125, 12.123046875, 12.4833984375, 12.84375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 4.0, 20.0, 28.0, 36.0, 45.0, 53.0, 56.0, 75.0, 99.0, 156.0, 192.0, 258.0, 527.0, 2144.0, 36881.0, 1076390.0, 2910618.0, 158218.0, 6408.0, 839.0, 342.0, 213.0, 158.0, 134.0, 98.0, 59.0, 47.0, 40.0, 25.0, 15.0, 21.0, 18.0, 8.0, 4.0, 7.0, 8.0, 4.0, 1.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-42.0625, -40.8681640625, -39.673828125, -38.4794921875, -37.28515625, -36.0908203125, -34.896484375, -33.7021484375, -32.5078125, -31.3134765625, -30.119140625, -28.9248046875, -27.73046875, -26.5361328125, -25.341796875, -24.1474609375, -22.953125, -21.7587890625, -20.564453125, -19.3701171875, -18.17578125, -16.9814453125, -15.787109375, -14.5927734375, -13.3984375, -12.2041015625, -11.009765625, -9.8154296875, -8.62109375, -7.4267578125, -6.232421875, -5.0380859375, -3.84375, -2.6494140625, -1.455078125, -0.2607421875, 0.93359375, 2.1279296875, 3.322265625, 4.5166015625, 5.7109375, 6.9052734375, 8.099609375, 9.2939453125, 10.48828125, 11.6826171875, 12.876953125, 14.0712890625, 15.265625, 16.4599609375, 17.654296875, 18.8486328125, 20.04296875, 21.2373046875, 22.431640625, 23.6259765625, 24.8203125, 26.0146484375, 27.208984375, 28.4033203125, 29.59765625, 30.7919921875, 31.986328125, 33.1806640625, 34.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 22.0, 69.0, 182.0, 229.0, 251.0, 156.0, 70.0, 23.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.61590576171875, -269.2176208496094, -263.8193054199219, -258.4210205078125, -253.022705078125, -247.62440490722656, -242.22610473632812, -236.8278045654297, -231.42950439453125, -226.0312042236328, -220.63290405273438, -215.23460388183594, -209.8363037109375, -204.43800354003906, -199.03970336914062, -193.6414031982422, -188.24310302734375, -182.8448028564453, -177.44650268554688, -172.04820251464844, -166.64990234375, -161.25160217285156, -155.85330200195312, -150.4550018310547, -145.0567169189453, -139.65841674804688, -134.26011657714844, -128.86181640625, -123.46351623535156, -118.06521606445312, -112.66691589355469, -107.26861572265625, -101.87032318115234, -96.4720230102539, -91.07372283935547, -85.67542266845703, -80.2771224975586, -74.87882232666016, -69.48052978515625, -64.08222961425781, -58.68392562866211, -53.28562545776367, -47.887325286865234, -42.48902893066406, -37.090728759765625, -31.692426681518555, -26.29412841796875, -20.895828247070312, -15.497528076171875, -10.099227905273438, -4.700928688049316, 0.6973705291748047, 6.095670700073242, 11.49397087097168, 16.892269134521484, 22.290569305419922, 27.68886947631836, 33.0871696472168, 38.485469818115234, 43.883766174316406, 49.282066345214844, 54.68036651611328, 60.07866668701172, 65.47696685791016, 70.8752670288086]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 14.0, 8.0, 10.0, 17.0, 18.0, 19.0, 10.0, 13.0, 17.0, 26.0, 25.0, 27.0, 30.0, 44.0, 39.0, 43.0, 39.0, 38.0, 46.0, 44.0, 42.0, 44.0, 48.0, 44.0, 31.0, 35.0, 30.0, 29.0, 20.0, 24.0, 30.0, 24.0, 16.0, 6.0, 12.0, 5.0, 9.0, 5.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.33302307128906, -46.76298904418945, -45.192955017089844, -43.6229248046875, -42.05289077758789, -40.48285675048828, -38.91282272338867, -37.34278869628906, -35.77275848388672, -34.20272445678711, -32.6326904296875, -31.062658309936523, -29.492626190185547, -27.922592163085938, -26.352558135986328, -24.78252410888672, -23.21249008178711, -21.6424560546875, -20.072423934936523, -18.502389907836914, -16.932357788085938, -15.362323760986328, -13.792289733886719, -12.222256660461426, -10.652223587036133, -9.08219051361084, -7.512156963348389, -5.9421234130859375, -4.3720903396606445, -2.8020572662353516, -1.2320232391357422, 0.3380098342895508, 1.9080467224121094, 3.4780800342559814, 5.0481133460998535, 6.618146896362305, 8.188179969787598, 9.75821304321289, 11.3282470703125, 12.898280143737793, 14.468313217163086, 16.038347244262695, 17.608379364013672, 19.17841339111328, 20.74844741821289, 22.318479537963867, 23.888513565063477, 25.458545684814453, 27.028579711914062, 28.598613739013672, 30.16864585876465, 31.738679885864258, 33.308712005615234, 34.878746032714844, 36.44878005981445, 38.01881408691406, 39.588844299316406, 41.158878326416016, 42.728912353515625, 44.29894256591797, 45.86897659301758, 47.43901062011719, 49.0090446472168, 50.579078674316406, 52.149112701416016]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 5.0, 7.0, 13.0, 10.0, 9.0, 22.0, 17.0, 24.0, 29.0, 27.0, 27.0, 21.0, 24.0, 36.0, 31.0, 47.0, 39.0, 53.0, 47.0, 39.0, 46.0, 30.0, 33.0, 31.0, 36.0, 42.0, 28.0, 22.0, 29.0, 17.0, 26.0, 23.0, 18.0, 8.0, 6.0, 8.0, 14.0, 8.0, 10.0, 4.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.6171875, -6.40484619140625, -6.1925048828125, -5.98016357421875, -5.767822265625, -5.55548095703125, -5.3431396484375, -5.13079833984375, -4.91845703125, -4.70611572265625, -4.4937744140625, -4.28143310546875, -4.069091796875, -3.85675048828125, -3.6444091796875, -3.43206787109375, -3.2197265625, -3.00738525390625, -2.7950439453125, -2.58270263671875, -2.370361328125, -2.15802001953125, -1.9456787109375, -1.73333740234375, -1.52099609375, -1.30865478515625, -1.0963134765625, -0.88397216796875, -0.671630859375, -0.45928955078125, -0.2469482421875, -0.03460693359375, 0.177734375, 0.39007568359375, 0.6024169921875, 0.81475830078125, 1.027099609375, 1.23944091796875, 1.4517822265625, 1.66412353515625, 1.87646484375, 2.08880615234375, 2.3011474609375, 2.51348876953125, 2.725830078125, 2.93817138671875, 3.1505126953125, 3.36285400390625, 3.5751953125, 3.78753662109375, 3.9998779296875, 4.21221923828125, 4.424560546875, 4.63690185546875, 4.8492431640625, 5.06158447265625, 5.27392578125, 5.48626708984375, 5.6986083984375, 5.91094970703125, 6.123291015625, 6.33563232421875, 6.5479736328125, 6.76031494140625, 6.97265625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 18.0, 22.0, 44.0, 55.0, 96.0, 139.0, 202.0, 280.0, 404.0, 697.0, 1021.0, 1467.0, 2312.0, 3313.0, 5239.0, 7612.0, 11082.0, 16041.0, 23204.0, 32393.0, 44306.0, 58566.0, 74660.0, 90416.0, 103396.0, 108031.0, 102195.0, 88657.0, 72706.0, 56697.0, 42539.0, 30880.0, 22156.0, 15308.0, 10700.0, 7187.0, 4804.0, 3351.0, 2150.0, 1408.0, 916.0, 640.0, 415.0, 272.0, 205.0, 118.0, 85.0, 43.0, 25.0, 28.0, 22.0, 8.0, 9.0, 3.0, 5.0], "bins": [-1.1826171875, -1.1482696533203125, -1.113922119140625, -1.0795745849609375, -1.04522705078125, -1.0108795166015625, -0.976531982421875, -0.9421844482421875, -0.9078369140625, -0.8734893798828125, -0.839141845703125, -0.8047943115234375, -0.77044677734375, -0.7360992431640625, -0.701751708984375, -0.6674041748046875, -0.633056640625, -0.5987091064453125, -0.564361572265625, -0.5300140380859375, -0.49566650390625, -0.4613189697265625, -0.426971435546875, -0.3926239013671875, -0.3582763671875, -0.3239288330078125, -0.289581298828125, -0.2552337646484375, -0.22088623046875, -0.1865386962890625, -0.152191162109375, -0.1178436279296875, -0.08349609375, -0.0491485595703125, -0.014801025390625, 0.0195465087890625, 0.05389404296875, 0.0882415771484375, 0.122589111328125, 0.1569366455078125, 0.1912841796875, 0.2256317138671875, 0.259979248046875, 0.2943267822265625, 0.32867431640625, 0.3630218505859375, 0.397369384765625, 0.4317169189453125, 0.466064453125, 0.5004119873046875, 0.534759521484375, 0.5691070556640625, 0.60345458984375, 0.6378021240234375, 0.672149658203125, 0.7064971923828125, 0.7408447265625, 0.7751922607421875, 0.809539794921875, 0.8438873291015625, 0.87823486328125, 0.9125823974609375, 0.946929931640625, 0.9812774658203125, 1.015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 2.0, 10.0, 10.0, 10.0, 7.0, 8.0, 20.0, 11.0, 15.0, 24.0, 29.0, 36.0, 28.0, 29.0, 47.0, 38.0, 33.0, 51.0, 30.0, 38.0, 1057.0, 49.0, 40.0, 46.0, 53.0, 28.0, 35.0, 31.0, 38.0, 27.0, 18.0, 21.0, 16.0, 11.0, 16.0, 10.0, 13.0, 13.0, 10.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.296875, -5.1241455078125, -4.951416015625, -4.7786865234375, -4.60595703125, -4.4332275390625, -4.260498046875, -4.0877685546875, -3.9150390625, -3.7423095703125, -3.569580078125, -3.3968505859375, -3.22412109375, -3.0513916015625, -2.878662109375, -2.7059326171875, -2.533203125, -2.3604736328125, -2.187744140625, -2.0150146484375, -1.84228515625, -1.6695556640625, -1.496826171875, -1.3240966796875, -1.1513671875, -0.9786376953125, -0.805908203125, -0.6331787109375, -0.46044921875, -0.2877197265625, -0.114990234375, 0.0577392578125, 0.23046875, 0.4031982421875, 0.575927734375, 0.7486572265625, 0.92138671875, 1.0941162109375, 1.266845703125, 1.4395751953125, 1.6123046875, 1.7850341796875, 1.957763671875, 2.1304931640625, 2.30322265625, 2.4759521484375, 2.648681640625, 2.8214111328125, 2.994140625, 3.1668701171875, 3.339599609375, 3.5123291015625, 3.68505859375, 3.8577880859375, 4.030517578125, 4.2032470703125, 4.3759765625, 4.5487060546875, 4.721435546875, 4.8941650390625, 5.06689453125, 5.2396240234375, 5.412353515625, 5.5850830078125, 5.7578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 10.0, 3.0, 9.0, 10.0, 17.0, 23.0, 42.0, 81.0, 75.0, 123.0, 165.0, 266.0, 329.0, 488.0, 705.0, 1114.0, 1518.0, 2357.0, 3351.0, 4869.0, 6958.0, 10126.0, 15044.0, 22512.0, 37522.0, 1862692.0, 48732.0, 25165.0, 16683.0, 11330.0, 7592.0, 5359.0, 3672.0, 2562.0, 1782.0, 1216.0, 818.0, 581.0, 390.0, 270.0, 185.0, 123.0, 79.0, 52.0, 39.0, 29.0, 21.0, 12.0, 17.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.945709228515625, -1.87774658203125, -1.809783935546875, -1.7418212890625, -1.673858642578125, -1.60589599609375, -1.537933349609375, -1.469970703125, -1.402008056640625, -1.33404541015625, -1.266082763671875, -1.1981201171875, -1.130157470703125, -1.06219482421875, -0.994232177734375, -0.92626953125, -0.858306884765625, -0.79034423828125, -0.722381591796875, -0.6544189453125, -0.586456298828125, -0.51849365234375, -0.450531005859375, -0.382568359375, -0.314605712890625, -0.24664306640625, -0.178680419921875, -0.1107177734375, -0.042755126953125, 0.02520751953125, 0.093170166015625, 0.1611328125, 0.229095458984375, 0.29705810546875, 0.365020751953125, 0.4329833984375, 0.500946044921875, 0.56890869140625, 0.636871337890625, 0.704833984375, 0.772796630859375, 0.84075927734375, 0.908721923828125, 0.9766845703125, 1.044647216796875, 1.11260986328125, 1.180572509765625, 1.24853515625, 1.316497802734375, 1.38446044921875, 1.452423095703125, 1.5203857421875, 1.588348388671875, 1.65631103515625, 1.724273681640625, 1.792236328125, 1.860198974609375, 1.92816162109375, 1.996124267578125, 2.0640869140625, 2.132049560546875, 2.20001220703125, 2.267974853515625, 2.3359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 4.0, 11.0, 10.0, 12.0, 15.0, 17.0, 12.0, 28.0, 28.0, 45.0, 63.0, 90.0, 120.0, 142.0, 113.0, 65.0, 44.0, 33.0, 22.0, 24.0, 12.0, 15.0, 11.0, 8.0, 13.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1195068359375, -0.1157846450805664, -0.11206245422363281, -0.10834026336669922, -0.10461807250976562, -0.10089588165283203, -0.09717369079589844, -0.09345149993896484, -0.08972930908203125, -0.08600711822509766, -0.08228492736816406, -0.07856273651123047, -0.07484054565429688, -0.07111835479736328, -0.06739616394042969, -0.0636739730834961, -0.0599517822265625, -0.056229591369628906, -0.05250740051269531, -0.04878520965576172, -0.045063018798828125, -0.04134082794189453, -0.03761863708496094, -0.033896446228027344, -0.03017425537109375, -0.026452064514160156, -0.022729873657226562, -0.01900768280029297, -0.015285491943359375, -0.011563301086425781, -0.007841110229492188, -0.004118919372558594, -0.000396728515625, 0.0033254623413085938, 0.0070476531982421875, 0.010769844055175781, 0.014492034912109375, 0.01821422576904297, 0.021936416625976562, 0.025658607482910156, 0.02938079833984375, 0.033102989196777344, 0.03682518005371094, 0.04054737091064453, 0.044269561767578125, 0.04799175262451172, 0.05171394348144531, 0.055436134338378906, 0.0591583251953125, 0.0628805160522461, 0.06660270690917969, 0.07032489776611328, 0.07404708862304688, 0.07776927947998047, 0.08149147033691406, 0.08521366119384766, 0.08893585205078125, 0.09265804290771484, 0.09638023376464844, 0.10010242462158203, 0.10382461547851562, 0.10754680633544922, 0.11126899719238281, 0.1149911880493164, 0.11871337890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 5.0, 8.0, 4.0, 6.0, 6.0, 11.0, 12.0, 13.0, 19.0, 32.0, 24.0, 50.0, 51.0, 136.0, 420.0, 3260.0, 933907.0, 108350.0, 1604.0, 279.0, 126.0, 52.0, 45.0, 26.0, 19.0, 11.0, 19.0, 13.0, 12.0, 5.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.587890625, -2.50665283203125, -2.4254150390625, -2.34417724609375, -2.262939453125, -2.18170166015625, -2.1004638671875, -2.01922607421875, -1.93798828125, -1.85675048828125, -1.7755126953125, -1.69427490234375, -1.613037109375, -1.53179931640625, -1.4505615234375, -1.36932373046875, -1.2880859375, -1.20684814453125, -1.1256103515625, -1.04437255859375, -0.963134765625, -0.88189697265625, -0.8006591796875, -0.71942138671875, -0.63818359375, -0.55694580078125, -0.4757080078125, -0.39447021484375, -0.313232421875, -0.23199462890625, -0.1507568359375, -0.06951904296875, 0.01171875, 0.09295654296875, 0.1741943359375, 0.25543212890625, 0.336669921875, 0.41790771484375, 0.4991455078125, 0.58038330078125, 0.66162109375, 0.74285888671875, 0.8240966796875, 0.90533447265625, 0.986572265625, 1.06781005859375, 1.1490478515625, 1.23028564453125, 1.3115234375, 1.39276123046875, 1.4739990234375, 1.55523681640625, 1.636474609375, 1.71771240234375, 1.7989501953125, 1.88018798828125, 1.96142578125, 2.04266357421875, 2.1239013671875, 2.20513916015625, 2.286376953125, 2.36761474609375, 2.4488525390625, 2.53009033203125, 2.611328125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 9.0, 95.0, 646.0, 238.0, 25.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.945443868637085, -2.88840913772583, -2.831374168395996, -2.774339437484741, -2.7173044681549072, -2.6602697372436523, -2.6032347679138184, -2.5462000370025635, -2.4891650676727295, -2.4321303367614746, -2.3750953674316406, -2.3180606365203857, -2.2610256671905518, -2.203990936279297, -2.146955966949463, -2.089921236038208, -2.032886266708374, -1.9758514165878296, -1.9188165664672852, -1.8617817163467407, -1.8047468662261963, -1.7477120161056519, -1.6906771659851074, -1.633642315864563, -1.576607584953308, -1.5195727348327637, -1.4625378847122192, -1.4055030345916748, -1.3484681844711304, -1.291433334350586, -1.2343984842300415, -1.177363634109497, -1.1203287839889526, -1.0632939338684082, -1.0062590837478638, -0.9492242336273193, -0.8921893835067749, -0.8351545333862305, -0.778119683265686, -0.7210848331451416, -0.6640499830245972, -0.6070151329040527, -0.5499802827835083, -0.49294543266296387, -0.43591058254241943, -0.3788757622241974, -0.32184091210365295, -0.2648060619831085, -0.20777124166488647, -0.15073639154434204, -0.0937015488743782, -0.03666670620441437, 0.020368143916130066, 0.0774029791355133, 0.13443782925605774, 0.19147267937660217, 0.2485075294971466, 0.30554237961769104, 0.3625772297382355, 0.4196120500564575, 0.47664690017700195, 0.5336817502975464, 0.5907166004180908, 0.6477514505386353, 0.7047863006591797]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 5.0, 8.0, 12.0, 9.0, 20.0, 31.0, 15.0, 25.0, 27.0, 40.0, 35.0, 45.0, 42.0, 53.0, 42.0, 43.0, 47.0, 58.0, 58.0, 56.0, 53.0, 31.0, 25.0, 34.0, 24.0, 27.0, 22.0, 29.0, 16.0, 19.0, 9.0, 4.0, 10.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.24442321062088013, -0.23671577870845795, -0.22900836169719696, -0.22130092978477478, -0.2135934978723526, -0.20588606595993042, -0.19817864894866943, -0.19047121703624725, -0.18276378512382507, -0.1750563532114029, -0.1673489362001419, -0.15964150428771973, -0.15193407237529755, -0.14422664046287537, -0.13651922345161438, -0.1288117915391922, -0.12110437452793121, -0.11339695006608963, -0.10568951815366745, -0.09798209369182587, -0.09027466177940369, -0.0825672373175621, -0.07485981285572052, -0.06715238094329834, -0.05944495648145676, -0.051737528294324875, -0.04403010010719299, -0.03632267564535141, -0.028615247458219528, -0.020907819271087646, -0.013200394809246063, -0.0054929666221141815, 0.0022144615650177, 0.009921888820827007, 0.017629316076636314, 0.025336742401123047, 0.03304417058825493, 0.04075159877538681, 0.048459023237228394, 0.056166451424360275, 0.06387387961149216, 0.07158130407333374, 0.07928873598575592, 0.0869961604475975, 0.09470358490943909, 0.10241101682186127, 0.11011844128370285, 0.11782586574554443, 0.1255332976579666, 0.1332407295703888, 0.14094814658164978, 0.14865557849407196, 0.15636301040649414, 0.16407042741775513, 0.1717778593301773, 0.1794852912425995, 0.18719270825386047, 0.19490014016628265, 0.20260755717754364, 0.21031498908996582, 0.218022421002388, 0.22572985291481018, 0.23343726992607117, 0.24114470183849335, 0.24885213375091553]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 12.0, 7.0, 14.0, 9.0, 14.0, 12.0, 27.0, 11.0, 29.0, 29.0, 24.0, 39.0, 33.0, 34.0, 31.0, 31.0, 33.0, 49.0, 35.0, 45.0, 45.0, 44.0, 39.0, 45.0, 27.0, 29.0, 27.0, 27.0, 22.0, 24.0, 20.0, 14.0, 17.0, 18.0, 16.0, 10.0, 9.0, 11.0, 8.0, 12.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.39453125, -6.18206787109375, -5.9696044921875, -5.75714111328125, -5.544677734375, -5.33221435546875, -5.1197509765625, -4.90728759765625, -4.69482421875, -4.48236083984375, -4.2698974609375, -4.05743408203125, -3.844970703125, -3.63250732421875, -3.4200439453125, -3.20758056640625, -2.9951171875, -2.78265380859375, -2.5701904296875, -2.35772705078125, -2.145263671875, -1.93280029296875, -1.7203369140625, -1.50787353515625, -1.29541015625, -1.08294677734375, -0.8704833984375, -0.65802001953125, -0.445556640625, -0.23309326171875, -0.0206298828125, 0.19183349609375, 0.404296875, 0.61676025390625, 0.8292236328125, 1.04168701171875, 1.254150390625, 1.46661376953125, 1.6790771484375, 1.89154052734375, 2.10400390625, 2.31646728515625, 2.5289306640625, 2.74139404296875, 2.953857421875, 3.16632080078125, 3.3787841796875, 3.59124755859375, 3.8037109375, 4.01617431640625, 4.2286376953125, 4.44110107421875, 4.653564453125, 4.86602783203125, 5.0784912109375, 5.29095458984375, 5.50341796875, 5.71588134765625, 5.9283447265625, 6.14080810546875, 6.353271484375, 6.56573486328125, 6.7781982421875, 6.99066162109375, 7.203125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 11.0, 13.0, 16.0, 23.0, 23.0, 50.0, 84.0, 113.0, 168.0, 230.0, 381.0, 634.0, 974.0, 1675.0, 2699.0, 4613.0, 8109.0, 14779.0, 27540.0, 55232.0, 110686.0, 230734.0, 303823.0, 140247.0, 69355.0, 34625.0, 18168.0, 9661.0, 5542.0, 3136.0, 1915.0, 1197.0, 724.0, 492.0, 313.0, 192.0, 120.0, 75.0, 57.0, 40.0, 29.0, 23.0, 14.0, 11.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.50390625, -7.2706298828125, -7.037353515625, -6.8040771484375, -6.57080078125, -6.3375244140625, -6.104248046875, -5.8709716796875, -5.6376953125, -5.4044189453125, -5.171142578125, -4.9378662109375, -4.70458984375, -4.4713134765625, -4.238037109375, -4.0047607421875, -3.771484375, -3.5382080078125, -3.304931640625, -3.0716552734375, -2.83837890625, -2.6051025390625, -2.371826171875, -2.1385498046875, -1.9052734375, -1.6719970703125, -1.438720703125, -1.2054443359375, -0.97216796875, -0.7388916015625, -0.505615234375, -0.2723388671875, -0.0390625, 0.1942138671875, 0.427490234375, 0.6607666015625, 0.89404296875, 1.1273193359375, 1.360595703125, 1.5938720703125, 1.8271484375, 2.0604248046875, 2.293701171875, 2.5269775390625, 2.76025390625, 2.9935302734375, 3.226806640625, 3.4600830078125, 3.693359375, 3.9266357421875, 4.159912109375, 4.3931884765625, 4.62646484375, 4.8597412109375, 5.093017578125, 5.3262939453125, 5.5595703125, 5.7928466796875, 6.026123046875, 6.2593994140625, 6.49267578125, 6.7259521484375, 6.959228515625, 7.1925048828125, 7.42578125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 2.0, 3.0, 7.0, 12.0, 8.0, 9.0, 14.0, 12.0, 16.0, 18.0, 21.0, 25.0, 27.0, 32.0, 32.0, 37.0, 50.0, 41.0, 67.0, 123.0, 230.0, 1434.0, 245.0, 142.0, 83.0, 56.0, 52.0, 32.0, 26.0, 35.0, 33.0, 20.0, 12.0, 18.0, 9.0, 18.0, 6.0, 8.0, 7.0, 6.0, 6.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.75, -26.97265625, -26.1953125, -25.41796875, -24.640625, -23.86328125, -23.0859375, -22.30859375, -21.53125, -20.75390625, -19.9765625, -19.19921875, -18.421875, -17.64453125, -16.8671875, -16.08984375, -15.3125, -14.53515625, -13.7578125, -12.98046875, -12.203125, -11.42578125, -10.6484375, -9.87109375, -9.09375, -8.31640625, -7.5390625, -6.76171875, -5.984375, -5.20703125, -4.4296875, -3.65234375, -2.875, -2.09765625, -1.3203125, -0.54296875, 0.234375, 1.01171875, 1.7890625, 2.56640625, 3.34375, 4.12109375, 4.8984375, 5.67578125, 6.453125, 7.23046875, 8.0078125, 8.78515625, 9.5625, 10.33984375, 11.1171875, 11.89453125, 12.671875, 13.44921875, 14.2265625, 15.00390625, 15.78125, 16.55859375, 17.3359375, 18.11328125, 18.890625, 19.66796875, 20.4453125, 21.22265625, 22.0]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 12.0, 15.0, 12.0, 21.0, 21.0, 29.0, 34.0, 29.0, 54.0, 66.0, 86.0, 163.0, 193.0, 358.0, 690.0, 2098.0, 26633.0, 2907558.0, 200929.0, 4269.0, 1021.0, 442.0, 252.0, 182.0, 119.0, 99.0, 63.0, 55.0, 39.0, 27.0, 20.0, 29.0, 21.0, 13.0, 11.0, 9.0, 8.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.21875, -46.41259765625, -44.6064453125, -42.80029296875, -40.994140625, -39.18798828125, -37.3818359375, -35.57568359375, -33.76953125, -31.96337890625, -30.1572265625, -28.35107421875, -26.544921875, -24.73876953125, -22.9326171875, -21.12646484375, -19.3203125, -17.51416015625, -15.7080078125, -13.90185546875, -12.095703125, -10.28955078125, -8.4833984375, -6.67724609375, -4.87109375, -3.06494140625, -1.2587890625, 0.54736328125, 2.353515625, 4.15966796875, 5.9658203125, 7.77197265625, 9.578125, 11.38427734375, 13.1904296875, 14.99658203125, 16.802734375, 18.60888671875, 20.4150390625, 22.22119140625, 24.02734375, 25.83349609375, 27.6396484375, 29.44580078125, 31.251953125, 33.05810546875, 34.8642578125, 36.67041015625, 38.4765625, 40.28271484375, 42.0888671875, 43.89501953125, 45.701171875, 47.50732421875, 49.3134765625, 51.11962890625, 52.92578125, 54.73193359375, 56.5380859375, 58.34423828125, 60.150390625, 61.95654296875, 63.7626953125, 65.56884765625, 67.375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 20.0, 32.0, 54.0, 102.0, 128.0, 133.0, 128.0, 133.0, 116.0, 77.0, 43.0, 24.0, 9.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.1012077331543, -61.44902038574219, -59.796836853027344, -58.144649505615234, -56.492462158203125, -54.840274810791016, -53.188087463378906, -51.53590393066406, -49.88371658325195, -48.231529235839844, -46.579345703125, -44.92715835571289, -43.27497100830078, -41.62278366088867, -39.97059631347656, -38.31841278076172, -36.66622543334961, -35.0140380859375, -33.361854553222656, -31.709667205810547, -30.057479858398438, -28.405292510986328, -26.75310707092285, -25.100921630859375, -23.448734283447266, -21.796546936035156, -20.14436149597168, -18.492176055908203, -16.839988708496094, -15.1878023147583, -13.535615921020508, -11.883429527282715, -10.231239318847656, -8.579052925109863, -6.92686653137207, -5.274680137634277, -3.6224937438964844, -1.9703073501586914, -0.31812095642089844, 1.3340654373168945, 2.9862518310546875, 4.6384382247924805, 6.290624618530273, 7.942811012268066, 9.59499740600586, 11.247183799743652, 12.899370193481445, 14.551556587219238, 16.20374298095703, 17.85593032836914, 19.508115768432617, 21.160301208496094, 22.812488555908203, 24.464675903320312, 26.11686134338379, 27.769046783447266, 29.421234130859375, 31.073421478271484, 32.725608825683594, 34.37779235839844, 36.02997970581055, 37.682167053222656, 39.3343505859375, 40.98653793334961, 42.63872528076172]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 2.0, 4.0, 9.0, 5.0, 5.0, 10.0, 11.0, 12.0, 15.0, 26.0, 19.0, 27.0, 26.0, 33.0, 25.0, 32.0, 31.0, 25.0, 40.0, 31.0, 38.0, 42.0, 38.0, 47.0, 36.0, 36.0, 34.0, 38.0, 40.0, 30.0, 26.0, 20.0, 25.0, 19.0, 24.0, 18.0, 17.0, 13.0, 9.0, 11.0, 13.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.78588104248047, -57.76874923706055, -55.751617431640625, -53.73448944091797, -51.71735763549805, -49.700225830078125, -47.68309783935547, -45.66596603393555, -43.648834228515625, -41.6317024230957, -39.61457061767578, -37.597442626953125, -35.5803108215332, -33.56317901611328, -31.546049118041992, -29.528919219970703, -27.51178741455078, -25.49465560913086, -23.47752571105957, -21.46039581298828, -19.44326400756836, -17.426132202148438, -15.409002304077148, -13.391871452331543, -11.374740600585938, -9.357609748840332, -7.340478897094727, -5.323348045349121, -3.3062171936035156, -1.2890863418579102, 0.7280445098876953, 2.745175361633301, 4.7623138427734375, 6.779444694519043, 8.796575546264648, 10.813706398010254, 12.83083724975586, 14.847968101501465, 16.86509895324707, 18.88222885131836, 20.89936065673828, 22.916492462158203, 24.933622360229492, 26.95075225830078, 28.967884063720703, 30.985015869140625, 33.00214385986328, 35.0192756652832, 37.036407470703125, 39.05353927612305, 41.07067108154297, 43.087799072265625, 45.10493087768555, 47.12206268310547, 49.139190673828125, 51.15632247924805, 53.17345428466797, 55.19058609008789, 57.20771789550781, 59.22484588623047, 61.24197769165039, 63.25910949707031, 65.27623748779297, 67.29337310791016, 69.31050109863281]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 6.0, 11.0, 8.0, 11.0, 13.0, 10.0, 22.0, 18.0, 25.0, 22.0, 22.0, 35.0, 16.0, 27.0, 26.0, 37.0, 37.0, 36.0, 34.0, 39.0, 27.0, 41.0, 38.0, 43.0, 34.0, 38.0, 37.0, 27.0, 25.0, 22.0, 28.0, 22.0, 25.0, 24.0, 13.0, 21.0, 10.0, 13.0, 7.0, 8.0, 9.0, 5.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.72265625, -6.50390625, -6.28515625, -6.06640625, -5.84765625, -5.62890625, -5.41015625, -5.19140625, -4.97265625, -4.75390625, -4.53515625, -4.31640625, -4.09765625, -3.87890625, -3.66015625, -3.44140625, -3.22265625, -3.00390625, -2.78515625, -2.56640625, -2.34765625, -2.12890625, -1.91015625, -1.69140625, -1.47265625, -1.25390625, -1.03515625, -0.81640625, -0.59765625, -0.37890625, -0.16015625, 0.05859375, 0.27734375, 0.49609375, 0.71484375, 0.93359375, 1.15234375, 1.37109375, 1.58984375, 1.80859375, 2.02734375, 2.24609375, 2.46484375, 2.68359375, 2.90234375, 3.12109375, 3.33984375, 3.55859375, 3.77734375, 3.99609375, 4.21484375, 4.43359375, 4.65234375, 4.87109375, 5.08984375, 5.30859375, 5.52734375, 5.74609375, 5.96484375, 6.18359375, 6.40234375, 6.62109375, 6.83984375, 7.05859375, 7.27734375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 2.0, 12.0, 11.0, 16.0, 21.0, 26.0, 36.0, 40.0, 57.0, 88.0, 121.0, 188.0, 328.0, 612.0, 1427.0, 3658.0, 9900.0, 31399.0, 102910.0, 345180.0, 997405.0, 1512862.0, 809540.0, 263598.0, 78152.0, 23734.0, 7749.0, 2739.0, 1109.0, 531.0, 268.0, 162.0, 112.0, 66.0, 48.0, 34.0, 28.0, 22.0, 11.0, 15.0, 12.0, 10.0, 6.0, 1.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.421875, -9.0899658203125, -8.758056640625, -8.4261474609375, -8.09423828125, -7.7623291015625, -7.430419921875, -7.0985107421875, -6.7666015625, -6.4346923828125, -6.102783203125, -5.7708740234375, -5.43896484375, -5.1070556640625, -4.775146484375, -4.4432373046875, -4.111328125, -3.7794189453125, -3.447509765625, -3.1156005859375, -2.78369140625, -2.4517822265625, -2.119873046875, -1.7879638671875, -1.4560546875, -1.1241455078125, -0.792236328125, -0.4603271484375, -0.12841796875, 0.2034912109375, 0.535400390625, 0.8673095703125, 1.19921875, 1.5311279296875, 1.863037109375, 2.1949462890625, 2.52685546875, 2.8587646484375, 3.190673828125, 3.5225830078125, 3.8544921875, 4.1864013671875, 4.518310546875, 4.8502197265625, 5.18212890625, 5.5140380859375, 5.845947265625, 6.1778564453125, 6.509765625, 6.8416748046875, 7.173583984375, 7.5054931640625, 7.83740234375, 8.1693115234375, 8.501220703125, 8.8331298828125, 9.1650390625, 9.4969482421875, 9.828857421875, 10.1607666015625, 10.49267578125, 10.8245849609375, 11.156494140625, 11.4884033203125, 11.8203125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 8.0, 6.0, 8.0, 9.0, 10.0, 11.0, 11.0, 17.0, 31.0, 41.0, 46.0, 54.0, 79.0, 95.0, 118.0, 164.0, 172.0, 205.0, 251.0, 304.0, 332.0, 335.0, 336.0, 277.0, 249.0, 188.0, 157.0, 134.0, 93.0, 62.0, 61.0, 48.0, 43.0, 29.0, 19.0, 16.0, 18.0, 7.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.1490478515625, -9.774658203125, -9.4002685546875, -9.02587890625, -8.6514892578125, -8.277099609375, -7.9027099609375, -7.5283203125, -7.1539306640625, -6.779541015625, -6.4051513671875, -6.03076171875, -5.6563720703125, -5.281982421875, -4.9075927734375, -4.533203125, -4.1588134765625, -3.784423828125, -3.4100341796875, -3.03564453125, -2.6612548828125, -2.286865234375, -1.9124755859375, -1.5380859375, -1.1636962890625, -0.789306640625, -0.4149169921875, -0.04052734375, 0.3338623046875, 0.708251953125, 1.0826416015625, 1.45703125, 1.8314208984375, 2.205810546875, 2.5802001953125, 2.95458984375, 3.3289794921875, 3.703369140625, 4.0777587890625, 4.4521484375, 4.8265380859375, 5.200927734375, 5.5753173828125, 5.94970703125, 6.3240966796875, 6.698486328125, 7.0728759765625, 7.447265625, 7.8216552734375, 8.196044921875, 8.5704345703125, 8.94482421875, 9.3192138671875, 9.693603515625, 10.0679931640625, 10.4423828125, 10.8167724609375, 11.191162109375, 11.5655517578125, 11.93994140625, 12.3143310546875, 12.688720703125, 13.0631103515625, 13.4375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 6.0, 12.0, 9.0, 12.0, 17.0, 16.0, 28.0, 32.0, 49.0, 60.0, 63.0, 90.0, 135.0, 169.0, 200.0, 331.0, 687.0, 12201.0, 1113209.0, 3016971.0, 47412.0, 1215.0, 335.0, 233.0, 189.0, 143.0, 83.0, 84.0, 66.0, 50.0, 36.0, 25.0, 26.0, 13.0, 10.0, 12.0, 8.0, 10.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-59.125, -57.48974609375, -55.8544921875, -54.21923828125, -52.583984375, -50.94873046875, -49.3134765625, -47.67822265625, -46.04296875, -44.40771484375, -42.7724609375, -41.13720703125, -39.501953125, -37.86669921875, -36.2314453125, -34.59619140625, -32.9609375, -31.32568359375, -29.6904296875, -28.05517578125, -26.419921875, -24.78466796875, -23.1494140625, -21.51416015625, -19.87890625, -18.24365234375, -16.6083984375, -14.97314453125, -13.337890625, -11.70263671875, -10.0673828125, -8.43212890625, -6.796875, -5.16162109375, -3.5263671875, -1.89111328125, -0.255859375, 1.37939453125, 3.0146484375, 4.64990234375, 6.28515625, 7.92041015625, 9.5556640625, 11.19091796875, 12.826171875, 14.46142578125, 16.0966796875, 17.73193359375, 19.3671875, 21.00244140625, 22.6376953125, 24.27294921875, 25.908203125, 27.54345703125, 29.1787109375, 30.81396484375, 32.44921875, 34.08447265625, 35.7197265625, 37.35498046875, 38.990234375, 40.62548828125, 42.2607421875, 43.89599609375, 45.53125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 14.0, 23.0, 52.0, 50.0, 85.0, 97.0, 116.0, 137.0, 131.0, 102.0, 88.0, 41.0, 26.0, 22.0, 8.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.75456237792969, -95.06242370605469, -92.37027740478516, -89.67813110351562, -86.98599243164062, -84.29385375976562, -81.6017074584961, -78.90956115722656, -76.21742248535156, -73.52528381347656, -70.83313751220703, -68.1409912109375, -65.4488525390625, -62.756710052490234, -60.06456756591797, -57.3724250793457, -54.68028259277344, -51.98814010620117, -49.295997619628906, -46.60385513305664, -43.911712646484375, -41.21957015991211, -38.527427673339844, -35.83528518676758, -33.14314270019531, -30.451000213623047, -27.75885772705078, -25.066715240478516, -22.37457275390625, -19.682430267333984, -16.99028778076172, -14.298145294189453, -11.606010437011719, -8.913867950439453, -6.2217254638671875, -3.529582977294922, -0.8374404907226562, 1.8547019958496094, 4.546844482421875, 7.238986968994141, 9.931129455566406, 12.623271942138672, 15.315414428710938, 18.007556915283203, 20.69969940185547, 23.391841888427734, 26.083984375, 28.776126861572266, 31.46826934814453, 34.1604118347168, 36.85255432128906, 39.54469680786133, 42.236839294433594, 44.92898178100586, 47.621124267578125, 50.31326675415039, 53.005409240722656, 55.69755172729492, 58.38969421386719, 61.08183670043945, 63.77397918701172, 66.46612548828125, 69.15826416015625, 71.85040283203125, 74.54254913330078]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 6.0, 8.0, 4.0, 17.0, 11.0, 18.0, 19.0, 26.0, 18.0, 21.0, 32.0, 36.0, 31.0, 40.0, 37.0, 39.0, 35.0, 46.0, 47.0, 50.0, 35.0, 47.0, 39.0, 43.0, 42.0, 31.0, 38.0, 27.0, 19.0, 28.0, 20.0, 22.0, 15.0, 13.0, 9.0, 9.0, 5.0, 5.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0], "bins": [-65.33230590820312, -63.650184631347656, -61.96806716918945, -60.28594970703125, -58.60382843017578, -56.92170715332031, -55.23958969116211, -53.557472229003906, -51.87535095214844, -50.19322967529297, -48.511112213134766, -46.82899475097656, -45.146873474121094, -43.464752197265625, -41.78263473510742, -40.10051727294922, -38.41839599609375, -36.73627471923828, -35.05415725708008, -33.372039794921875, -31.689918518066406, -30.00779914855957, -28.325679779052734, -26.6435604095459, -24.961441040039062, -23.279321670532227, -21.59720230102539, -19.915082931518555, -18.23296356201172, -16.550844192504883, -14.868724822998047, -13.186605453491211, -11.50448989868164, -9.822370529174805, -8.140251159667969, -6.458131790161133, -4.776012420654297, -3.093893051147461, -1.411773681640625, 0.27034568786621094, 1.9524650573730469, 3.634584426879883, 5.316703796386719, 6.998823165893555, 8.68094253540039, 10.363061904907227, 12.045181274414062, 13.727300643920898, 15.409420013427734, 17.09153938293457, 18.773658752441406, 20.455778121948242, 22.137897491455078, 23.820016860961914, 25.50213623046875, 27.184255599975586, 28.866374969482422, 30.548494338989258, 32.230613708496094, 33.91273498535156, 35.594852447509766, 37.27696990966797, 38.95909118652344, 40.641212463378906, 42.32332992553711]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 12.0, 10.0, 8.0, 10.0, 16.0, 14.0, 17.0, 24.0, 23.0, 42.0, 42.0, 29.0, 30.0, 37.0, 45.0, 42.0, 36.0, 39.0, 25.0, 31.0, 37.0, 39.0, 36.0, 41.0, 29.0, 26.0, 26.0, 25.0, 24.0, 34.0, 18.0, 14.0, 13.0, 22.0, 17.0, 10.0, 8.0, 7.0, 4.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-6.33203125, -6.12579345703125, -5.9195556640625, -5.71331787109375, -5.507080078125, -5.30084228515625, -5.0946044921875, -4.88836669921875, -4.68212890625, -4.47589111328125, -4.2696533203125, -4.06341552734375, -3.857177734375, -3.65093994140625, -3.4447021484375, -3.23846435546875, -3.0322265625, -2.82598876953125, -2.6197509765625, -2.41351318359375, -2.207275390625, -2.00103759765625, -1.7947998046875, -1.58856201171875, -1.38232421875, -1.17608642578125, -0.9698486328125, -0.76361083984375, -0.557373046875, -0.35113525390625, -0.1448974609375, 0.06134033203125, 0.267578125, 0.47381591796875, 0.6800537109375, 0.88629150390625, 1.092529296875, 1.29876708984375, 1.5050048828125, 1.71124267578125, 1.91748046875, 2.12371826171875, 2.3299560546875, 2.53619384765625, 2.742431640625, 2.94866943359375, 3.1549072265625, 3.36114501953125, 3.5673828125, 3.77362060546875, 3.9798583984375, 4.18609619140625, 4.392333984375, 4.59857177734375, 4.8048095703125, 5.01104736328125, 5.21728515625, 5.42352294921875, 5.6297607421875, 5.83599853515625, 6.042236328125, 6.24847412109375, 6.4547119140625, 6.66094970703125, 6.8671875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 14.0, 16.0, 32.0, 25.0, 40.0, 63.0, 64.0, 113.0, 165.0, 194.0, 330.0, 465.0, 745.0, 1151.0, 1877.0, 2999.0, 4801.0, 8062.0, 13157.0, 21919.0, 35319.0, 55871.0, 82519.0, 115024.0, 141387.0, 148353.0, 128880.0, 98715.0, 68794.0, 44871.0, 27948.0, 17342.0, 10508.0, 6295.0, 3850.0, 2346.0, 1467.0, 927.0, 648.0, 365.0, 264.0, 186.0, 121.0, 91.0, 69.0, 35.0, 42.0, 27.0, 15.0, 11.0, 13.0, 8.0, 3.0, 3.0, 3.0], "bins": [-1.654296875, -1.6060028076171875, -1.557708740234375, -1.5094146728515625, -1.46112060546875, -1.4128265380859375, -1.364532470703125, -1.3162384033203125, -1.2679443359375, -1.2196502685546875, -1.171356201171875, -1.1230621337890625, -1.07476806640625, -1.0264739990234375, -0.978179931640625, -0.9298858642578125, -0.881591796875, -0.8332977294921875, -0.785003662109375, -0.7367095947265625, -0.68841552734375, -0.6401214599609375, -0.591827392578125, -0.5435333251953125, -0.4952392578125, -0.4469451904296875, -0.398651123046875, -0.3503570556640625, -0.30206298828125, -0.2537689208984375, -0.205474853515625, -0.1571807861328125, -0.10888671875, -0.0605926513671875, -0.012298583984375, 0.0359954833984375, 0.08428955078125, 0.1325836181640625, 0.180877685546875, 0.2291717529296875, 0.2774658203125, 0.3257598876953125, 0.374053955078125, 0.4223480224609375, 0.47064208984375, 0.5189361572265625, 0.567230224609375, 0.6155242919921875, 0.663818359375, 0.7121124267578125, 0.760406494140625, 0.8087005615234375, 0.85699462890625, 0.9052886962890625, 0.953582763671875, 1.0018768310546875, 1.0501708984375, 1.0984649658203125, 1.146759033203125, 1.1950531005859375, 1.24334716796875, 1.2916412353515625, 1.339935302734375, 1.3882293701171875, 1.4365234375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 3.0, 11.0, 7.0, 11.0, 23.0, 13.0, 25.0, 17.0, 22.0, 24.0, 31.0, 20.0, 29.0, 39.0, 44.0, 29.0, 32.0, 37.0, 1058.0, 39.0, 51.0, 33.0, 50.0, 36.0, 33.0, 38.0, 27.0, 31.0, 31.0, 32.0, 24.0, 20.0, 16.0, 16.0, 13.0, 14.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5406494140625, -4.378173828125, -4.2156982421875, -4.05322265625, -3.8907470703125, -3.728271484375, -3.5657958984375, -3.4033203125, -3.2408447265625, -3.078369140625, -2.9158935546875, -2.75341796875, -2.5909423828125, -2.428466796875, -2.2659912109375, -2.103515625, -1.9410400390625, -1.778564453125, -1.6160888671875, -1.45361328125, -1.2911376953125, -1.128662109375, -0.9661865234375, -0.8037109375, -0.6412353515625, -0.478759765625, -0.3162841796875, -0.15380859375, 0.0086669921875, 0.171142578125, 0.3336181640625, 0.49609375, 0.6585693359375, 0.821044921875, 0.9835205078125, 1.14599609375, 1.3084716796875, 1.470947265625, 1.6334228515625, 1.7958984375, 1.9583740234375, 2.120849609375, 2.2833251953125, 2.44580078125, 2.6082763671875, 2.770751953125, 2.9332275390625, 3.095703125, 3.2581787109375, 3.420654296875, 3.5831298828125, 3.74560546875, 3.9080810546875, 4.070556640625, 4.2330322265625, 4.3955078125, 4.5579833984375, 4.720458984375, 4.8829345703125, 5.04541015625, 5.2078857421875, 5.370361328125, 5.5328369140625, 5.6953125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 18.0, 26.0, 38.0, 61.0, 90.0, 143.0, 233.0, 303.0, 509.0, 798.0, 1358.0, 2108.0, 3304.0, 5068.0, 8388.0, 13454.0, 22010.0, 39244.0, 1871751.0, 57849.0, 27143.0, 16328.0, 9940.0, 6246.0, 4000.0, 2496.0, 1560.0, 941.0, 630.0, 409.0, 247.0, 148.0, 96.0, 67.0, 33.0, 23.0, 21.0, 15.0, 7.0, 7.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08203125, -2.993194580078125, -2.90435791015625, -2.815521240234375, -2.7266845703125, -2.637847900390625, -2.54901123046875, -2.460174560546875, -2.371337890625, -2.282501220703125, -2.19366455078125, -2.104827880859375, -2.0159912109375, -1.927154541015625, -1.83831787109375, -1.749481201171875, -1.66064453125, -1.571807861328125, -1.48297119140625, -1.394134521484375, -1.3052978515625, -1.216461181640625, -1.12762451171875, -1.038787841796875, -0.949951171875, -0.861114501953125, -0.77227783203125, -0.683441162109375, -0.5946044921875, -0.505767822265625, -0.41693115234375, -0.328094482421875, -0.2392578125, -0.150421142578125, -0.06158447265625, 0.027252197265625, 0.1160888671875, 0.204925537109375, 0.29376220703125, 0.382598876953125, 0.471435546875, 0.560272216796875, 0.64910888671875, 0.737945556640625, 0.8267822265625, 0.915618896484375, 1.00445556640625, 1.093292236328125, 1.18212890625, 1.270965576171875, 1.35980224609375, 1.448638916015625, 1.5374755859375, 1.626312255859375, 1.71514892578125, 1.803985595703125, 1.892822265625, 1.981658935546875, 2.07049560546875, 2.159332275390625, 2.2481689453125, 2.337005615234375, 2.42584228515625, 2.514678955078125, 2.603515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 10.0, 8.0, 14.0, 10.0, 14.0, 28.0, 37.0, 21.0, 36.0, 45.0, 50.0, 41.0, 59.0, 64.0, 75.0, 52.0, 76.0, 58.0, 51.0, 34.0, 37.0, 28.0, 24.0, 24.0, 28.0, 17.0, 12.0, 9.0, 8.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1380615234375, -0.13410091400146484, -0.1301403045654297, -0.12617969512939453, -0.12221908569335938, -0.11825847625732422, -0.11429786682128906, -0.1103372573852539, -0.10637664794921875, -0.1024160385131836, -0.09845542907714844, -0.09449481964111328, -0.09053421020507812, -0.08657360076904297, -0.08261299133300781, -0.07865238189697266, -0.0746917724609375, -0.07073116302490234, -0.06677055358886719, -0.06280994415283203, -0.058849334716796875, -0.05488872528076172, -0.05092811584472656, -0.046967506408691406, -0.04300689697265625, -0.039046287536621094, -0.03508567810058594, -0.03112506866455078, -0.027164459228515625, -0.02320384979248047, -0.019243240356445312, -0.015282630920410156, -0.011322021484375, -0.007361412048339844, -0.0034008026123046875, 0.0005598068237304688, 0.004520416259765625, 0.008481025695800781, 0.012441635131835938, 0.016402244567871094, 0.02036285400390625, 0.024323463439941406, 0.028284072875976562, 0.03224468231201172, 0.036205291748046875, 0.04016590118408203, 0.04412651062011719, 0.048087120056152344, 0.0520477294921875, 0.056008338928222656, 0.05996894836425781, 0.06392955780029297, 0.06789016723632812, 0.07185077667236328, 0.07581138610839844, 0.0797719955444336, 0.08373260498046875, 0.0876932144165039, 0.09165382385253906, 0.09561443328857422, 0.09957504272460938, 0.10353565216064453, 0.10749626159667969, 0.11145687103271484, 0.11541748046875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 4.0, 5.0, 10.0, 5.0, 19.0, 19.0, 20.0, 24.0, 29.0, 39.0, 54.0, 84.0, 137.0, 254.0, 876.0, 121195.0, 923703.0, 1214.0, 316.0, 165.0, 97.0, 61.0, 48.0, 33.0, 30.0, 27.0, 20.0, 13.0, 9.0, 8.0, 11.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5859375, -2.497100830078125, -2.40826416015625, -2.319427490234375, -2.2305908203125, -2.141754150390625, -2.05291748046875, -1.964080810546875, -1.875244140625, -1.786407470703125, -1.69757080078125, -1.608734130859375, -1.5198974609375, -1.431060791015625, -1.34222412109375, -1.253387451171875, -1.16455078125, -1.075714111328125, -0.98687744140625, -0.898040771484375, -0.8092041015625, -0.720367431640625, -0.63153076171875, -0.542694091796875, -0.453857421875, -0.365020751953125, -0.27618408203125, -0.187347412109375, -0.0985107421875, -0.009674072265625, 0.07916259765625, 0.167999267578125, 0.2568359375, 0.345672607421875, 0.43450927734375, 0.523345947265625, 0.6121826171875, 0.701019287109375, 0.78985595703125, 0.878692626953125, 0.967529296875, 1.056365966796875, 1.14520263671875, 1.234039306640625, 1.3228759765625, 1.411712646484375, 1.50054931640625, 1.589385986328125, 1.67822265625, 1.767059326171875, 1.85589599609375, 1.944732666015625, 2.0335693359375, 2.122406005859375, 2.21124267578125, 2.300079345703125, 2.388916015625, 2.477752685546875, 2.56658935546875, 2.655426025390625, 2.7442626953125, 2.833099365234375, 2.92193603515625, 3.010772705078125, 3.099609375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 19.0, 895.0, 101.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.527682304382324, -5.42288064956665, -5.318078994750977, -5.213277339935303, -5.108475685119629, -5.003673553466797, -4.898871898651123, -4.794070243835449, -4.689268589019775, -4.584466934204102, -4.479665279388428, -4.374863624572754, -4.270061492919922, -4.165259838104248, -4.060458183288574, -3.9556565284729004, -3.8508548736572266, -3.7460532188415527, -3.641251564025879, -3.536449670791626, -3.431648015975952, -3.3268463611602783, -3.2220444679260254, -3.1172428131103516, -3.0124411582946777, -2.907639503479004, -2.80283784866333, -2.698035955429077, -2.5932343006134033, -2.4884326457977295, -2.3836307525634766, -2.2788290977478027, -2.17402720451355, -2.069225549697876, -1.9644237756729126, -1.8596220016479492, -1.7548203468322754, -1.6500186920166016, -1.5452169179916382, -1.4404151439666748, -1.335613489151001, -1.2308118343353271, -1.1260100603103638, -1.0212082862854004, -0.9164066314697266, -0.811604917049408, -0.7068032026290894, -0.6020014882087708, -0.49719977378845215, -0.39239805936813354, -0.28759634494781494, -0.18279463052749634, -0.07799291610717773, 0.02680879831314087, 0.13161051273345947, 0.23641222715377808, 0.3412139415740967, 0.4460156559944153, 0.5508173704147339, 0.6556190848350525, 0.7604207992553711, 0.8652225136756897, 0.9700242280960083, 1.0748260021209717, 1.1796276569366455]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 9.0, 14.0, 17.0, 16.0, 18.0, 35.0, 28.0, 36.0, 33.0, 39.0, 37.0, 45.0, 48.0, 54.0, 48.0, 57.0, 45.0, 47.0, 54.0, 49.0, 34.0, 46.0, 26.0, 28.0, 28.0, 21.0, 23.0, 16.0, 5.0, 7.0, 9.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4353649616241455, -0.4198808968067169, -0.4043968617916107, -0.38891279697418213, -0.37342873215675354, -0.35794466733932495, -0.34246063232421875, -0.32697656750679016, -0.3114925026893616, -0.296008437871933, -0.2805244028568268, -0.2650403380393982, -0.2495562732219696, -0.2340722233057022, -0.21858817338943481, -0.20310410857200623, -0.18762007355690002, -0.17213602364063263, -0.15665195882320404, -0.14116790890693665, -0.12568384408950806, -0.11019979417324066, -0.09471574425697327, -0.07923168689012527, -0.06374762952327728, -0.04826357215642929, -0.0327795185148716, -0.017295464873313904, -0.0018114075064659119, 0.01367264986038208, 0.029156699776649475, 0.04464075714349747, 0.06012481451034546, 0.07560887187719345, 0.09109292924404144, 0.10657697916030884, 0.12206103652715683, 0.13754509389400482, 0.15302914381027222, 0.1685132086277008, 0.1839972585439682, 0.1994813084602356, 0.21496537327766418, 0.23044942319393158, 0.24593347311019897, 0.26141753792762756, 0.27690160274505615, 0.29238563776016235, 0.30786970257759094, 0.32335376739501953, 0.33883780241012573, 0.3543218672275543, 0.3698059320449829, 0.3852899670600891, 0.4007740318775177, 0.4162580966949463, 0.4317421317100525, 0.4472261965274811, 0.4627102315425873, 0.47819429636001587, 0.49367836117744446, 0.509162425994873, 0.5246464610099792, 0.5401304960250854, 0.5556145906448364]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 14.0, 13.0, 18.0, 15.0, 27.0, 35.0, 35.0, 33.0, 35.0, 37.0, 44.0, 34.0, 32.0, 43.0, 33.0, 42.0, 43.0, 40.0, 40.0, 41.0, 34.0, 39.0, 36.0, 23.0, 34.0, 19.0, 16.0, 13.0, 21.0, 22.0, 16.0, 11.0, 9.0, 8.0, 4.0, 5.0, 2.0, 1.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.08984375, -6.86700439453125, -6.6441650390625, -6.42132568359375, -6.198486328125, -5.97564697265625, -5.7528076171875, -5.52996826171875, -5.30712890625, -5.08428955078125, -4.8614501953125, -4.63861083984375, -4.415771484375, -4.19293212890625, -3.9700927734375, -3.74725341796875, -3.5244140625, -3.30157470703125, -3.0787353515625, -2.85589599609375, -2.633056640625, -2.41021728515625, -2.1873779296875, -1.96453857421875, -1.74169921875, -1.51885986328125, -1.2960205078125, -1.07318115234375, -0.850341796875, -0.62750244140625, -0.4046630859375, -0.18182373046875, 0.041015625, 0.26385498046875, 0.4866943359375, 0.70953369140625, 0.932373046875, 1.15521240234375, 1.3780517578125, 1.60089111328125, 1.82373046875, 2.04656982421875, 2.2694091796875, 2.49224853515625, 2.715087890625, 2.93792724609375, 3.1607666015625, 3.38360595703125, 3.6064453125, 3.82928466796875, 4.0521240234375, 4.27496337890625, 4.497802734375, 4.72064208984375, 4.9434814453125, 5.16632080078125, 5.38916015625, 5.61199951171875, 5.8348388671875, 6.05767822265625, 6.280517578125, 6.50335693359375, 6.7261962890625, 6.94903564453125, 7.171875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 9.0, 6.0, 15.0, 12.0, 24.0, 27.0, 35.0, 58.0, 87.0, 123.0, 199.0, 320.0, 431.0, 791.0, 1284.0, 2481.0, 4109.0, 7437.0, 14146.0, 27980.0, 59229.0, 130753.0, 306107.0, 272113.0, 114537.0, 52364.0, 24997.0, 12740.0, 6954.0, 3857.0, 2117.0, 1170.0, 761.0, 471.0, 275.0, 147.0, 118.0, 79.0, 47.0, 33.0, 28.0, 27.0, 19.0, 11.0, 8.0, 8.0, 1.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.828125, -8.56787109375, -8.3076171875, -8.04736328125, -7.787109375, -7.52685546875, -7.2666015625, -7.00634765625, -6.74609375, -6.48583984375, -6.2255859375, -5.96533203125, -5.705078125, -5.44482421875, -5.1845703125, -4.92431640625, -4.6640625, -4.40380859375, -4.1435546875, -3.88330078125, -3.623046875, -3.36279296875, -3.1025390625, -2.84228515625, -2.58203125, -2.32177734375, -2.0615234375, -1.80126953125, -1.541015625, -1.28076171875, -1.0205078125, -0.76025390625, -0.5, -0.23974609375, 0.0205078125, 0.28076171875, 0.541015625, 0.80126953125, 1.0615234375, 1.32177734375, 1.58203125, 1.84228515625, 2.1025390625, 2.36279296875, 2.623046875, 2.88330078125, 3.1435546875, 3.40380859375, 3.6640625, 3.92431640625, 4.1845703125, 4.44482421875, 4.705078125, 4.96533203125, 5.2255859375, 5.48583984375, 5.74609375, 6.00634765625, 6.2666015625, 6.52685546875, 6.787109375, 7.04736328125, 7.3076171875, 7.56787109375, 7.828125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 4.0, 10.0, 11.0, 19.0, 14.0, 24.0, 28.0, 21.0, 27.0, 35.0, 33.0, 49.0, 53.0, 63.0, 114.0, 180.0, 1366.0, 345.0, 161.0, 72.0, 60.0, 47.0, 39.0, 47.0, 29.0, 25.0, 21.0, 26.0, 28.0, 18.0, 18.0, 12.0, 8.0, 8.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.171875, -26.370849609375, -25.56982421875, -24.768798828125, -23.9677734375, -23.166748046875, -22.36572265625, -21.564697265625, -20.763671875, -19.962646484375, -19.16162109375, -18.360595703125, -17.5595703125, -16.758544921875, -15.95751953125, -15.156494140625, -14.35546875, -13.554443359375, -12.75341796875, -11.952392578125, -11.1513671875, -10.350341796875, -9.54931640625, -8.748291015625, -7.947265625, -7.146240234375, -6.34521484375, -5.544189453125, -4.7431640625, -3.942138671875, -3.14111328125, -2.340087890625, -1.5390625, -0.738037109375, 0.06298828125, 0.864013671875, 1.6650390625, 2.466064453125, 3.26708984375, 4.068115234375, 4.869140625, 5.670166015625, 6.47119140625, 7.272216796875, 8.0732421875, 8.874267578125, 9.67529296875, 10.476318359375, 11.27734375, 12.078369140625, 12.87939453125, 13.680419921875, 14.4814453125, 15.282470703125, 16.08349609375, 16.884521484375, 17.685546875, 18.486572265625, 19.28759765625, 20.088623046875, 20.8896484375, 21.690673828125, 22.49169921875, 23.292724609375, 24.09375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 11.0, 13.0, 9.0, 7.0, 20.0, 28.0, 36.0, 32.0, 41.0, 69.0, 88.0, 142.0, 192.0, 234.0, 444.0, 1404.0, 26214.0, 2938629.0, 173059.0, 3350.0, 662.0, 319.0, 196.0, 125.0, 87.0, 69.0, 62.0, 37.0, 38.0, 27.0, 20.0, 11.0, 8.0, 12.0, 7.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.34375, -45.42626953125, -43.5087890625, -41.59130859375, -39.673828125, -37.75634765625, -35.8388671875, -33.92138671875, -32.00390625, -30.08642578125, -28.1689453125, -26.25146484375, -24.333984375, -22.41650390625, -20.4990234375, -18.58154296875, -16.6640625, -14.74658203125, -12.8291015625, -10.91162109375, -8.994140625, -7.07666015625, -5.1591796875, -3.24169921875, -1.32421875, 0.59326171875, 2.5107421875, 4.42822265625, 6.345703125, 8.26318359375, 10.1806640625, 12.09814453125, 14.015625, 15.93310546875, 17.8505859375, 19.76806640625, 21.685546875, 23.60302734375, 25.5205078125, 27.43798828125, 29.35546875, 31.27294921875, 33.1904296875, 35.10791015625, 37.025390625, 38.94287109375, 40.8603515625, 42.77783203125, 44.6953125, 46.61279296875, 48.5302734375, 50.44775390625, 52.365234375, 54.28271484375, 56.2001953125, 58.11767578125, 60.03515625, 61.95263671875, 63.8701171875, 65.78759765625, 67.705078125, 69.62255859375, 71.5400390625, 73.45751953125, 75.375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 374.0, 643.0], "bins": [-1011.0800170898438, -995.0448608398438, -979.0097045898438, -962.9745483398438, -946.9393920898438, -930.9042358398438, -914.8690795898438, -898.833984375, -882.798828125, -866.763671875, -850.728515625, -834.693359375, -818.658203125, -802.623046875, -786.587890625, -770.552734375, -754.517578125, -738.482421875, -722.447265625, -706.412109375, -690.376953125, -674.341796875, -658.306640625, -642.271484375, -626.236328125, -610.201171875, -594.166015625, -578.130859375, -562.095703125, -546.060546875, -530.025390625, -513.990234375, -497.9551086425781, -481.9199523925781, -465.8847961425781, -449.8496398925781, -433.81451416015625, -417.77935791015625, -401.74420166015625, -385.70904541015625, -369.67388916015625, -353.63873291015625, -337.60357666015625, -321.56842041015625, -305.53326416015625, -289.49810791015625, -273.4629821777344, -257.4278259277344, -241.39268493652344, -225.35752868652344, -209.3223876953125, -193.2872314453125, -177.2520751953125, -161.2169189453125, -145.1817626953125, -129.14662170410156, -113.11146545410156, -97.07630920410156, -81.0411605834961, -65.00601196289062, -48.970855712890625, -32.935699462890625, -16.900550842285156, -0.8654022216796875, 15.169755935668945]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 1.0, 6.0, 6.0, 7.0, 7.0, 8.0, 10.0, 13.0, 13.0, 5.0, 22.0, 27.0, 24.0, 23.0, 25.0, 42.0, 25.0, 33.0, 38.0, 37.0, 40.0, 33.0, 33.0, 39.0, 34.0, 28.0, 37.0, 30.0, 32.0, 37.0, 37.0, 32.0, 26.0, 20.0, 24.0, 22.0, 19.0, 15.0, 15.0, 13.0, 12.0, 6.0, 9.0, 12.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-53.03400802612305, -51.27216720581055, -49.51032638549805, -47.74848556518555, -45.98664474487305, -44.22480392456055, -42.46296691894531, -40.70112609863281, -38.93928527832031, -37.17744445800781, -35.41560363769531, -33.65376281738281, -31.891921997070312, -30.130081176757812, -28.368242263793945, -26.606401443481445, -24.844558715820312, -23.082717895507812, -21.320877075195312, -19.559036254882812, -17.797195434570312, -16.035354614257812, -14.273515701293945, -12.511674880981445, -10.749834060668945, -8.987993240356445, -7.2261528968811035, -5.464312553405762, -3.7024717330932617, -1.9406309127807617, -0.17879104614257812, 1.5830497741699219, 3.3448867797851562, 5.106727600097656, 6.868567943572998, 8.63040828704834, 10.39224910736084, 12.15408992767334, 13.915929794311523, 15.677770614624023, 17.439611434936523, 19.201452255249023, 20.963293075561523, 22.72513198852539, 24.48697280883789, 26.24881362915039, 28.01065444946289, 29.77249526977539, 31.53433609008789, 33.29617691040039, 35.05801773071289, 36.81985855102539, 38.58169937133789, 40.34354019165039, 42.105377197265625, 43.867218017578125, 45.629058837890625, 47.390899658203125, 49.152740478515625, 50.914581298828125, 52.676422119140625, 54.438262939453125, 56.200103759765625, 57.961944580078125, 59.723785400390625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 10.0, 13.0, 13.0, 10.0, 16.0, 22.0, 23.0, 24.0, 35.0, 27.0, 34.0, 46.0, 39.0, 34.0, 38.0, 28.0, 32.0, 41.0, 48.0, 45.0, 38.0, 34.0, 29.0, 37.0, 31.0, 33.0, 28.0, 21.0, 21.0, 27.0, 20.0, 14.0, 15.0, 8.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.69921875, -6.46685791015625, -6.2344970703125, -6.00213623046875, -5.769775390625, -5.53741455078125, -5.3050537109375, -5.07269287109375, -4.84033203125, -4.60797119140625, -4.3756103515625, -4.14324951171875, -3.910888671875, -3.67852783203125, -3.4461669921875, -3.21380615234375, -2.9814453125, -2.74908447265625, -2.5167236328125, -2.28436279296875, -2.052001953125, -1.81964111328125, -1.5872802734375, -1.35491943359375, -1.12255859375, -0.89019775390625, -0.6578369140625, -0.42547607421875, -0.193115234375, 0.03924560546875, 0.2716064453125, 0.50396728515625, 0.736328125, 0.96868896484375, 1.2010498046875, 1.43341064453125, 1.665771484375, 1.89813232421875, 2.1304931640625, 2.36285400390625, 2.59521484375, 2.82757568359375, 3.0599365234375, 3.29229736328125, 3.524658203125, 3.75701904296875, 3.9893798828125, 4.22174072265625, 4.4541015625, 4.68646240234375, 4.9188232421875, 5.15118408203125, 5.383544921875, 5.61590576171875, 5.8482666015625, 6.08062744140625, 6.31298828125, 6.54534912109375, 6.7777099609375, 7.01007080078125, 7.242431640625, 7.47479248046875, 7.7071533203125, 7.93951416015625, 8.171875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 6.0, 9.0, 4.0, 11.0, 7.0, 17.0, 24.0, 14.0, 39.0, 40.0, 68.0, 104.0, 144.0, 242.0, 436.0, 931.0, 2707.0, 10474.0, 52738.0, 294862.0, 1345544.0, 1860604.0, 508359.0, 92410.0, 17537.0, 4220.0, 1331.0, 559.0, 292.0, 157.0, 99.0, 73.0, 57.0, 39.0, 31.0, 15.0, 10.0, 14.0, 15.0, 13.0, 9.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.7890625, -13.3162841796875, -12.843505859375, -12.3707275390625, -11.89794921875, -11.4251708984375, -10.952392578125, -10.4796142578125, -10.0068359375, -9.5340576171875, -9.061279296875, -8.5885009765625, -8.11572265625, -7.6429443359375, -7.170166015625, -6.6973876953125, -6.224609375, -5.7518310546875, -5.279052734375, -4.8062744140625, -4.33349609375, -3.8607177734375, -3.387939453125, -2.9151611328125, -2.4423828125, -1.9696044921875, -1.496826171875, -1.0240478515625, -0.55126953125, -0.0784912109375, 0.394287109375, 0.8670654296875, 1.33984375, 1.8126220703125, 2.285400390625, 2.7581787109375, 3.23095703125, 3.7037353515625, 4.176513671875, 4.6492919921875, 5.1220703125, 5.5948486328125, 6.067626953125, 6.5404052734375, 7.01318359375, 7.4859619140625, 7.958740234375, 8.4315185546875, 8.904296875, 9.3770751953125, 9.849853515625, 10.3226318359375, 10.79541015625, 11.2681884765625, 11.740966796875, 12.2137451171875, 12.6865234375, 13.1593017578125, 13.632080078125, 14.1048583984375, 14.57763671875, 15.0504150390625, 15.523193359375, 15.9959716796875, 16.46875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 4.0, 12.0, 16.0, 15.0, 17.0, 28.0, 39.0, 58.0, 89.0, 107.0, 151.0, 180.0, 220.0, 303.0, 383.0, 468.0, 406.0, 367.0, 310.0, 214.0, 193.0, 132.0, 100.0, 73.0, 48.0, 27.0, 24.0, 18.0, 21.0, 10.0, 12.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.55859375, -15.1015625, -14.64453125, -14.1875, -13.73046875, -13.2734375, -12.81640625, -12.359375, -11.90234375, -11.4453125, -10.98828125, -10.53125, -10.07421875, -9.6171875, -9.16015625, -8.703125, -8.24609375, -7.7890625, -7.33203125, -6.875, -6.41796875, -5.9609375, -5.50390625, -5.046875, -4.58984375, -4.1328125, -3.67578125, -3.21875, -2.76171875, -2.3046875, -1.84765625, -1.390625, -0.93359375, -0.4765625, -0.01953125, 0.4375, 0.89453125, 1.3515625, 1.80859375, 2.265625, 2.72265625, 3.1796875, 3.63671875, 4.09375, 4.55078125, 5.0078125, 5.46484375, 5.921875, 6.37890625, 6.8359375, 7.29296875, 7.75, 8.20703125, 8.6640625, 9.12109375, 9.578125, 10.03515625, 10.4921875, 10.94921875, 11.40625, 11.86328125, 12.3203125, 12.77734375, 13.234375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 12.0, 17.0, 21.0, 19.0, 27.0, 45.0, 61.0, 93.0, 143.0, 193.0, 260.0, 517.0, 4548.0, 928888.0, 3239375.0, 18201.0, 720.0, 331.0, 211.0, 167.0, 118.0, 87.0, 58.0, 37.0, 31.0, 18.0, 18.0, 17.0, 9.0, 4.0, 9.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.3125, -60.24609375, -58.1796875, -56.11328125, -54.046875, -51.98046875, -49.9140625, -47.84765625, -45.78125, -43.71484375, -41.6484375, -39.58203125, -37.515625, -35.44921875, -33.3828125, -31.31640625, -29.25, -27.18359375, -25.1171875, -23.05078125, -20.984375, -18.91796875, -16.8515625, -14.78515625, -12.71875, -10.65234375, -8.5859375, -6.51953125, -4.453125, -2.38671875, -0.3203125, 1.74609375, 3.8125, 5.87890625, 7.9453125, 10.01171875, 12.078125, 14.14453125, 16.2109375, 18.27734375, 20.34375, 22.41015625, 24.4765625, 26.54296875, 28.609375, 30.67578125, 32.7421875, 34.80859375, 36.875, 38.94140625, 41.0078125, 43.07421875, 45.140625, 47.20703125, 49.2734375, 51.33984375, 53.40625, 55.47265625, 57.5390625, 59.60546875, 61.671875, 63.73828125, 65.8046875, 67.87109375, 69.9375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 10.0, 21.0, 47.0, 97.0, 153.0, 202.0, 186.0, 159.0, 76.0, 42.0, 18.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.58728790283203, -123.48802947998047, -119.38877868652344, -115.28952026367188, -111.19026947021484, -107.09101104736328, -102.99176025390625, -98.89250183105469, -94.79324340820312, -90.69398498535156, -86.59473419189453, -82.49547576904297, -78.39622497558594, -74.29696655273438, -70.19770812988281, -66.09845733642578, -61.99920654296875, -57.89995193481445, -53.800697326660156, -49.701438903808594, -45.60218811035156, -41.5029296875, -37.4036750793457, -33.304420471191406, -29.20516586303711, -25.105911254882812, -21.006656646728516, -16.907400131225586, -12.808145523071289, -8.708890914916992, -4.6096343994140625, -0.5103797912597656, 3.5888671875, 7.688122272491455, 11.78737735748291, 15.886632919311523, 19.98588752746582, 24.085142135620117, 28.184398651123047, 32.283653259277344, 36.38290786743164, 40.48216247558594, 44.581417083740234, 48.68067169189453, 52.779930114746094, 56.879180908203125, 60.97843933105469, 65.07769775390625, 69.17694854736328, 73.27620697021484, 77.37545776367188, 81.47471618652344, 85.57396697998047, 89.67322540283203, 93.77247619628906, 97.87173461914062, 101.97099304199219, 106.07025146484375, 110.16950225830078, 114.26876068115234, 118.36801147460938, 122.46726989746094, 126.5665283203125, 130.665771484375, 134.76502990722656]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 12.0, 6.0, 9.0, 10.0, 18.0, 7.0, 17.0, 14.0, 32.0, 25.0, 26.0, 22.0, 46.0, 47.0, 38.0, 44.0, 46.0, 42.0, 36.0, 60.0, 33.0, 34.0, 40.0, 30.0, 37.0, 30.0, 27.0, 27.0, 18.0, 16.0, 22.0, 16.0, 21.0, 15.0, 19.0, 15.0, 8.0, 5.0, 6.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-50.886444091796875, -49.40039825439453, -47.91434860229492, -46.42830276489258, -44.942256927490234, -43.45621109008789, -41.97016143798828, -40.48411560058594, -38.998069763183594, -37.51202392578125, -36.02597427368164, -34.5399284362793, -33.05388259887695, -31.567834854125977, -30.081787109375, -28.595741271972656, -27.10969352722168, -25.623645782470703, -24.13759994506836, -22.651552200317383, -21.16550636291504, -19.679458618164062, -18.19341278076172, -16.707365036010742, -15.221318244934082, -13.735271453857422, -12.249224662780762, -10.763177871704102, -9.277130126953125, -7.791083812713623, -6.305036544799805, -4.8189897537231445, -3.3329429626464844, -1.8468960523605347, -0.36084914207458496, 1.1251978874206543, 2.6112446784973145, 4.097291469573975, 5.583338737487793, 7.069385528564453, 8.555432319641113, 10.041479110717773, 11.527525901794434, 13.013572692871094, 14.49962043762207, 15.985666275024414, 17.47171401977539, 18.957759857177734, 20.44380760192871, 21.929855346679688, 23.41590118408203, 24.901948928833008, 26.38799476623535, 27.874042510986328, 29.360088348388672, 30.84613609313965, 32.332183837890625, 33.81822967529297, 35.30427932739258, 36.79032516479492, 38.276371002197266, 39.76241683959961, 41.24846649169922, 42.73451232910156, 44.220558166503906]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 11.0, 8.0, 14.0, 9.0, 16.0, 18.0, 26.0, 26.0, 30.0, 28.0, 26.0, 33.0, 24.0, 35.0, 47.0, 47.0, 35.0, 36.0, 38.0, 47.0, 41.0, 42.0, 30.0, 22.0, 30.0, 26.0, 28.0, 29.0, 28.0, 42.0, 16.0, 15.0, 15.0, 15.0, 5.0, 16.0, 9.0, 3.0, 8.0, 2.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6328125, -6.4110107421875, -6.189208984375, -5.9674072265625, -5.74560546875, -5.5238037109375, -5.302001953125, -5.0802001953125, -4.8583984375, -4.6365966796875, -4.414794921875, -4.1929931640625, -3.97119140625, -3.7493896484375, -3.527587890625, -3.3057861328125, -3.083984375, -2.8621826171875, -2.640380859375, -2.4185791015625, -2.19677734375, -1.9749755859375, -1.753173828125, -1.5313720703125, -1.3095703125, -1.0877685546875, -0.865966796875, -0.6441650390625, -0.42236328125, -0.2005615234375, 0.021240234375, 0.2430419921875, 0.46484375, 0.6866455078125, 0.908447265625, 1.1302490234375, 1.35205078125, 1.5738525390625, 1.795654296875, 2.0174560546875, 2.2392578125, 2.4610595703125, 2.682861328125, 2.9046630859375, 3.12646484375, 3.3482666015625, 3.570068359375, 3.7918701171875, 4.013671875, 4.2354736328125, 4.457275390625, 4.6790771484375, 4.90087890625, 5.1226806640625, 5.344482421875, 5.5662841796875, 5.7880859375, 6.0098876953125, 6.231689453125, 6.4534912109375, 6.67529296875, 6.8970947265625, 7.118896484375, 7.3406982421875, 7.5625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 12.0, 10.0, 21.0, 30.0, 40.0, 70.0, 103.0, 163.0, 252.0, 362.0, 644.0, 932.0, 1414.0, 2302.0, 3547.0, 5545.0, 8728.0, 13327.0, 20414.0, 30255.0, 43687.0, 60974.0, 79570.0, 99341.0, 114547.0, 119331.0, 109427.0, 92945.0, 72063.0, 54108.0, 38344.0, 26157.0, 17443.0, 11535.0, 7450.0, 4850.0, 3081.0, 2017.0, 1241.0, 811.0, 488.0, 333.0, 204.0, 185.0, 80.0, 57.0, 48.0, 33.0, 13.0, 6.0, 6.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.1884765625, -1.151702880859375, -1.11492919921875, -1.078155517578125, -1.0413818359375, -1.004608154296875, -0.96783447265625, -0.931060791015625, -0.894287109375, -0.857513427734375, -0.82073974609375, -0.783966064453125, -0.7471923828125, -0.710418701171875, -0.67364501953125, -0.636871337890625, -0.60009765625, -0.563323974609375, -0.52655029296875, -0.489776611328125, -0.4530029296875, -0.416229248046875, -0.37945556640625, -0.342681884765625, -0.305908203125, -0.269134521484375, -0.23236083984375, -0.195587158203125, -0.1588134765625, -0.122039794921875, -0.08526611328125, -0.048492431640625, -0.01171875, 0.025054931640625, 0.06182861328125, 0.098602294921875, 0.1353759765625, 0.172149658203125, 0.20892333984375, 0.245697021484375, 0.282470703125, 0.319244384765625, 0.35601806640625, 0.392791748046875, 0.4295654296875, 0.466339111328125, 0.50311279296875, 0.539886474609375, 0.57666015625, 0.613433837890625, 0.65020751953125, 0.686981201171875, 0.7237548828125, 0.760528564453125, 0.79730224609375, 0.834075927734375, 0.870849609375, 0.907623291015625, 0.94439697265625, 0.981170654296875, 1.0179443359375, 1.054718017578125, 1.09149169921875, 1.128265380859375, 1.1650390625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 7.0, 10.0, 16.0, 12.0, 10.0, 16.0, 15.0, 18.0, 24.0, 29.0, 24.0, 31.0, 35.0, 40.0, 38.0, 30.0, 32.0, 36.0, 44.0, 1066.0, 31.0, 45.0, 33.0, 38.0, 25.0, 33.0, 32.0, 27.0, 34.0, 20.0, 18.0, 21.0, 17.0, 8.0, 13.0, 9.0, 11.0, 11.0, 9.0, 9.0, 4.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.2734375, -5.1153564453125, -4.957275390625, -4.7991943359375, -4.64111328125, -4.4830322265625, -4.324951171875, -4.1668701171875, -4.0087890625, -3.8507080078125, -3.692626953125, -3.5345458984375, -3.37646484375, -3.2183837890625, -3.060302734375, -2.9022216796875, -2.744140625, -2.5860595703125, -2.427978515625, -2.2698974609375, -2.11181640625, -1.9537353515625, -1.795654296875, -1.6375732421875, -1.4794921875, -1.3214111328125, -1.163330078125, -1.0052490234375, -0.84716796875, -0.6890869140625, -0.531005859375, -0.3729248046875, -0.21484375, -0.0567626953125, 0.101318359375, 0.2593994140625, 0.41748046875, 0.5755615234375, 0.733642578125, 0.8917236328125, 1.0498046875, 1.2078857421875, 1.365966796875, 1.5240478515625, 1.68212890625, 1.8402099609375, 1.998291015625, 2.1563720703125, 2.314453125, 2.4725341796875, 2.630615234375, 2.7886962890625, 2.94677734375, 3.1048583984375, 3.262939453125, 3.4210205078125, 3.5791015625, 3.7371826171875, 3.895263671875, 4.0533447265625, 4.21142578125, 4.3695068359375, 4.527587890625, 4.6856689453125, 4.84375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 5.0, 10.0, 23.0, 22.0, 27.0, 59.0, 106.0, 135.0, 242.0, 355.0, 517.0, 815.0, 1251.0, 1937.0, 3093.0, 4610.0, 7106.0, 10727.0, 16739.0, 27019.0, 56327.0, 1868500.0, 36100.0, 21926.0, 13759.0, 8914.0, 5852.0, 3785.0, 2428.0, 1615.0, 1041.0, 734.0, 472.0, 294.0, 199.0, 122.0, 89.0, 66.0, 31.0, 28.0, 15.0, 12.0, 8.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.488128662109375, -2.40594482421875, -2.323760986328125, -2.2415771484375, -2.159393310546875, -2.07720947265625, -1.995025634765625, -1.912841796875, -1.830657958984375, -1.74847412109375, -1.666290283203125, -1.5841064453125, -1.501922607421875, -1.41973876953125, -1.337554931640625, -1.25537109375, -1.173187255859375, -1.09100341796875, -1.008819580078125, -0.9266357421875, -0.844451904296875, -0.76226806640625, -0.680084228515625, -0.597900390625, -0.515716552734375, -0.43353271484375, -0.351348876953125, -0.2691650390625, -0.186981201171875, -0.10479736328125, -0.022613525390625, 0.0595703125, 0.141754150390625, 0.22393798828125, 0.306121826171875, 0.3883056640625, 0.470489501953125, 0.55267333984375, 0.634857177734375, 0.717041015625, 0.799224853515625, 0.88140869140625, 0.963592529296875, 1.0457763671875, 1.127960205078125, 1.21014404296875, 1.292327880859375, 1.37451171875, 1.456695556640625, 1.53887939453125, 1.621063232421875, 1.7032470703125, 1.785430908203125, 1.86761474609375, 1.949798583984375, 2.031982421875, 2.114166259765625, 2.19635009765625, 2.278533935546875, 2.3607177734375, 2.442901611328125, 2.52508544921875, 2.607269287109375, 2.689453125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 8.0, 14.0, 7.0, 12.0, 17.0, 19.0, 18.0, 24.0, 36.0, 42.0, 37.0, 67.0, 59.0, 83.0, 96.0, 79.0, 65.0, 62.0, 39.0, 33.0, 20.0, 25.0, 22.0, 12.0, 25.0, 10.0, 12.0, 7.0, 8.0, 15.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0909423828125, -0.08796024322509766, -0.08497810363769531, -0.08199596405029297, -0.07901382446289062, -0.07603168487548828, -0.07304954528808594, -0.0700674057006836, -0.06708526611328125, -0.0641031265258789, -0.06112098693847656, -0.05813884735107422, -0.055156707763671875, -0.05217456817626953, -0.04919242858886719, -0.046210289001464844, -0.0432281494140625, -0.040246009826660156, -0.03726387023925781, -0.03428173065185547, -0.031299591064453125, -0.02831745147705078, -0.025335311889648438, -0.022353172302246094, -0.01937103271484375, -0.016388893127441406, -0.013406753540039062, -0.010424613952636719, -0.007442474365234375, -0.004460334777832031, -0.0014781951904296875, 0.0015039443969726562, 0.004486083984375, 0.007468223571777344, 0.010450363159179688, 0.013432502746582031, 0.016414642333984375, 0.01939678192138672, 0.022378921508789062, 0.025361061096191406, 0.02834320068359375, 0.031325340270996094, 0.03430747985839844, 0.03728961944580078, 0.040271759033203125, 0.04325389862060547, 0.04623603820800781, 0.049218177795410156, 0.0522003173828125, 0.055182456970214844, 0.05816459655761719, 0.06114673614501953, 0.06412887573242188, 0.06711101531982422, 0.07009315490722656, 0.0730752944946289, 0.07605743408203125, 0.0790395736694336, 0.08202171325683594, 0.08500385284423828, 0.08798599243164062, 0.09096813201904297, 0.09395027160644531, 0.09693241119384766, 0.09991455078125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 6.0, 5.0, 9.0, 15.0, 10.0, 7.0, 17.0, 21.0, 20.0, 30.0, 23.0, 49.0, 52.0, 98.0, 204.0, 402.0, 2049.0, 1008199.0, 35930.0, 700.0, 259.0, 133.0, 78.0, 65.0, 30.0, 31.0, 22.0, 15.0, 14.0, 14.0, 12.0, 11.0, 7.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.1796875, -2.115081787109375, -2.05047607421875, -1.985870361328125, -1.9212646484375, -1.856658935546875, -1.79205322265625, -1.727447509765625, -1.662841796875, -1.598236083984375, -1.53363037109375, -1.469024658203125, -1.4044189453125, -1.339813232421875, -1.27520751953125, -1.210601806640625, -1.14599609375, -1.081390380859375, -1.01678466796875, -0.952178955078125, -0.8875732421875, -0.822967529296875, -0.75836181640625, -0.693756103515625, -0.629150390625, -0.564544677734375, -0.49993896484375, -0.435333251953125, -0.3707275390625, -0.306121826171875, -0.24151611328125, -0.176910400390625, -0.1123046875, -0.047698974609375, 0.01690673828125, 0.081512451171875, 0.1461181640625, 0.210723876953125, 0.27532958984375, 0.339935302734375, 0.404541015625, 0.469146728515625, 0.53375244140625, 0.598358154296875, 0.6629638671875, 0.727569580078125, 0.79217529296875, 0.856781005859375, 0.92138671875, 0.985992431640625, 1.05059814453125, 1.115203857421875, 1.1798095703125, 1.244415283203125, 1.30902099609375, 1.373626708984375, 1.438232421875, 1.502838134765625, 1.56744384765625, 1.632049560546875, 1.6966552734375, 1.761260986328125, 1.82586669921875, 1.890472412109375, 1.955078125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 60.0, 917.0, 37.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6929821968078613, -3.615173816680908, -3.537365674972534, -3.459557294845581, -3.381749153137207, -3.303940773010254, -3.22613263130188, -3.1483242511749268, -3.0705161094665527, -2.9927077293395996, -2.9148995876312256, -2.8370912075042725, -2.7592830657958984, -2.6814746856689453, -2.6036665439605713, -2.525858163833618, -2.448049783706665, -2.370241403579712, -2.292433261871338, -2.2146248817443848, -2.1368167400360107, -2.0590083599090576, -1.981200098991394, -1.9033918380737305, -1.825583577156067, -1.7477753162384033, -1.6699670553207397, -1.5921587944030762, -1.514350414276123, -1.436542272567749, -1.358733892440796, -1.2809256315231323, -1.2031174898147583, -1.1253092288970947, -1.0475009679794312, -0.9696926474571228, -0.8918843865394592, -0.8140761256217957, -0.7362678050994873, -0.6584595441818237, -0.5806512832641602, -0.5028430223464966, -0.4250347316265106, -0.34722644090652466, -0.2694181799888611, -0.1916099190711975, -0.11380162835121155, -0.035993337631225586, 0.04181492328643799, 0.11962319910526276, 0.19743147492408752, 0.2752397656440735, 0.35304802656173706, 0.43085628747940063, 0.508664608001709, 0.5864728689193726, 0.6642811298370361, 0.7420893907546997, 0.8198976516723633, 0.8977059721946716, 0.9755142331123352, 1.0533225536346436, 1.1311308145523071, 1.2089390754699707, 1.2867473363876343]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 7.0, 5.0, 8.0, 11.0, 11.0, 18.0, 27.0, 20.0, 23.0, 36.0, 26.0, 36.0, 40.0, 38.0, 34.0, 55.0, 35.0, 44.0, 54.0, 51.0, 56.0, 52.0, 38.0, 36.0, 41.0, 33.0, 35.0, 18.0, 19.0, 27.0, 16.0, 11.0, 12.0, 11.0, 8.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3222694993019104, -0.3116346597671509, -0.30099982023239136, -0.29036498069763184, -0.2797301411628723, -0.2690952718257904, -0.2584604322910309, -0.24782559275627136, -0.23719075322151184, -0.22655591368675232, -0.2159210741519928, -0.20528621971607208, -0.19465138018131256, -0.18401654064655304, -0.17338168621063232, -0.1627468466758728, -0.15211200714111328, -0.14147716760635376, -0.13084232807159424, -0.12020747363567352, -0.109572634100914, -0.09893779456615448, -0.08830294758081436, -0.07766810059547424, -0.06703326106071472, -0.0563984178006649, -0.04576357454061508, -0.03512873128056526, -0.024493888020515442, -0.013859044760465622, -0.003224201500415802, 0.007410645484924316, 0.018045485019683838, 0.028680328279733658, 0.03931517153978348, 0.0499500147998333, 0.06058485805988312, 0.07121969759464264, 0.08185454457998276, 0.09248939156532288, 0.1031242311000824, 0.11375907063484192, 0.12439391762018204, 0.13502876460552216, 0.14566360414028168, 0.1562984436750412, 0.16693329811096191, 0.17756813764572144, 0.18820297718048096, 0.19883781671524048, 0.20947265625, 0.22010751068592072, 0.23074235022068024, 0.24137718975543976, 0.2520120441913605, 0.26264688372612, 0.2732817232608795, 0.28391656279563904, 0.29455140233039856, 0.3051862418651581, 0.31582111120224, 0.3264559507369995, 0.33709079027175903, 0.34772562980651855, 0.3583604693412781]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 9.0, 6.0, 8.0, 8.0, 15.0, 17.0, 15.0, 18.0, 25.0, 22.0, 27.0, 30.0, 23.0, 43.0, 29.0, 41.0, 35.0, 43.0, 36.0, 47.0, 38.0, 32.0, 38.0, 38.0, 27.0, 30.0, 38.0, 33.0, 32.0, 25.0, 18.0, 22.0, 21.0, 14.0, 18.0, 15.0, 11.0, 12.0, 6.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96875, -5.752197265625, -5.53564453125, -5.319091796875, -5.1025390625, -4.885986328125, -4.66943359375, -4.452880859375, -4.236328125, -4.019775390625, -3.80322265625, -3.586669921875, -3.3701171875, -3.153564453125, -2.93701171875, -2.720458984375, -2.50390625, -2.287353515625, -2.07080078125, -1.854248046875, -1.6376953125, -1.421142578125, -1.20458984375, -0.988037109375, -0.771484375, -0.554931640625, -0.33837890625, -0.121826171875, 0.0947265625, 0.311279296875, 0.52783203125, 0.744384765625, 0.9609375, 1.177490234375, 1.39404296875, 1.610595703125, 1.8271484375, 2.043701171875, 2.26025390625, 2.476806640625, 2.693359375, 2.909912109375, 3.12646484375, 3.343017578125, 3.5595703125, 3.776123046875, 3.99267578125, 4.209228515625, 4.42578125, 4.642333984375, 4.85888671875, 5.075439453125, 5.2919921875, 5.508544921875, 5.72509765625, 5.941650390625, 6.158203125, 6.374755859375, 6.59130859375, 6.807861328125, 7.0244140625, 7.240966796875, 7.45751953125, 7.674072265625, 7.890625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 15.0, 22.0, 30.0, 38.0, 52.0, 69.0, 100.0, 133.0, 210.0, 362.0, 589.0, 960.0, 1743.0, 3198.0, 5424.0, 9953.0, 17873.0, 31747.0, 56932.0, 102268.0, 178369.0, 253876.0, 168071.0, 95599.0, 53173.0, 29839.0, 16595.0, 9204.0, 5148.0, 2837.0, 1597.0, 988.0, 516.0, 332.0, 200.0, 138.0, 80.0, 69.0, 47.0, 30.0, 27.0, 24.0, 19.0, 13.0, 9.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.609375, -6.3848876953125, -6.160400390625, -5.9359130859375, -5.71142578125, -5.4869384765625, -5.262451171875, -5.0379638671875, -4.8134765625, -4.5889892578125, -4.364501953125, -4.1400146484375, -3.91552734375, -3.6910400390625, -3.466552734375, -3.2420654296875, -3.017578125, -2.7930908203125, -2.568603515625, -2.3441162109375, -2.11962890625, -1.8951416015625, -1.670654296875, -1.4461669921875, -1.2216796875, -0.9971923828125, -0.772705078125, -0.5482177734375, -0.32373046875, -0.0992431640625, 0.125244140625, 0.3497314453125, 0.57421875, 0.7987060546875, 1.023193359375, 1.2476806640625, 1.47216796875, 1.6966552734375, 1.921142578125, 2.1456298828125, 2.3701171875, 2.5946044921875, 2.819091796875, 3.0435791015625, 3.26806640625, 3.4925537109375, 3.717041015625, 3.9415283203125, 4.166015625, 4.3905029296875, 4.614990234375, 4.8394775390625, 5.06396484375, 5.2884521484375, 5.512939453125, 5.7374267578125, 5.9619140625, 6.1864013671875, 6.410888671875, 6.6353759765625, 6.85986328125, 7.0843505859375, 7.308837890625, 7.5333251953125, 7.7578125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 9.0, 15.0, 8.0, 4.0, 14.0, 26.0, 24.0, 22.0, 22.0, 24.0, 30.0, 29.0, 38.0, 42.0, 42.0, 45.0, 87.0, 143.0, 217.0, 1315.0, 216.0, 141.0, 85.0, 78.0, 41.0, 43.0, 36.0, 26.0, 22.0, 32.0, 22.0, 15.0, 16.0, 14.0, 17.0, 13.0, 6.0, 14.0, 7.0, 9.0, 7.0, 3.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0], "bins": [-20.640625, -20.044677734375, -19.44873046875, -18.852783203125, -18.2568359375, -17.660888671875, -17.06494140625, -16.468994140625, -15.873046875, -15.277099609375, -14.68115234375, -14.085205078125, -13.4892578125, -12.893310546875, -12.29736328125, -11.701416015625, -11.10546875, -10.509521484375, -9.91357421875, -9.317626953125, -8.7216796875, -8.125732421875, -7.52978515625, -6.933837890625, -6.337890625, -5.741943359375, -5.14599609375, -4.550048828125, -3.9541015625, -3.358154296875, -2.76220703125, -2.166259765625, -1.5703125, -0.974365234375, -0.37841796875, 0.217529296875, 0.8134765625, 1.409423828125, 2.00537109375, 2.601318359375, 3.197265625, 3.793212890625, 4.38916015625, 4.985107421875, 5.5810546875, 6.177001953125, 6.77294921875, 7.368896484375, 7.96484375, 8.560791015625, 9.15673828125, 9.752685546875, 10.3486328125, 10.944580078125, 11.54052734375, 12.136474609375, 12.732421875, 13.328369140625, 13.92431640625, 14.520263671875, 15.1162109375, 15.712158203125, 16.30810546875, 16.904052734375, 17.5]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 4.0, 7.0, 8.0, 8.0, 21.0, 22.0, 49.0, 44.0, 89.0, 125.0, 223.0, 389.0, 1076.0, 8202.0, 3021040.0, 111120.0, 1895.0, 629.0, 282.0, 163.0, 95.0, 65.0, 32.0, 27.0, 32.0, 13.0, 6.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.625, -84.7724609375, -81.919921875, -79.0673828125, -76.21484375, -73.3623046875, -70.509765625, -67.6572265625, -64.8046875, -61.9521484375, -59.099609375, -56.2470703125, -53.39453125, -50.5419921875, -47.689453125, -44.8369140625, -41.984375, -39.1318359375, -36.279296875, -33.4267578125, -30.57421875, -27.7216796875, -24.869140625, -22.0166015625, -19.1640625, -16.3115234375, -13.458984375, -10.6064453125, -7.75390625, -4.9013671875, -2.048828125, 0.8037109375, 3.65625, 6.5087890625, 9.361328125, 12.2138671875, 15.06640625, 17.9189453125, 20.771484375, 23.6240234375, 26.4765625, 29.3291015625, 32.181640625, 35.0341796875, 37.88671875, 40.7392578125, 43.591796875, 46.4443359375, 49.296875, 52.1494140625, 55.001953125, 57.8544921875, 60.70703125, 63.5595703125, 66.412109375, 69.2646484375, 72.1171875, 74.9697265625, 77.822265625, 80.6748046875, 83.52734375, 86.3798828125, 89.232421875, 92.0849609375, 94.9375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 91.0, 395.0, 448.0, 66.0, 12.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.925743103027344, -45.48971939086914, -39.05369567871094, -32.617671966552734, -26.18164825439453, -19.745624542236328, -13.309600830078125, -6.873577117919922, -0.43755340576171875, 5.998470306396484, 12.434494018554688, 18.87051773071289, 25.306541442871094, 31.742565155029297, 38.1785888671875, 44.6146125793457, 51.050636291503906, 57.48666000366211, 63.92268371582031, 70.35870361328125, 76.79473114013672, 83.23075866699219, 89.66677856445312, 96.10279846191406, 102.53882598876953, 108.974853515625, 115.41087341308594, 121.84689331054688, 128.28292846679688, 134.7189483642578, 141.15496826171875, 147.5909881591797, 154.02700805664062, 160.46302795410156, 166.8990478515625, 173.3350830078125, 179.77110290527344, 186.20712280273438, 192.64315795898438, 199.0791778564453, 205.51519775390625, 211.9512176513672, 218.38723754882812, 224.82327270507812, 231.25929260253906, 237.6953125, 244.13134765625, 250.56736755371094, 257.0033874511719, 263.4394226074219, 269.87542724609375, 276.31146240234375, 282.74749755859375, 289.1835021972656, 295.6195373535156, 302.0555419921875, 308.4915771484375, 314.9276123046875, 321.3636169433594, 327.7996520996094, 334.23565673828125, 340.67169189453125, 347.10772705078125, 353.5437316894531, 359.9797668457031]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 7.0, 8.0, 8.0, 11.0, 7.0, 21.0, 24.0, 20.0, 24.0, 24.0, 27.0, 29.0, 30.0, 28.0, 35.0, 35.0, 46.0, 41.0, 48.0, 44.0, 31.0, 26.0, 34.0, 38.0, 35.0, 30.0, 44.0, 36.0, 28.0, 23.0, 24.0, 16.0, 26.0, 22.0, 15.0, 10.0, 7.0, 14.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-57.39506149291992, -55.68384552001953, -53.97262954711914, -52.26141357421875, -50.550201416015625, -48.838985443115234, -47.127769470214844, -45.41655349731445, -43.70533752441406, -41.99412155151367, -40.28290557861328, -38.571693420410156, -36.860477447509766, -35.149261474609375, -33.438045501708984, -31.726829528808594, -30.01561737060547, -28.304401397705078, -26.59318733215332, -24.88197135925293, -23.170757293701172, -21.45954132080078, -19.74832534790039, -18.037109375, -16.325895309448242, -14.614680290222168, -12.903465270996094, -11.192249298095703, -9.481034278869629, -7.769819259643555, -6.058603286743164, -4.34738826751709, -2.63616943359375, -0.9249541759490967, 0.7862610816955566, 2.497476577758789, 4.208691596984863, 5.9199066162109375, 7.631122589111328, 9.342337608337402, 11.053552627563477, 12.76476764678955, 14.475982666015625, 16.187198638916016, 17.898414611816406, 19.609628677368164, 21.320844650268555, 23.032058715820312, 24.743274688720703, 26.454490661621094, 28.16570472717285, 29.876920700073242, 31.588134765625, 33.29935073852539, 35.01056671142578, 36.72178268432617, 38.43299865722656, 40.14421463012695, 41.855430603027344, 43.56664276123047, 45.27785873413086, 46.98907470703125, 48.70029067993164, 50.41150665283203, 52.122718811035156]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 2.0, 12.0, 14.0, 14.0, 18.0, 24.0, 26.0, 21.0, 26.0, 27.0, 41.0, 34.0, 36.0, 42.0, 35.0, 37.0, 36.0, 52.0, 38.0, 48.0, 42.0, 36.0, 41.0, 39.0, 28.0, 45.0, 22.0, 17.0, 17.0, 25.0, 19.0, 15.0, 23.0, 5.0, 9.0, 7.0, 4.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.1881103515625, -6.930908203125, -6.6737060546875, -6.41650390625, -6.1593017578125, -5.902099609375, -5.6448974609375, -5.3876953125, -5.1304931640625, -4.873291015625, -4.6160888671875, -4.35888671875, -4.1016845703125, -3.844482421875, -3.5872802734375, -3.330078125, -3.0728759765625, -2.815673828125, -2.5584716796875, -2.30126953125, -2.0440673828125, -1.786865234375, -1.5296630859375, -1.2724609375, -1.0152587890625, -0.758056640625, -0.5008544921875, -0.24365234375, 0.0135498046875, 0.270751953125, 0.5279541015625, 0.78515625, 1.0423583984375, 1.299560546875, 1.5567626953125, 1.81396484375, 2.0711669921875, 2.328369140625, 2.5855712890625, 2.8427734375, 3.0999755859375, 3.357177734375, 3.6143798828125, 3.87158203125, 4.1287841796875, 4.385986328125, 4.6431884765625, 4.900390625, 5.1575927734375, 5.414794921875, 5.6719970703125, 5.92919921875, 6.1864013671875, 6.443603515625, 6.7008056640625, 6.9580078125, 7.2152099609375, 7.472412109375, 7.7296142578125, 7.98681640625, 8.2440185546875, 8.501220703125, 8.7584228515625, 9.015625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 11.0, 6.0, 14.0, 16.0, 21.0, 25.0, 20.0, 28.0, 41.0, 50.0, 101.0, 261.0, 843.0, 3775.0, 23962.0, 225480.0, 1833039.0, 1853516.0, 224043.0, 23825.0, 3710.0, 873.0, 250.0, 90.0, 60.0, 40.0, 31.0, 34.0, 19.0, 21.0, 13.0, 7.0, 15.0, 8.0, 2.0, 12.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.683837890625, -18.03955078125, -17.395263671875, -16.7509765625, -16.106689453125, -15.46240234375, -14.818115234375, -14.173828125, -13.529541015625, -12.88525390625, -12.240966796875, -11.5966796875, -10.952392578125, -10.30810546875, -9.663818359375, -9.01953125, -8.375244140625, -7.73095703125, -7.086669921875, -6.4423828125, -5.798095703125, -5.15380859375, -4.509521484375, -3.865234375, -3.220947265625, -2.57666015625, -1.932373046875, -1.2880859375, -0.643798828125, 0.00048828125, 0.644775390625, 1.2890625, 1.933349609375, 2.57763671875, 3.221923828125, 3.8662109375, 4.510498046875, 5.15478515625, 5.799072265625, 6.443359375, 7.087646484375, 7.73193359375, 8.376220703125, 9.0205078125, 9.664794921875, 10.30908203125, 10.953369140625, 11.59765625, 12.241943359375, 12.88623046875, 13.530517578125, 14.1748046875, 14.819091796875, 15.46337890625, 16.107666015625, 16.751953125, 17.396240234375, 18.04052734375, 18.684814453125, 19.3291015625, 19.973388671875, 20.61767578125, 21.261962890625, 21.90625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 6.0, 2.0, 4.0, 5.0, 6.0, 14.0, 17.0, 22.0, 40.0, 34.0, 41.0, 61.0, 76.0, 91.0, 118.0, 171.0, 181.0, 243.0, 329.0, 353.0, 363.0, 374.0, 299.0, 266.0, 207.0, 166.0, 129.0, 109.0, 63.0, 71.0, 51.0, 33.0, 28.0, 25.0, 21.0, 10.0, 12.0, 12.0, 4.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.2890625, -11.9117431640625, -11.534423828125, -11.1571044921875, -10.77978515625, -10.4024658203125, -10.025146484375, -9.6478271484375, -9.2705078125, -8.8931884765625, -8.515869140625, -8.1385498046875, -7.76123046875, -7.3839111328125, -7.006591796875, -6.6292724609375, -6.251953125, -5.8746337890625, -5.497314453125, -5.1199951171875, -4.74267578125, -4.3653564453125, -3.988037109375, -3.6107177734375, -3.2333984375, -2.8560791015625, -2.478759765625, -2.1014404296875, -1.72412109375, -1.3468017578125, -0.969482421875, -0.5921630859375, -0.21484375, 0.1624755859375, 0.539794921875, 0.9171142578125, 1.29443359375, 1.6717529296875, 2.049072265625, 2.4263916015625, 2.8037109375, 3.1810302734375, 3.558349609375, 3.9356689453125, 4.31298828125, 4.6903076171875, 5.067626953125, 5.4449462890625, 5.822265625, 6.1995849609375, 6.576904296875, 6.9542236328125, 7.33154296875, 7.7088623046875, 8.086181640625, 8.4635009765625, 8.8408203125, 9.2181396484375, 9.595458984375, 9.9727783203125, 10.35009765625, 10.7274169921875, 11.104736328125, 11.4820556640625, 11.859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 11.0, 12.0, 23.0, 19.0, 27.0, 37.0, 36.0, 48.0, 84.0, 62.0, 145.0, 158.0, 232.0, 359.0, 806.0, 19752.0, 3144869.0, 1020412.0, 5517.0, 566.0, 277.0, 185.0, 137.0, 115.0, 88.0, 60.0, 56.0, 43.0, 25.0, 33.0, 19.0, 13.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-64.25, -62.2333984375, -60.216796875, -58.2001953125, -56.18359375, -54.1669921875, -52.150390625, -50.1337890625, -48.1171875, -46.1005859375, -44.083984375, -42.0673828125, -40.05078125, -38.0341796875, -36.017578125, -34.0009765625, -31.984375, -29.9677734375, -27.951171875, -25.9345703125, -23.91796875, -21.9013671875, -19.884765625, -17.8681640625, -15.8515625, -13.8349609375, -11.818359375, -9.8017578125, -7.78515625, -5.7685546875, -3.751953125, -1.7353515625, 0.28125, 2.2978515625, 4.314453125, 6.3310546875, 8.34765625, 10.3642578125, 12.380859375, 14.3974609375, 16.4140625, 18.4306640625, 20.447265625, 22.4638671875, 24.48046875, 26.4970703125, 28.513671875, 30.5302734375, 32.546875, 34.5634765625, 36.580078125, 38.5966796875, 40.61328125, 42.6298828125, 44.646484375, 46.6630859375, 48.6796875, 50.6962890625, 52.712890625, 54.7294921875, 56.74609375, 58.7626953125, 60.779296875, 62.7958984375, 64.8125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 25.0, 68.0, 166.0, 302.0, 279.0, 129.0, 36.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.364219665527344, -32.702911376953125, -27.041603088378906, -21.380294799804688, -15.718986511230469, -10.05767822265625, -4.396369934082031, 1.2649383544921875, 6.926246643066406, 12.587554931640625, 18.248863220214844, 23.910171508789062, 29.57147979736328, 35.2327880859375, 40.89409637451172, 46.55540466308594, 52.216712951660156, 57.878021240234375, 63.539329528808594, 69.20063781738281, 74.86194610595703, 80.52325439453125, 86.18456268310547, 91.84587097167969, 97.5071792602539, 103.16848754882812, 108.82979583740234, 114.49110412597656, 120.15241241455078, 125.813720703125, 131.47503662109375, 137.13633728027344, 142.79763793945312, 148.45895385742188, 154.12025451660156, 159.78155517578125, 165.44287109375, 171.10418701171875, 176.76548767089844, 182.42678833007812, 188.08810424804688, 193.74942016601562, 199.4107208251953, 205.072021484375, 210.73333740234375, 216.3946533203125, 222.0559539794922, 227.71725463867188, 233.37857055664062, 239.03988647460938, 244.70118713378906, 250.36248779296875, 256.0238037109375, 261.68511962890625, 267.346435546875, 273.0077209472656, 278.6690368652344, 284.3303527832031, 289.99163818359375, 295.6529541015625, 301.31427001953125, 306.9755859375, 312.63690185546875, 318.2981872558594, 323.9595031738281]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 4.0, 11.0, 12.0, 11.0, 19.0, 14.0, 20.0, 41.0, 36.0, 36.0, 34.0, 31.0, 47.0, 51.0, 43.0, 42.0, 47.0, 59.0, 51.0, 47.0, 39.0, 36.0, 41.0, 30.0, 29.0, 26.0, 26.0, 28.0, 17.0, 15.0, 9.0, 11.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.03199768066406, -55.364864349365234, -53.697731018066406, -52.03059387207031, -50.363460540771484, -48.696327209472656, -47.02919387817383, -45.362060546875, -43.694923400878906, -42.02779006958008, -40.36065673828125, -38.693519592285156, -37.02638626098633, -35.3592529296875, -33.69211959838867, -32.024986267089844, -30.357851028442383, -28.690717697143555, -27.023582458496094, -25.356449127197266, -23.689313888549805, -22.022180557250977, -20.355045318603516, -18.687911987304688, -17.02077865600586, -15.353644371032715, -13.68651008605957, -12.019376754760742, -10.352241516113281, -8.685108184814453, -7.017973899841309, -5.350839614868164, -3.683704376220703, -2.0165700912475586, -0.34943604469299316, 1.3176980018615723, 2.984832286834717, 4.651966094970703, 6.319100379943848, 7.986234664916992, 9.653368949890137, 11.320503234863281, 12.987637519836426, 14.65477180480957, 16.3219051361084, 17.98904037475586, 19.656173706054688, 21.323307037353516, 22.990442276000977, 24.657575607299805, 26.324710845947266, 27.991844177246094, 29.658979415893555, 31.326112747192383, 32.993247985839844, 34.66038131713867, 36.3275146484375, 37.99464797973633, 39.661781311035156, 41.32891845703125, 42.99605178833008, 44.663185119628906, 46.330318450927734, 47.99745178222656, 49.664588928222656]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 12.0, 4.0, 12.0, 15.0, 23.0, 11.0, 25.0, 15.0, 29.0, 27.0, 35.0, 26.0, 38.0, 41.0, 40.0, 42.0, 43.0, 37.0, 45.0, 41.0, 34.0, 41.0, 42.0, 28.0, 40.0, 40.0, 25.0, 21.0, 14.0, 29.0, 26.0, 11.0, 17.0, 15.0, 12.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.05377197265625, -6.8067626953125, -6.55975341796875, -6.312744140625, -6.06573486328125, -5.8187255859375, -5.57171630859375, -5.32470703125, -5.07769775390625, -4.8306884765625, -4.58367919921875, -4.336669921875, -4.08966064453125, -3.8426513671875, -3.59564208984375, -3.3486328125, -3.10162353515625, -2.8546142578125, -2.60760498046875, -2.360595703125, -2.11358642578125, -1.8665771484375, -1.61956787109375, -1.37255859375, -1.12554931640625, -0.8785400390625, -0.63153076171875, -0.384521484375, -0.13751220703125, 0.1094970703125, 0.35650634765625, 0.603515625, 0.85052490234375, 1.0975341796875, 1.34454345703125, 1.591552734375, 1.83856201171875, 2.0855712890625, 2.33258056640625, 2.57958984375, 2.82659912109375, 3.0736083984375, 3.32061767578125, 3.567626953125, 3.81463623046875, 4.0616455078125, 4.30865478515625, 4.5556640625, 4.80267333984375, 5.0496826171875, 5.29669189453125, 5.543701171875, 5.79071044921875, 6.0377197265625, 6.28472900390625, 6.53173828125, 6.77874755859375, 7.0257568359375, 7.27276611328125, 7.519775390625, 7.76678466796875, 8.0137939453125, 8.26080322265625, 8.5078125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 15.0, 18.0, 35.0, 42.0, 96.0, 104.0, 190.0, 242.0, 424.0, 659.0, 1034.0, 1601.0, 2430.0, 3674.0, 5921.0, 8908.0, 13730.0, 20493.0, 30385.0, 43910.0, 61222.0, 82561.0, 103755.0, 119656.0, 122864.0, 110512.0, 90244.0, 69182.0, 49876.0, 35093.0, 23868.0, 16004.0, 10349.0, 6863.0, 4548.0, 2898.0, 1776.0, 1267.0, 770.0, 481.0, 314.0, 195.0, 115.0, 77.0, 58.0, 37.0, 17.0, 9.0, 12.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.103515625, -1.0692291259765625, -1.034942626953125, -1.0006561279296875, -0.96636962890625, -0.9320831298828125, -0.897796630859375, -0.8635101318359375, -0.8292236328125, -0.7949371337890625, -0.760650634765625, -0.7263641357421875, -0.69207763671875, -0.6577911376953125, -0.623504638671875, -0.5892181396484375, -0.554931640625, -0.5206451416015625, -0.486358642578125, -0.4520721435546875, -0.41778564453125, -0.3834991455078125, -0.349212646484375, -0.3149261474609375, -0.2806396484375, -0.2463531494140625, -0.212066650390625, -0.1777801513671875, -0.14349365234375, -0.1092071533203125, -0.074920654296875, -0.0406341552734375, -0.00634765625, 0.0279388427734375, 0.062225341796875, 0.0965118408203125, 0.13079833984375, 0.1650848388671875, 0.199371337890625, 0.2336578369140625, 0.2679443359375, 0.3022308349609375, 0.336517333984375, 0.3708038330078125, 0.40509033203125, 0.4393768310546875, 0.473663330078125, 0.5079498291015625, 0.542236328125, 0.5765228271484375, 0.610809326171875, 0.6450958251953125, 0.67938232421875, 0.7136688232421875, 0.747955322265625, 0.7822418212890625, 0.8165283203125, 0.8508148193359375, 0.885101318359375, 0.9193878173828125, 0.95367431640625, 0.9879608154296875, 1.022247314453125, 1.0565338134765625, 1.0908203125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 12.0, 18.0, 19.0, 17.0, 12.0, 17.0, 23.0, 19.0, 42.0, 31.0, 32.0, 30.0, 32.0, 40.0, 52.0, 43.0, 1077.0, 44.0, 50.0, 43.0, 37.0, 47.0, 40.0, 23.0, 31.0, 28.0, 28.0, 20.0, 20.0, 15.0, 18.0, 11.0, 9.0, 12.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.24310302734375, -5.0604248046875, -4.87774658203125, -4.695068359375, -4.51239013671875, -4.3297119140625, -4.14703369140625, -3.96435546875, -3.78167724609375, -3.5989990234375, -3.41632080078125, -3.233642578125, -3.05096435546875, -2.8682861328125, -2.68560791015625, -2.5029296875, -2.32025146484375, -2.1375732421875, -1.95489501953125, -1.772216796875, -1.58953857421875, -1.4068603515625, -1.22418212890625, -1.04150390625, -0.85882568359375, -0.6761474609375, -0.49346923828125, -0.310791015625, -0.12811279296875, 0.0545654296875, 0.23724365234375, 0.419921875, 0.60260009765625, 0.7852783203125, 0.96795654296875, 1.150634765625, 1.33331298828125, 1.5159912109375, 1.69866943359375, 1.88134765625, 2.06402587890625, 2.2467041015625, 2.42938232421875, 2.612060546875, 2.79473876953125, 2.9774169921875, 3.16009521484375, 3.3427734375, 3.52545166015625, 3.7081298828125, 3.89080810546875, 4.073486328125, 4.25616455078125, 4.4388427734375, 4.62152099609375, 4.80419921875, 4.98687744140625, 5.1695556640625, 5.35223388671875, 5.534912109375, 5.71759033203125, 5.9002685546875, 6.08294677734375, 6.265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 16.0, 23.0, 34.0, 60.0, 94.0, 128.0, 176.0, 249.0, 370.0, 586.0, 858.0, 1251.0, 1947.0, 2840.0, 4175.0, 6258.0, 9090.0, 13541.0, 20814.0, 32193.0, 1790339.0, 126080.0, 28813.0, 18668.0, 12513.0, 8508.0, 5732.0, 3881.0, 2578.0, 1746.0, 1193.0, 774.0, 526.0, 354.0, 249.0, 156.0, 115.0, 67.0, 53.0, 25.0, 18.0, 12.0, 11.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.310546875, -2.24432373046875, -2.1781005859375, -2.11187744140625, -2.045654296875, -1.97943115234375, -1.9132080078125, -1.84698486328125, -1.78076171875, -1.71453857421875, -1.6483154296875, -1.58209228515625, -1.515869140625, -1.44964599609375, -1.3834228515625, -1.31719970703125, -1.2509765625, -1.18475341796875, -1.1185302734375, -1.05230712890625, -0.986083984375, -0.91986083984375, -0.8536376953125, -0.78741455078125, -0.72119140625, -0.65496826171875, -0.5887451171875, -0.52252197265625, -0.456298828125, -0.39007568359375, -0.3238525390625, -0.25762939453125, -0.19140625, -0.12518310546875, -0.0589599609375, 0.00726318359375, 0.073486328125, 0.13970947265625, 0.2059326171875, 0.27215576171875, 0.33837890625, 0.40460205078125, 0.4708251953125, 0.53704833984375, 0.603271484375, 0.66949462890625, 0.7357177734375, 0.80194091796875, 0.8681640625, 0.93438720703125, 1.0006103515625, 1.06683349609375, 1.133056640625, 1.19927978515625, 1.2655029296875, 1.33172607421875, 1.39794921875, 1.46417236328125, 1.5303955078125, 1.59661865234375, 1.662841796875, 1.72906494140625, 1.7952880859375, 1.86151123046875, 1.927734375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 6.0, 7.0, 8.0, 5.0, 8.0, 12.0, 6.0, 14.0, 15.0, 16.0, 19.0, 33.0, 37.0, 46.0, 86.0, 88.0, 109.0, 105.0, 80.0, 70.0, 32.0, 36.0, 21.0, 29.0, 22.0, 17.0, 16.0, 7.0, 6.0, 11.0, 6.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0924072265625, -0.08949947357177734, -0.08659172058105469, -0.08368396759033203, -0.08077621459960938, -0.07786846160888672, -0.07496070861816406, -0.0720529556274414, -0.06914520263671875, -0.0662374496459961, -0.06332969665527344, -0.06042194366455078, -0.057514190673828125, -0.05460643768310547, -0.05169868469238281, -0.048790931701660156, -0.0458831787109375, -0.042975425720214844, -0.04006767272949219, -0.03715991973876953, -0.034252166748046875, -0.03134441375732422, -0.028436660766601562, -0.025528907775878906, -0.02262115478515625, -0.019713401794433594, -0.016805648803710938, -0.013897895812988281, -0.010990142822265625, -0.008082389831542969, -0.0051746368408203125, -0.0022668838500976562, 0.000640869140625, 0.0035486221313476562, 0.0064563751220703125, 0.009364128112792969, 0.012271881103515625, 0.015179634094238281, 0.018087387084960938, 0.020995140075683594, 0.02390289306640625, 0.026810646057128906, 0.029718399047851562, 0.03262615203857422, 0.035533905029296875, 0.03844165802001953, 0.04134941101074219, 0.044257164001464844, 0.0471649169921875, 0.050072669982910156, 0.05298042297363281, 0.05588817596435547, 0.058795928955078125, 0.06170368194580078, 0.06461143493652344, 0.0675191879272461, 0.07042694091796875, 0.0733346939086914, 0.07624244689941406, 0.07915019989013672, 0.08205795288085938, 0.08496570587158203, 0.08787345886230469, 0.09078121185302734, 0.09368896484375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 6.0, 10.0, 7.0, 10.0, 8.0, 18.0, 20.0, 22.0, 28.0, 32.0, 45.0, 67.0, 148.0, 333.0, 1666.0, 84939.0, 956359.0, 3755.0, 562.0, 172.0, 77.0, 64.0, 35.0, 33.0, 20.0, 12.0, 10.0, 17.0, 11.0, 8.0, 7.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.9248046875, -1.864990234375, -1.80517578125, -1.745361328125, -1.685546875, -1.625732421875, -1.56591796875, -1.506103515625, -1.4462890625, -1.386474609375, -1.32666015625, -1.266845703125, -1.20703125, -1.147216796875, -1.08740234375, -1.027587890625, -0.9677734375, -0.907958984375, -0.84814453125, -0.788330078125, -0.728515625, -0.668701171875, -0.60888671875, -0.549072265625, -0.4892578125, -0.429443359375, -0.36962890625, -0.309814453125, -0.25, -0.190185546875, -0.13037109375, -0.070556640625, -0.0107421875, 0.049072265625, 0.10888671875, 0.168701171875, 0.228515625, 0.288330078125, 0.34814453125, 0.407958984375, 0.4677734375, 0.527587890625, 0.58740234375, 0.647216796875, 0.70703125, 0.766845703125, 0.82666015625, 0.886474609375, 0.9462890625, 1.006103515625, 1.06591796875, 1.125732421875, 1.185546875, 1.245361328125, 1.30517578125, 1.364990234375, 1.4248046875, 1.484619140625, 1.54443359375, 1.604248046875, 1.6640625, 1.723876953125, 1.78369140625, 1.843505859375, 1.9033203125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 25.0, 158.0, 612.0, 172.0, 30.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1989675760269165, -1.1694070100784302, -1.1398464441299438, -1.1102858781814575, -1.0807251930236816, -1.0511646270751953, -1.021604061126709, -0.9920434951782227, -0.9624829292297363, -0.93292236328125, -0.9033617973327637, -0.8738011717796326, -0.8442406058311462, -0.8146800398826599, -0.7851194143295288, -0.7555588483810425, -0.7259982824325562, -0.6964377164840698, -0.6668771505355835, -0.6373165249824524, -0.6077559590339661, -0.5781953930854797, -0.5486347675323486, -0.5190742015838623, -0.489513635635376, -0.45995306968688965, -0.43039247393608093, -0.4008318781852722, -0.3712713122367859, -0.34171074628829956, -0.31215015053749084, -0.28258955478668213, -0.253028929233551, -0.2234683483839035, -0.19390776753425598, -0.16434718668460846, -0.13478660583496094, -0.10522602498531342, -0.0756654441356659, -0.04610486328601837, -0.01654428243637085, 0.013016298413276672, 0.042576879262924194, 0.07213746011257172, 0.10169804096221924, 0.13125862181186676, 0.16081920266151428, 0.1903797835111618, 0.21994036436080933, 0.24950094521045685, 0.27906152606010437, 0.3086221218109131, 0.3381826877593994, 0.36774325370788574, 0.39730384945869446, 0.4268644452095032, 0.4564250111579895, 0.48598557710647583, 0.5155462026596069, 0.5451067686080933, 0.5746673345565796, 0.6042279005050659, 0.6337884664535522, 0.6633490920066833, 0.6929096579551697]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 4.0, 8.0, 4.0, 10.0, 15.0, 7.0, 19.0, 15.0, 10.0, 18.0, 24.0, 24.0, 28.0, 25.0, 37.0, 36.0, 41.0, 40.0, 24.0, 43.0, 40.0, 35.0, 38.0, 42.0, 27.0, 33.0, 45.0, 38.0, 37.0, 31.0, 24.0, 27.0, 26.0, 15.0, 10.0, 11.0, 22.0, 10.0, 15.0, 9.0, 4.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.16788947582244873, -0.16277065873146057, -0.1576518416404724, -0.15253302454948425, -0.1474142074584961, -0.14229537546634674, -0.13717655837535858, -0.13205774128437042, -0.12693892419338226, -0.1218201071023941, -0.11670129001140594, -0.11158246546983719, -0.10646364837884903, -0.10134483128786087, -0.09622600674629211, -0.09110718965530396, -0.0859883725643158, -0.08086955547332764, -0.07575073838233948, -0.07063191384077072, -0.06551309674978256, -0.0603942796587944, -0.055275458842515945, -0.05015663802623749, -0.04503782093524933, -0.03991900384426117, -0.03480018302798271, -0.029681364074349403, -0.024562545120716095, -0.019443726167082787, -0.014324907213449478, -0.00920608639717102, -0.004087269306182861, 0.001031549647450447, 0.0061503686010837555, 0.011269187554717064, 0.016388006508350372, 0.02150682546198368, 0.02662564441561699, 0.03174446523189545, 0.036863282322883606, 0.041982099413871765, 0.04710092023015022, 0.05221974104642868, 0.05733855813741684, 0.062457375228405, 0.06757619976997375, 0.07269501686096191, 0.07781383395195007, 0.08293265104293823, 0.08805146813392639, 0.09317029267549515, 0.0982891097664833, 0.10340792685747147, 0.10852675139904022, 0.11364556849002838, 0.11876438558101654, 0.1238832026720047, 0.12900201976299286, 0.13412083685398102, 0.13923966884613037, 0.14435848593711853, 0.1494773030281067, 0.15459612011909485, 0.159714937210083]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 1.0, 5.0, 7.0, 8.0, 7.0, 12.0, 11.0, 15.0, 20.0, 21.0, 23.0, 21.0, 25.0, 23.0, 21.0, 36.0, 37.0, 33.0, 38.0, 32.0, 45.0, 42.0, 41.0, 38.0, 32.0, 51.0, 33.0, 33.0, 27.0, 41.0, 28.0, 25.0, 18.0, 25.0, 19.0, 13.0, 13.0, 12.0, 12.0, 12.0, 10.0, 7.0, 6.0, 3.0, 6.0, 6.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55078125, -6.32122802734375, -6.0916748046875, -5.86212158203125, -5.632568359375, -5.40301513671875, -5.1734619140625, -4.94390869140625, -4.71435546875, -4.48480224609375, -4.2552490234375, -4.02569580078125, -3.796142578125, -3.56658935546875, -3.3370361328125, -3.10748291015625, -2.8779296875, -2.64837646484375, -2.4188232421875, -2.18927001953125, -1.959716796875, -1.73016357421875, -1.5006103515625, -1.27105712890625, -1.04150390625, -0.81195068359375, -0.5823974609375, -0.35284423828125, -0.123291015625, 0.10626220703125, 0.3358154296875, 0.56536865234375, 0.794921875, 1.02447509765625, 1.2540283203125, 1.48358154296875, 1.713134765625, 1.94268798828125, 2.1722412109375, 2.40179443359375, 2.63134765625, 2.86090087890625, 3.0904541015625, 3.32000732421875, 3.549560546875, 3.77911376953125, 4.0086669921875, 4.23822021484375, 4.4677734375, 4.69732666015625, 4.9268798828125, 5.15643310546875, 5.385986328125, 5.61553955078125, 5.8450927734375, 6.07464599609375, 6.30419921875, 6.53375244140625, 6.7633056640625, 6.99285888671875, 7.222412109375, 7.45196533203125, 7.6815185546875, 7.91107177734375, 8.140625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 3.0, 8.0, 8.0, 19.0, 11.0, 9.0, 23.0, 24.0, 40.0, 65.0, 94.0, 142.0, 198.0, 419.0, 741.0, 1757.0, 4671.0, 12665.0, 34744.0, 96512.0, 270060.0, 387295.0, 151974.0, 54546.0, 20143.0, 7285.0, 2680.0, 1146.0, 512.0, 286.0, 142.0, 89.0, 64.0, 39.0, 26.0, 25.0, 11.0, 11.0, 14.0, 12.0, 9.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1484375, -9.8011474609375, -9.453857421875, -9.1065673828125, -8.75927734375, -8.4119873046875, -8.064697265625, -7.7174072265625, -7.3701171875, -7.0228271484375, -6.675537109375, -6.3282470703125, -5.98095703125, -5.6336669921875, -5.286376953125, -4.9390869140625, -4.591796875, -4.2445068359375, -3.897216796875, -3.5499267578125, -3.20263671875, -2.8553466796875, -2.508056640625, -2.1607666015625, -1.8134765625, -1.4661865234375, -1.118896484375, -0.7716064453125, -0.42431640625, -0.0770263671875, 0.270263671875, 0.6175537109375, 0.96484375, 1.3121337890625, 1.659423828125, 2.0067138671875, 2.35400390625, 2.7012939453125, 3.048583984375, 3.3958740234375, 3.7431640625, 4.0904541015625, 4.437744140625, 4.7850341796875, 5.13232421875, 5.4796142578125, 5.826904296875, 6.1741943359375, 6.521484375, 6.8687744140625, 7.216064453125, 7.5633544921875, 7.91064453125, 8.2579345703125, 8.605224609375, 8.9525146484375, 9.2998046875, 9.6470947265625, 9.994384765625, 10.3416748046875, 10.68896484375, 11.0362548828125, 11.383544921875, 11.7308349609375, 12.078125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 13.0, 7.0, 13.0, 20.0, 16.0, 19.0, 24.0, 32.0, 37.0, 36.0, 42.0, 58.0, 68.0, 78.0, 164.0, 1403.0, 373.0, 170.0, 105.0, 55.0, 41.0, 43.0, 37.0, 33.0, 22.0, 26.0, 15.0, 20.0, 13.0, 8.0, 7.0, 4.0, 12.0, 8.0, 3.0, 3.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.65869140625, -21.7861328125, -20.91357421875, -20.041015625, -19.16845703125, -18.2958984375, -17.42333984375, -16.55078125, -15.67822265625, -14.8056640625, -13.93310546875, -13.060546875, -12.18798828125, -11.3154296875, -10.44287109375, -9.5703125, -8.69775390625, -7.8251953125, -6.95263671875, -6.080078125, -5.20751953125, -4.3349609375, -3.46240234375, -2.58984375, -1.71728515625, -0.8447265625, 0.02783203125, 0.900390625, 1.77294921875, 2.6455078125, 3.51806640625, 4.390625, 5.26318359375, 6.1357421875, 7.00830078125, 7.880859375, 8.75341796875, 9.6259765625, 10.49853515625, 11.37109375, 12.24365234375, 13.1162109375, 13.98876953125, 14.861328125, 15.73388671875, 16.6064453125, 17.47900390625, 18.3515625, 19.22412109375, 20.0966796875, 20.96923828125, 21.841796875, 22.71435546875, 23.5869140625, 24.45947265625, 25.33203125, 26.20458984375, 27.0771484375, 27.94970703125, 28.822265625, 29.69482421875, 30.5673828125, 31.43994140625, 32.3125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 7.0, 12.0, 6.0, 7.0, 14.0, 14.0, 21.0, 35.0, 44.0, 41.0, 66.0, 73.0, 100.0, 171.0, 228.0, 511.0, 1769.0, 33249.0, 2956175.0, 148459.0, 3044.0, 675.0, 284.0, 192.0, 100.0, 100.0, 70.0, 49.0, 40.0, 26.0, 24.0, 23.0, 16.0, 14.0, 8.0, 6.0, 7.0, 5.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0], "bins": [-70.6875, -68.8095703125, -66.931640625, -65.0537109375, -63.17578125, -61.2978515625, -59.419921875, -57.5419921875, -55.6640625, -53.7861328125, -51.908203125, -50.0302734375, -48.15234375, -46.2744140625, -44.396484375, -42.5185546875, -40.640625, -38.7626953125, -36.884765625, -35.0068359375, -33.12890625, -31.2509765625, -29.373046875, -27.4951171875, -25.6171875, -23.7392578125, -21.861328125, -19.9833984375, -18.10546875, -16.2275390625, -14.349609375, -12.4716796875, -10.59375, -8.7158203125, -6.837890625, -4.9599609375, -3.08203125, -1.2041015625, 0.673828125, 2.5517578125, 4.4296875, 6.3076171875, 8.185546875, 10.0634765625, 11.94140625, 13.8193359375, 15.697265625, 17.5751953125, 19.453125, 21.3310546875, 23.208984375, 25.0869140625, 26.96484375, 28.8427734375, 30.720703125, 32.5986328125, 34.4765625, 36.3544921875, 38.232421875, 40.1103515625, 41.98828125, 43.8662109375, 45.744140625, 47.6220703125, 49.5]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 13.0, 27.0, 90.0, 152.0, 209.0, 219.0, 171.0, 95.0, 25.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.057279586791992, -27.76311492919922, -25.468950271606445, -23.174785614013672, -20.880619049072266, -18.586456298828125, -16.29228973388672, -13.998125076293945, -11.703960418701172, -9.409795761108398, -7.115630626678467, -4.821465492248535, -2.5273008346557617, -0.23313617706298828, 2.0610294342041016, 4.355194091796875, 6.649358749389648, 8.943523406982422, 11.237688064575195, 13.531853675842285, 15.826018333435059, 18.120182037353516, 20.414348602294922, 22.708513259887695, 25.00267791748047, 27.296842575073242, 29.591007232666016, 31.885173797607422, 34.17933654785156, 36.47350311279297, 38.767669677734375, 41.061832427978516, 43.355995178222656, 45.65016174316406, 47.9443244934082, 50.23849105834961, 52.53265380859375, 54.826820373535156, 57.12098693847656, 59.4151496887207, 61.709312438964844, 64.00347900390625, 66.29764556884766, 68.59180450439453, 70.88597106933594, 73.18013763427734, 75.47430419921875, 77.76846313476562, 80.06263732910156, 82.35680389404297, 84.65097045898438, 86.94512939453125, 89.23929595947266, 91.53346252441406, 93.82762908935547, 96.12179565429688, 98.41595458984375, 100.71012115478516, 103.00428771972656, 105.29844665527344, 107.59261322021484, 109.88677978515625, 112.18094635009766, 114.47511291503906, 116.76927185058594]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 11.0, 10.0, 18.0, 13.0, 15.0, 18.0, 21.0, 26.0, 27.0, 23.0, 27.0, 49.0, 39.0, 27.0, 50.0, 39.0, 45.0, 44.0, 40.0, 42.0, 34.0, 22.0, 34.0, 20.0, 26.0, 30.0, 36.0, 25.0, 18.0, 20.0, 21.0, 23.0, 16.0, 11.0, 12.0, 8.0, 7.0, 4.0, 4.0, 9.0, 7.0, 3.0, 6.0, 4.0, 2.0], "bins": [-73.72003173828125, -71.75405883789062, -69.78807830810547, -67.82209777832031, -65.85612487792969, -63.8901481628418, -61.924171447753906, -59.958194732666016, -57.992218017578125, -56.026241302490234, -54.060264587402344, -52.09428787231445, -50.12831115722656, -48.16233444213867, -46.19635772705078, -44.23038101196289, -42.264404296875, -40.29842758178711, -38.33245086669922, -36.36647415161133, -34.40049743652344, -32.43452072143555, -30.468544006347656, -28.502567291259766, -26.536590576171875, -24.570613861083984, -22.604637145996094, -20.638660430908203, -18.672683715820312, -16.706707000732422, -14.740730285644531, -12.77475357055664, -10.80877685546875, -8.84280014038086, -6.876823425292969, -4.910846710205078, -2.9448699951171875, -0.9788932800292969, 0.9870834350585938, 2.9530601501464844, 4.919036865234375, 6.885013580322266, 8.850990295410156, 10.816967010498047, 12.782943725585938, 14.748920440673828, 16.71489715576172, 18.68087387084961, 20.6468505859375, 22.61282730102539, 24.57880401611328, 26.544780731201172, 28.510757446289062, 30.476734161376953, 32.442710876464844, 34.408687591552734, 36.374664306640625, 38.340641021728516, 40.306617736816406, 42.2725944519043, 44.23857116699219, 46.20454788208008, 48.17052459716797, 50.13650131225586, 52.10247802734375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 6.0, 5.0, 6.0, 13.0, 9.0, 22.0, 12.0, 25.0, 21.0, 23.0, 24.0, 28.0, 27.0, 44.0, 32.0, 47.0, 47.0, 52.0, 57.0, 40.0, 49.0, 50.0, 39.0, 42.0, 43.0, 36.0, 35.0, 27.0, 23.0, 20.0, 18.0, 13.0, 16.0, 12.0, 9.0, 7.0, 3.0, 1.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4296875, -9.127685546875, -8.82568359375, -8.523681640625, -8.2216796875, -7.919677734375, -7.61767578125, -7.315673828125, -7.013671875, -6.711669921875, -6.40966796875, -6.107666015625, -5.8056640625, -5.503662109375, -5.20166015625, -4.899658203125, -4.59765625, -4.295654296875, -3.99365234375, -3.691650390625, -3.3896484375, -3.087646484375, -2.78564453125, -2.483642578125, -2.181640625, -1.879638671875, -1.57763671875, -1.275634765625, -0.9736328125, -0.671630859375, -0.36962890625, -0.067626953125, 0.234375, 0.536376953125, 0.83837890625, 1.140380859375, 1.4423828125, 1.744384765625, 2.04638671875, 2.348388671875, 2.650390625, 2.952392578125, 3.25439453125, 3.556396484375, 3.8583984375, 4.160400390625, 4.46240234375, 4.764404296875, 5.06640625, 5.368408203125, 5.67041015625, 5.972412109375, 6.2744140625, 6.576416015625, 6.87841796875, 7.180419921875, 7.482421875, 7.784423828125, 8.08642578125, 8.388427734375, 8.6904296875, 8.992431640625, 9.29443359375, 9.596435546875, 9.8984375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 5.0, 7.0, 7.0, 9.0, 19.0, 16.0, 26.0, 47.0, 65.0, 94.0, 116.0, 195.0, 312.0, 643.0, 1228.0, 2767.0, 6994.0, 19030.0, 57596.0, 170248.0, 466360.0, 1014544.0, 1259979.0, 740211.0, 296648.0, 102742.0, 34162.0, 11754.0, 4554.0, 1878.0, 832.0, 430.0, 236.0, 147.0, 106.0, 71.0, 58.0, 32.0, 29.0, 21.0, 19.0, 8.0, 8.0, 14.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.3095703125, -9.001953125, -8.6943359375, -8.38671875, -8.0791015625, -7.771484375, -7.4638671875, -7.15625, -6.8486328125, -6.541015625, -6.2333984375, -5.92578125, -5.6181640625, -5.310546875, -5.0029296875, -4.6953125, -4.3876953125, -4.080078125, -3.7724609375, -3.46484375, -3.1572265625, -2.849609375, -2.5419921875, -2.234375, -1.9267578125, -1.619140625, -1.3115234375, -1.00390625, -0.6962890625, -0.388671875, -0.0810546875, 0.2265625, 0.5341796875, 0.841796875, 1.1494140625, 1.45703125, 1.7646484375, 2.072265625, 2.3798828125, 2.6875, 2.9951171875, 3.302734375, 3.6103515625, 3.91796875, 4.2255859375, 4.533203125, 4.8408203125, 5.1484375, 5.4560546875, 5.763671875, 6.0712890625, 6.37890625, 6.6865234375, 6.994140625, 7.3017578125, 7.609375, 7.9169921875, 8.224609375, 8.5322265625, 8.83984375, 9.1474609375, 9.455078125, 9.7626953125, 10.0703125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 6.0, 10.0, 8.0, 12.0, 10.0, 18.0, 26.0, 25.0, 42.0, 70.0, 95.0, 116.0, 152.0, 228.0, 280.0, 335.0, 359.0, 407.0, 407.0, 312.0, 270.0, 220.0, 163.0, 135.0, 91.0, 69.0, 64.0, 42.0, 27.0, 23.0, 15.0, 11.0, 10.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.421875, -12.94970703125, -12.4775390625, -12.00537109375, -11.533203125, -11.06103515625, -10.5888671875, -10.11669921875, -9.64453125, -9.17236328125, -8.7001953125, -8.22802734375, -7.755859375, -7.28369140625, -6.8115234375, -6.33935546875, -5.8671875, -5.39501953125, -4.9228515625, -4.45068359375, -3.978515625, -3.50634765625, -3.0341796875, -2.56201171875, -2.08984375, -1.61767578125, -1.1455078125, -0.67333984375, -0.201171875, 0.27099609375, 0.7431640625, 1.21533203125, 1.6875, 2.15966796875, 2.6318359375, 3.10400390625, 3.576171875, 4.04833984375, 4.5205078125, 4.99267578125, 5.46484375, 5.93701171875, 6.4091796875, 6.88134765625, 7.353515625, 7.82568359375, 8.2978515625, 8.77001953125, 9.2421875, 9.71435546875, 10.1865234375, 10.65869140625, 11.130859375, 11.60302734375, 12.0751953125, 12.54736328125, 13.01953125, 13.49169921875, 13.9638671875, 14.43603515625, 14.908203125, 15.38037109375, 15.8525390625, 16.32470703125, 16.796875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 10.0, 19.0, 17.0, 38.0, 54.0, 87.0, 122.0, 205.0, 349.0, 622.0, 1330.0, 10641.0, 2337511.0, 1832093.0, 8441.0, 1313.0, 615.0, 307.0, 182.0, 115.0, 65.0, 38.0, 32.0, 14.0, 15.0, 9.0, 13.0, 4.0, 1.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.0, -61.93359375, -59.8671875, -57.80078125, -55.734375, -53.66796875, -51.6015625, -49.53515625, -47.46875, -45.40234375, -43.3359375, -41.26953125, -39.203125, -37.13671875, -35.0703125, -33.00390625, -30.9375, -28.87109375, -26.8046875, -24.73828125, -22.671875, -20.60546875, -18.5390625, -16.47265625, -14.40625, -12.33984375, -10.2734375, -8.20703125, -6.140625, -4.07421875, -2.0078125, 0.05859375, 2.125, 4.19140625, 6.2578125, 8.32421875, 10.390625, 12.45703125, 14.5234375, 16.58984375, 18.65625, 20.72265625, 22.7890625, 24.85546875, 26.921875, 28.98828125, 31.0546875, 33.12109375, 35.1875, 37.25390625, 39.3203125, 41.38671875, 43.453125, 45.51953125, 47.5859375, 49.65234375, 51.71875, 53.78515625, 55.8515625, 57.91796875, 59.984375, 62.05078125, 64.1171875, 66.18359375, 68.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 12.0, 88.0, 182.0, 292.0, 266.0, 126.0, 38.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.66017150878906, -188.87657165527344, -183.0929718017578, -177.3093719482422, -171.5257568359375, -165.74215698242188, -159.95855712890625, -154.17495727539062, -148.391357421875, -142.60775756835938, -136.82415771484375, -131.04055786132812, -125.25695037841797, -119.47335052490234, -113.68974304199219, -107.90614318847656, -102.12254333496094, -96.33894348144531, -90.55534362792969, -84.77173614501953, -78.9881362915039, -73.20453643798828, -67.42092895507812, -61.6373291015625, -55.853729248046875, -50.07012939453125, -44.28652572631836, -38.50292205810547, -32.719322204589844, -26.935720443725586, -21.152118682861328, -15.368515014648438, -9.58489990234375, -3.801298141479492, 1.9823036193847656, 7.765905380249023, 13.549507141113281, 19.33310890197754, 25.116710662841797, 30.900314331054688, 36.68391418457031, 42.46751403808594, 48.25111770629883, 54.03472137451172, 59.818321228027344, 65.60192108154297, 71.38552856445312, 77.16912841796875, 82.95272827148438, 88.736328125, 94.51992797851562, 100.30353546142578, 106.0871353149414, 111.87073516845703, 117.65434265136719, 123.43794250488281, 129.22154235839844, 135.00514221191406, 140.7887420654297, 146.5723419189453, 152.35595703125, 158.13955688476562, 163.92315673828125, 169.70675659179688, 175.4903564453125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 7.0, 3.0, 8.0, 16.0, 15.0, 20.0, 25.0, 25.0, 16.0, 33.0, 33.0, 37.0, 32.0, 38.0, 41.0, 44.0, 37.0, 40.0, 46.0, 42.0, 37.0, 49.0, 33.0, 48.0, 33.0, 31.0, 26.0, 23.0, 24.0, 22.0, 11.0, 10.0, 19.0, 11.0, 17.0, 10.0, 13.0, 6.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-59.246925354003906, -57.48983383178711, -55.73273849487305, -53.97564697265625, -52.21855545043945, -50.46146011352539, -48.704368591308594, -46.94727325439453, -45.190181732177734, -43.43309020996094, -41.675994873046875, -39.91890335083008, -38.16181182861328, -36.40471649169922, -34.64762496948242, -32.890533447265625, -31.133440017700195, -29.376346588134766, -27.61925506591797, -25.86216163635254, -24.10506820678711, -22.347976684570312, -20.590883255004883, -18.833789825439453, -17.076698303222656, -15.319605827331543, -13.562512397766113, -11.805419921875, -10.04832649230957, -8.291234016418457, -6.534141540527344, -4.777048110961914, -3.0199546813964844, -1.2628618478775024, 0.4942309856414795, 2.251323699951172, 4.008416652679443, 5.765509605407715, 7.522602081298828, 9.279695510864258, 11.036787986755371, 12.793880462646484, 14.550973892211914, 16.308067321777344, 18.06515884399414, 19.82225227355957, 21.579345703125, 23.336437225341797, 25.093530654907227, 26.850624084472656, 28.607715606689453, 30.364809036254883, 32.12190246582031, 33.87899398803711, 35.636085510253906, 37.39318084716797, 39.150272369384766, 40.90736389160156, 42.664459228515625, 44.42155075073242, 46.17864227294922, 47.93573760986328, 49.69282913208008, 51.449920654296875, 53.20701599121094]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 7.0, 3.0, 5.0, 20.0, 17.0, 21.0, 24.0, 30.0, 30.0, 35.0, 28.0, 39.0, 43.0, 38.0, 47.0, 46.0, 47.0, 41.0, 39.0, 54.0, 41.0, 54.0, 39.0, 27.0, 35.0, 21.0, 24.0, 18.0, 18.0, 15.0, 14.0, 11.0, 16.0, 11.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.546875, -8.27099609375, -7.9951171875, -7.71923828125, -7.443359375, -7.16748046875, -6.8916015625, -6.61572265625, -6.33984375, -6.06396484375, -5.7880859375, -5.51220703125, -5.236328125, -4.96044921875, -4.6845703125, -4.40869140625, -4.1328125, -3.85693359375, -3.5810546875, -3.30517578125, -3.029296875, -2.75341796875, -2.4775390625, -2.20166015625, -1.92578125, -1.64990234375, -1.3740234375, -1.09814453125, -0.822265625, -0.54638671875, -0.2705078125, 0.00537109375, 0.28125, 0.55712890625, 0.8330078125, 1.10888671875, 1.384765625, 1.66064453125, 1.9365234375, 2.21240234375, 2.48828125, 2.76416015625, 3.0400390625, 3.31591796875, 3.591796875, 3.86767578125, 4.1435546875, 4.41943359375, 4.6953125, 4.97119140625, 5.2470703125, 5.52294921875, 5.798828125, 6.07470703125, 6.3505859375, 6.62646484375, 6.90234375, 7.17822265625, 7.4541015625, 7.72998046875, 8.005859375, 8.28173828125, 8.5576171875, 8.83349609375, 9.109375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 12.0, 14.0, 31.0, 34.0, 63.0, 74.0, 112.0, 179.0, 313.0, 411.0, 664.0, 1072.0, 1644.0, 2675.0, 4349.0, 6681.0, 10443.0, 16556.0, 25567.0, 38381.0, 55928.0, 77044.0, 101149.0, 121160.0, 131178.0, 119133.0, 99636.0, 75540.0, 53633.0, 36685.0, 24379.0, 16088.0, 10184.0, 6479.0, 4227.0, 2501.0, 1626.0, 966.0, 626.0, 425.0, 251.0, 178.0, 92.0, 59.0, 35.0, 30.0, 16.0, 16.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.2685546875, -1.2317352294921875, -1.194915771484375, -1.1580963134765625, -1.12127685546875, -1.0844573974609375, -1.047637939453125, -1.0108184814453125, -0.9739990234375, -0.9371795654296875, -0.900360107421875, -0.8635406494140625, -0.82672119140625, -0.7899017333984375, -0.753082275390625, -0.7162628173828125, -0.679443359375, -0.6426239013671875, -0.605804443359375, -0.5689849853515625, -0.53216552734375, -0.4953460693359375, -0.458526611328125, -0.4217071533203125, -0.3848876953125, -0.3480682373046875, -0.311248779296875, -0.2744293212890625, -0.23760986328125, -0.2007904052734375, -0.163970947265625, -0.1271514892578125, -0.09033203125, -0.0535125732421875, -0.016693115234375, 0.0201263427734375, 0.05694580078125, 0.0937652587890625, 0.130584716796875, 0.1674041748046875, 0.2042236328125, 0.2410430908203125, 0.277862548828125, 0.3146820068359375, 0.35150146484375, 0.3883209228515625, 0.425140380859375, 0.4619598388671875, 0.498779296875, 0.5355987548828125, 0.572418212890625, 0.6092376708984375, 0.64605712890625, 0.6828765869140625, 0.719696044921875, 0.7565155029296875, 0.7933349609375, 0.8301544189453125, 0.866973876953125, 0.9037933349609375, 0.94061279296875, 0.9774322509765625, 1.014251708984375, 1.0510711669921875, 1.087890625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 8.0, 8.0, 3.0, 9.0, 14.0, 13.0, 17.0, 22.0, 17.0, 33.0, 21.0, 24.0, 31.0, 36.0, 39.0, 36.0, 42.0, 42.0, 48.0, 1074.0, 44.0, 44.0, 51.0, 30.0, 40.0, 33.0, 22.0, 22.0, 37.0, 28.0, 22.0, 19.0, 19.0, 14.0, 14.0, 9.0, 7.0, 9.0, 2.0, 8.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.83984375, -5.65838623046875, -5.4769287109375, -5.29547119140625, -5.114013671875, -4.93255615234375, -4.7510986328125, -4.56964111328125, -4.38818359375, -4.20672607421875, -4.0252685546875, -3.84381103515625, -3.662353515625, -3.48089599609375, -3.2994384765625, -3.11798095703125, -2.9365234375, -2.75506591796875, -2.5736083984375, -2.39215087890625, -2.210693359375, -2.02923583984375, -1.8477783203125, -1.66632080078125, -1.48486328125, -1.30340576171875, -1.1219482421875, -0.94049072265625, -0.759033203125, -0.57757568359375, -0.3961181640625, -0.21466064453125, -0.033203125, 0.14825439453125, 0.3297119140625, 0.51116943359375, 0.692626953125, 0.87408447265625, 1.0555419921875, 1.23699951171875, 1.41845703125, 1.59991455078125, 1.7813720703125, 1.96282958984375, 2.144287109375, 2.32574462890625, 2.5072021484375, 2.68865966796875, 2.8701171875, 3.05157470703125, 3.2330322265625, 3.41448974609375, 3.595947265625, 3.77740478515625, 3.9588623046875, 4.14031982421875, 4.32177734375, 4.50323486328125, 4.6846923828125, 4.86614990234375, 5.047607421875, 5.22906494140625, 5.4105224609375, 5.59197998046875, 5.7734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 10.0, 13.0, 30.0, 36.0, 43.0, 64.0, 86.0, 117.0, 180.0, 267.0, 376.0, 535.0, 702.0, 1098.0, 1546.0, 2055.0, 3065.0, 4374.0, 6050.0, 8539.0, 11968.0, 16743.0, 23985.0, 42324.0, 1857560.0, 36849.0, 23162.0, 15909.0, 11497.0, 8028.0, 5863.0, 4167.0, 2904.0, 2015.0, 1479.0, 1058.0, 707.0, 489.0, 400.0, 264.0, 171.0, 117.0, 91.0, 58.0, 42.0, 31.0, 29.0, 8.0, 9.0, 3.0, 7.0, 1.0, 2.0, 3.0, 4.0], "bins": [-1.990234375, -1.9307098388671875, -1.871185302734375, -1.8116607666015625, -1.75213623046875, -1.6926116943359375, -1.633087158203125, -1.5735626220703125, -1.5140380859375, -1.4545135498046875, -1.394989013671875, -1.3354644775390625, -1.27593994140625, -1.2164154052734375, -1.156890869140625, -1.0973663330078125, -1.037841796875, -0.9783172607421875, -0.918792724609375, -0.8592681884765625, -0.79974365234375, -0.7402191162109375, -0.680694580078125, -0.6211700439453125, -0.5616455078125, -0.5021209716796875, -0.442596435546875, -0.3830718994140625, -0.32354736328125, -0.2640228271484375, -0.204498291015625, -0.1449737548828125, -0.08544921875, -0.0259246826171875, 0.033599853515625, 0.0931243896484375, 0.15264892578125, 0.2121734619140625, 0.271697998046875, 0.3312225341796875, 0.3907470703125, 0.4502716064453125, 0.509796142578125, 0.5693206787109375, 0.62884521484375, 0.6883697509765625, 0.747894287109375, 0.8074188232421875, 0.866943359375, 0.9264678955078125, 0.985992431640625, 1.0455169677734375, 1.10504150390625, 1.1645660400390625, 1.224090576171875, 1.2836151123046875, 1.3431396484375, 1.4026641845703125, 1.462188720703125, 1.5217132568359375, 1.58123779296875, 1.6407623291015625, 1.700286865234375, 1.7598114013671875, 1.8193359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 14.0, 14.0, 15.0, 17.0, 26.0, 23.0, 35.0, 37.0, 39.0, 52.0, 49.0, 46.0, 71.0, 66.0, 62.0, 68.0, 54.0, 40.0, 34.0, 42.0, 32.0, 31.0, 26.0, 18.0, 14.0, 6.0, 5.0, 4.0, 9.0, 9.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053619384765625, -0.05199146270751953, -0.05036354064941406, -0.048735618591308594, -0.047107696533203125, -0.045479774475097656, -0.04385185241699219, -0.04222393035888672, -0.04059600830078125, -0.03896808624267578, -0.03734016418457031, -0.035712242126464844, -0.034084320068359375, -0.032456398010253906, -0.030828475952148438, -0.02920055389404297, -0.0275726318359375, -0.02594470977783203, -0.024316787719726562, -0.022688865661621094, -0.021060943603515625, -0.019433021545410156, -0.017805099487304688, -0.01617717742919922, -0.01454925537109375, -0.012921333312988281, -0.011293411254882812, -0.009665489196777344, -0.008037567138671875, -0.006409645080566406, -0.0047817230224609375, -0.0031538009643554688, -0.00152587890625, 0.00010204315185546875, 0.0017299652099609375, 0.0033578872680664062, 0.004985809326171875, 0.006613731384277344, 0.008241653442382812, 0.009869575500488281, 0.01149749755859375, 0.013125419616699219, 0.014753341674804688, 0.016381263732910156, 0.018009185791015625, 0.019637107849121094, 0.021265029907226562, 0.02289295196533203, 0.0245208740234375, 0.02614879608154297, 0.027776718139648438, 0.029404640197753906, 0.031032562255859375, 0.032660484313964844, 0.03428840637207031, 0.03591632843017578, 0.03754425048828125, 0.03917217254638672, 0.04080009460449219, 0.042428016662597656, 0.044055938720703125, 0.045683860778808594, 0.04731178283691406, 0.04893970489501953, 0.050567626953125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 7.0, 9.0, 1.0, 6.0, 14.0, 14.0, 23.0, 31.0, 54.0, 49.0, 69.0, 96.0, 159.0, 399.0, 1922.0, 231287.0, 810517.0, 2889.0, 450.0, 186.0, 103.0, 54.0, 47.0, 32.0, 28.0, 21.0, 16.0, 17.0, 7.0, 6.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.21734619140625, -1.1768798828125, -1.13641357421875, -1.095947265625, -1.05548095703125, -1.0150146484375, -0.97454833984375, -0.93408203125, -0.89361572265625, -0.8531494140625, -0.81268310546875, -0.772216796875, -0.73175048828125, -0.6912841796875, -0.65081787109375, -0.6103515625, -0.56988525390625, -0.5294189453125, -0.48895263671875, -0.448486328125, -0.40802001953125, -0.3675537109375, -0.32708740234375, -0.28662109375, -0.24615478515625, -0.2056884765625, -0.16522216796875, -0.124755859375, -0.08428955078125, -0.0438232421875, -0.00335693359375, 0.037109375, 0.07757568359375, 0.1180419921875, 0.15850830078125, 0.198974609375, 0.23944091796875, 0.2799072265625, 0.32037353515625, 0.36083984375, 0.40130615234375, 0.4417724609375, 0.48223876953125, 0.522705078125, 0.56317138671875, 0.6036376953125, 0.64410400390625, 0.6845703125, 0.72503662109375, 0.7655029296875, 0.80596923828125, 0.846435546875, 0.88690185546875, 0.9273681640625, 0.96783447265625, 1.00830078125, 1.04876708984375, 1.0892333984375, 1.12969970703125, 1.170166015625, 1.21063232421875, 1.2510986328125, 1.29156494140625, 1.33203125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 15.0, 43.0, 98.0, 199.0, 321.0, 203.0, 57.0, 32.0, 13.0, 11.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4161803424358368, -0.4082532227039337, -0.400326132774353, -0.39239901304244995, -0.3844718933105469, -0.3765448033809662, -0.3686176836490631, -0.3606905937194824, -0.35276347398757935, -0.34483635425567627, -0.3369092643260956, -0.3289821445941925, -0.3210550546646118, -0.31312793493270874, -0.30520081520080566, -0.297273725271225, -0.2893466055393219, -0.2814194858074188, -0.27349239587783813, -0.26556527614593506, -0.257638156414032, -0.2497110664844513, -0.24178394675254822, -0.23385684192180634, -0.22592973709106445, -0.21800263226032257, -0.2100755274295807, -0.2021484076976776, -0.19422130286693573, -0.18629419803619385, -0.17836707830429077, -0.1704399734735489, -0.1625128984451294, -0.1545857936143875, -0.14665868878364563, -0.13873156905174255, -0.13080446422100067, -0.12287735939025879, -0.11495024710893631, -0.10702313482761383, -0.09909602254629135, -0.09116891026496887, -0.08324180543422699, -0.07531470060348511, -0.06738758832216263, -0.05946047976613045, -0.05153337121009827, -0.043606262654066086, -0.035679154098033905, -0.027752045542001724, -0.019824936985969543, -0.011897828429937363, -0.003970719873905182, 0.003956388682126999, 0.01188349723815918, 0.01981060579419136, 0.02773771435022354, 0.03566482290625572, 0.0435919314622879, 0.051519040018320084, 0.059446148574352264, 0.06737326085567474, 0.07530036568641663, 0.08322747051715851, 0.09115458279848099]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 0.0, 4.0, 4.0, 9.0, 5.0, 5.0, 12.0, 12.0, 15.0, 14.0, 17.0, 18.0, 21.0, 31.0, 38.0, 40.0, 32.0, 59.0, 46.0, 38.0, 45.0, 56.0, 33.0, 41.0, 50.0, 49.0, 38.0, 33.0, 40.0, 28.0, 33.0, 28.0, 16.0, 20.0, 13.0, 15.0, 16.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.05021035671234131, -0.04884457588195801, -0.04747879505157471, -0.04611301049590111, -0.04474722966551781, -0.043381448835134506, -0.04201566427946091, -0.040649883449077606, -0.039284102618694305, -0.037918321788311005, -0.036552540957927704, -0.035186756402254105, -0.033820975571870804, -0.0324551947414875, -0.031089412048459053, -0.029723629355430603, -0.028357848525047302, -0.026992067694664, -0.02562628500163555, -0.0242605023086071, -0.0228947214782238, -0.0215289406478405, -0.02016315795481205, -0.0187973752617836, -0.0174315944314003, -0.016065813601017, -0.014700030907988548, -0.013334249146282673, -0.011968467384576797, -0.010602685622870922, -0.009236903861165047, -0.007871122099459171, -0.006505340337753296, -0.0051395585760474205, -0.003773776814341545, -0.0024079950526356697, -0.0010422132909297943, 0.0003235684707760811, 0.0016893502324819565, 0.003055131994187832, 0.004420913755893707, 0.005786695517599583, 0.007152477279305458, 0.008518259041011333, 0.009884040802717209, 0.011249822564423084, 0.01261560432612896, 0.013981386087834835, 0.01534716784954071, 0.01671294867992401, 0.01807873137295246, 0.01944451406598091, 0.020810294896364212, 0.022176075726747513, 0.023541858419775963, 0.024907641112804413, 0.026273421943187714, 0.027639202773571014, 0.029004985466599464, 0.030370768159627914, 0.031736548990011215, 0.033102329820394516, 0.034468114376068115, 0.035833895206451416, 0.03719967603683472]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 2.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 13.0, 11.0, 24.0, 25.0, 22.0, 27.0, 30.0, 27.0, 34.0, 30.0, 41.0, 38.0, 53.0, 38.0, 53.0, 49.0, 44.0, 47.0, 41.0, 30.0, 35.0, 34.0, 34.0, 25.0, 23.0, 27.0, 21.0, 10.0, 14.0, 16.0, 10.0, 10.0, 8.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.2578125, -7.990234375, -7.72265625, -7.455078125, -7.1875, -6.919921875, -6.65234375, -6.384765625, -6.1171875, -5.849609375, -5.58203125, -5.314453125, -5.046875, -4.779296875, -4.51171875, -4.244140625, -3.9765625, -3.708984375, -3.44140625, -3.173828125, -2.90625, -2.638671875, -2.37109375, -2.103515625, -1.8359375, -1.568359375, -1.30078125, -1.033203125, -0.765625, -0.498046875, -0.23046875, 0.037109375, 0.3046875, 0.572265625, 0.83984375, 1.107421875, 1.375, 1.642578125, 1.91015625, 2.177734375, 2.4453125, 2.712890625, 2.98046875, 3.248046875, 3.515625, 3.783203125, 4.05078125, 4.318359375, 4.5859375, 4.853515625, 5.12109375, 5.388671875, 5.65625, 5.923828125, 6.19140625, 6.458984375, 6.7265625, 6.994140625, 7.26171875, 7.529296875, 7.796875, 8.064453125, 8.33203125, 8.599609375, 8.8671875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 10.0, 7.0, 13.0, 22.0, 32.0, 62.0, 93.0, 148.0, 247.0, 376.0, 638.0, 1042.0, 1648.0, 2717.0, 4602.0, 7647.0, 12770.0, 22445.0, 39797.0, 73131.0, 135648.0, 219454.0, 221233.0, 136652.0, 73617.0, 39881.0, 22256.0, 13017.0, 7520.0, 4756.0, 2727.0, 1666.0, 1017.0, 610.0, 398.0, 247.0, 135.0, 95.0, 53.0, 34.0, 24.0, 16.0, 11.0, 11.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.46875, -6.2457275390625, -6.022705078125, -5.7996826171875, -5.57666015625, -5.3536376953125, -5.130615234375, -4.9075927734375, -4.6845703125, -4.4615478515625, -4.238525390625, -4.0155029296875, -3.79248046875, -3.5694580078125, -3.346435546875, -3.1234130859375, -2.900390625, -2.6773681640625, -2.454345703125, -2.2313232421875, -2.00830078125, -1.7852783203125, -1.562255859375, -1.3392333984375, -1.1162109375, -0.8931884765625, -0.670166015625, -0.4471435546875, -0.22412109375, -0.0010986328125, 0.221923828125, 0.4449462890625, 0.66796875, 0.8909912109375, 1.114013671875, 1.3370361328125, 1.56005859375, 1.7830810546875, 2.006103515625, 2.2291259765625, 2.4521484375, 2.6751708984375, 2.898193359375, 3.1212158203125, 3.34423828125, 3.5672607421875, 3.790283203125, 4.0133056640625, 4.236328125, 4.4593505859375, 4.682373046875, 4.9053955078125, 5.12841796875, 5.3514404296875, 5.574462890625, 5.7974853515625, 6.0205078125, 6.2435302734375, 6.466552734375, 6.6895751953125, 6.91259765625, 7.1356201171875, 7.358642578125, 7.5816650390625, 7.8046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 13.0, 5.0, 11.0, 8.0, 15.0, 21.0, 18.0, 21.0, 32.0, 25.0, 35.0, 41.0, 41.0, 49.0, 49.0, 84.0, 213.0, 1412.0, 295.0, 179.0, 78.0, 61.0, 43.0, 44.0, 41.0, 35.0, 28.0, 32.0, 20.0, 25.0, 19.0, 9.0, 10.0, 8.0, 8.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.984375, -29.09814453125, -28.2119140625, -27.32568359375, -26.439453125, -25.55322265625, -24.6669921875, -23.78076171875, -22.89453125, -22.00830078125, -21.1220703125, -20.23583984375, -19.349609375, -18.46337890625, -17.5771484375, -16.69091796875, -15.8046875, -14.91845703125, -14.0322265625, -13.14599609375, -12.259765625, -11.37353515625, -10.4873046875, -9.60107421875, -8.71484375, -7.82861328125, -6.9423828125, -6.05615234375, -5.169921875, -4.28369140625, -3.3974609375, -2.51123046875, -1.625, -0.73876953125, 0.1474609375, 1.03369140625, 1.919921875, 2.80615234375, 3.6923828125, 4.57861328125, 5.46484375, 6.35107421875, 7.2373046875, 8.12353515625, 9.009765625, 9.89599609375, 10.7822265625, 11.66845703125, 12.5546875, 13.44091796875, 14.3271484375, 15.21337890625, 16.099609375, 16.98583984375, 17.8720703125, 18.75830078125, 19.64453125, 20.53076171875, 21.4169921875, 22.30322265625, 23.189453125, 24.07568359375, 24.9619140625, 25.84814453125, 26.734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 11.0, 10.0, 15.0, 20.0, 33.0, 39.0, 50.0, 61.0, 94.0, 149.0, 240.0, 415.0, 908.0, 6445.0, 258821.0, 2826067.0, 48506.0, 2233.0, 598.0, 360.0, 176.0, 117.0, 82.0, 73.0, 39.0, 37.0, 24.0, 17.0, 20.0, 16.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.125, -54.5791015625, -53.033203125, -51.4873046875, -49.94140625, -48.3955078125, -46.849609375, -45.3037109375, -43.7578125, -42.2119140625, -40.666015625, -39.1201171875, -37.57421875, -36.0283203125, -34.482421875, -32.9365234375, -31.390625, -29.8447265625, -28.298828125, -26.7529296875, -25.20703125, -23.6611328125, -22.115234375, -20.5693359375, -19.0234375, -17.4775390625, -15.931640625, -14.3857421875, -12.83984375, -11.2939453125, -9.748046875, -8.2021484375, -6.65625, -5.1103515625, -3.564453125, -2.0185546875, -0.47265625, 1.0732421875, 2.619140625, 4.1650390625, 5.7109375, 7.2568359375, 8.802734375, 10.3486328125, 11.89453125, 13.4404296875, 14.986328125, 16.5322265625, 18.078125, 19.6240234375, 21.169921875, 22.7158203125, 24.26171875, 25.8076171875, 27.353515625, 28.8994140625, 30.4453125, 31.9912109375, 33.537109375, 35.0830078125, 36.62890625, 38.1748046875, 39.720703125, 41.2666015625, 42.8125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [4.0, 2.0, 14.0, 20.0, 54.0, 125.0, 167.0, 191.0, 175.0, 140.0, 76.0, 22.0, 19.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.88594627380371, -14.706725120544434, -12.527503967285156, -10.348283767700195, -8.169062614440918, -5.989841461181641, -3.8106212615966797, -1.6314001083374023, 0.547821044921875, 2.7270419597625732, 4.9062628746032715, 7.085483551025391, 9.264704704284668, 11.443925857543945, 13.623146057128906, 15.802367210388184, 17.98158836364746, 20.160808563232422, 22.340030670166016, 24.519250869750977, 26.698471069335938, 28.87769317626953, 31.056913375854492, 33.23613357543945, 35.41535568237305, 37.59457778930664, 39.77379608154297, 41.95301818847656, 44.132240295410156, 46.31146240234375, 48.49068069458008, 50.66990280151367, 52.84912109375, 55.028343200683594, 57.20756149291992, 59.386783599853516, 61.56600570678711, 63.74522399902344, 65.92444610595703, 68.10366821289062, 70.28289031982422, 72.46211242675781, 74.6413345336914, 76.820556640625, 78.99977111816406, 81.17899322509766, 83.35821533203125, 85.53743743896484, 87.71665954589844, 89.89588165283203, 92.07510375976562, 94.25431823730469, 96.43354034423828, 98.61276245117188, 100.79198455810547, 102.97120666503906, 105.15042114257812, 107.32964324951172, 109.50886535644531, 111.68807983398438, 113.86730194091797, 116.04652404785156, 118.22574615478516, 120.40496826171875, 122.58419036865234]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 5.0, 7.0, 10.0, 10.0, 21.0, 14.0, 22.0, 21.0, 21.0, 23.0, 27.0, 21.0, 30.0, 36.0, 29.0, 47.0, 33.0, 47.0, 41.0, 41.0, 36.0, 35.0, 37.0, 34.0, 44.0, 34.0, 27.0, 33.0, 35.0, 16.0, 21.0, 19.0, 20.0, 13.0, 17.0, 13.0, 12.0, 5.0, 6.0, 4.0, 9.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-69.65784454345703, -67.64164733886719, -65.62545013427734, -63.6092529296875, -61.593055725097656, -59.57685852050781, -57.56066131591797, -55.544464111328125, -53.52826690673828, -51.51206970214844, -49.495872497558594, -47.47967529296875, -45.463478088378906, -43.44728088378906, -41.43108367919922, -39.414886474609375, -37.398685455322266, -35.38248825073242, -33.36629104614258, -31.350093841552734, -29.33389663696289, -27.317699432373047, -25.30150032043457, -23.285303115844727, -21.269105911254883, -19.25290870666504, -17.236711502075195, -15.220513343811035, -13.204316139221191, -11.188118934631348, -9.171920776367188, -7.155723571777344, -5.1395263671875, -3.123328924179077, -1.1071314811706543, 0.9090662002563477, 2.9252634048461914, 4.941460609436035, 6.957658767700195, 8.973855972290039, 10.990053176879883, 13.006250381469727, 15.02244758605957, 17.038646697998047, 19.05484390258789, 21.071041107177734, 23.087238311767578, 25.103435516357422, 27.119632720947266, 29.13582992553711, 31.152027130126953, 33.1682243347168, 35.18442153930664, 37.200618743896484, 39.216819763183594, 41.23301696777344, 43.24921417236328, 45.265411376953125, 47.28160858154297, 49.29780578613281, 51.314002990722656, 53.3302001953125, 55.346397399902344, 57.36259460449219, 59.37879180908203]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 10.0, 14.0, 12.0, 23.0, 18.0, 16.0, 27.0, 28.0, 29.0, 45.0, 39.0, 32.0, 39.0, 42.0, 54.0, 49.0, 50.0, 58.0, 38.0, 42.0, 39.0, 36.0, 40.0, 35.0, 33.0, 19.0, 20.0, 16.0, 12.0, 13.0, 14.0, 5.0, 9.0, 7.0, 3.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9632568359375, -7.676513671875, -7.3897705078125, -7.10302734375, -6.8162841796875, -6.529541015625, -6.2427978515625, -5.9560546875, -5.6693115234375, -5.382568359375, -5.0958251953125, -4.80908203125, -4.5223388671875, -4.235595703125, -3.9488525390625, -3.662109375, -3.3753662109375, -3.088623046875, -2.8018798828125, -2.51513671875, -2.2283935546875, -1.941650390625, -1.6549072265625, -1.3681640625, -1.0814208984375, -0.794677734375, -0.5079345703125, -0.22119140625, 0.0655517578125, 0.352294921875, 0.6390380859375, 0.92578125, 1.2125244140625, 1.499267578125, 1.7860107421875, 2.07275390625, 2.3594970703125, 2.646240234375, 2.9329833984375, 3.2197265625, 3.5064697265625, 3.793212890625, 4.0799560546875, 4.36669921875, 4.6534423828125, 4.940185546875, 5.2269287109375, 5.513671875, 5.8004150390625, 6.087158203125, 6.3739013671875, 6.66064453125, 6.9473876953125, 7.234130859375, 7.5208740234375, 7.8076171875, 8.0943603515625, 8.381103515625, 8.6678466796875, 8.95458984375, 9.2413330078125, 9.528076171875, 9.8148193359375, 10.1015625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 8.0, 3.0, 6.0, 8.0, 14.0, 9.0, 21.0, 31.0, 26.0, 29.0, 33.0, 48.0, 80.0, 163.0, 449.0, 1858.0, 9880.0, 65499.0, 473495.0, 2177390.0, 1246585.0, 186335.0, 26334.0, 4317.0, 975.0, 273.0, 121.0, 72.0, 40.0, 34.0, 25.0, 27.0, 22.0, 13.0, 14.0, 14.0, 11.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.265625, -14.7158203125, -14.166015625, -13.6162109375, -13.06640625, -12.5166015625, -11.966796875, -11.4169921875, -10.8671875, -10.3173828125, -9.767578125, -9.2177734375, -8.66796875, -8.1181640625, -7.568359375, -7.0185546875, -6.46875, -5.9189453125, -5.369140625, -4.8193359375, -4.26953125, -3.7197265625, -3.169921875, -2.6201171875, -2.0703125, -1.5205078125, -0.970703125, -0.4208984375, 0.12890625, 0.6787109375, 1.228515625, 1.7783203125, 2.328125, 2.8779296875, 3.427734375, 3.9775390625, 4.52734375, 5.0771484375, 5.626953125, 6.1767578125, 6.7265625, 7.2763671875, 7.826171875, 8.3759765625, 8.92578125, 9.4755859375, 10.025390625, 10.5751953125, 11.125, 11.6748046875, 12.224609375, 12.7744140625, 13.32421875, 13.8740234375, 14.423828125, 14.9736328125, 15.5234375, 16.0732421875, 16.623046875, 17.1728515625, 17.72265625, 18.2724609375, 18.822265625, 19.3720703125, 19.921875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 9.0, 3.0, 9.0, 14.0, 18.0, 34.0, 55.0, 61.0, 93.0, 116.0, 181.0, 256.0, 312.0, 405.0, 511.0, 472.0, 422.0, 303.0, 224.0, 157.0, 132.0, 82.0, 56.0, 46.0, 36.0, 18.0, 17.0, 12.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.4339599609375, -12.953857421875, -12.4737548828125, -11.99365234375, -11.5135498046875, -11.033447265625, -10.5533447265625, -10.0732421875, -9.5931396484375, -9.113037109375, -8.6329345703125, -8.15283203125, -7.6727294921875, -7.192626953125, -6.7125244140625, -6.232421875, -5.7523193359375, -5.272216796875, -4.7921142578125, -4.31201171875, -3.8319091796875, -3.351806640625, -2.8717041015625, -2.3916015625, -1.9114990234375, -1.431396484375, -0.9512939453125, -0.47119140625, 0.0089111328125, 0.489013671875, 0.9691162109375, 1.44921875, 1.9293212890625, 2.409423828125, 2.8895263671875, 3.36962890625, 3.8497314453125, 4.329833984375, 4.8099365234375, 5.2900390625, 5.7701416015625, 6.250244140625, 6.7303466796875, 7.21044921875, 7.6905517578125, 8.170654296875, 8.6507568359375, 9.130859375, 9.6109619140625, 10.091064453125, 10.5711669921875, 11.05126953125, 11.5313720703125, 12.011474609375, 12.4915771484375, 12.9716796875, 13.4517822265625, 13.931884765625, 14.4119873046875, 14.89208984375, 15.3721923828125, 15.852294921875, 16.3323974609375, 16.8125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 16.0, 16.0, 21.0, 38.0, 53.0, 70.0, 113.0, 180.0, 275.0, 455.0, 1170.0, 16978.0, 1184100.0, 2936777.0, 50529.0, 1946.0, 587.0, 322.0, 205.0, 134.0, 93.0, 60.0, 38.0, 29.0, 17.0, 11.0, 8.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-55.96875, -54.3759765625, -52.783203125, -51.1904296875, -49.59765625, -48.0048828125, -46.412109375, -44.8193359375, -43.2265625, -41.6337890625, -40.041015625, -38.4482421875, -36.85546875, -35.2626953125, -33.669921875, -32.0771484375, -30.484375, -28.8916015625, -27.298828125, -25.7060546875, -24.11328125, -22.5205078125, -20.927734375, -19.3349609375, -17.7421875, -16.1494140625, -14.556640625, -12.9638671875, -11.37109375, -9.7783203125, -8.185546875, -6.5927734375, -5.0, -3.4072265625, -1.814453125, -0.2216796875, 1.37109375, 2.9638671875, 4.556640625, 6.1494140625, 7.7421875, 9.3349609375, 10.927734375, 12.5205078125, 14.11328125, 15.7060546875, 17.298828125, 18.8916015625, 20.484375, 22.0771484375, 23.669921875, 25.2626953125, 26.85546875, 28.4482421875, 30.041015625, 31.6337890625, 33.2265625, 34.8193359375, 36.412109375, 38.0048828125, 39.59765625, 41.1904296875, 42.783203125, 44.3759765625, 45.96875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [4.0, 9.0, 6.0, 10.0, 18.0, 26.0, 44.0, 42.0, 58.0, 77.0, 83.0, 96.0, 75.0, 80.0, 84.0, 79.0, 62.0, 50.0, 31.0, 28.0, 25.0, 15.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46253776550293, -17.932510375976562, -16.402482986450195, -14.872454643249512, -13.342426300048828, -11.812398910522461, -10.282371520996094, -8.75234317779541, -7.222315788269043, -5.692287921905518, -4.162260055541992, -2.632232666015625, -1.1022047996520996, 0.4278230667114258, 1.957850456237793, 3.4878787994384766, 5.017906188964844, 6.547934055328369, 8.077961921691895, 9.607989311218262, 11.138017654418945, 12.668045043945312, 14.19807243347168, 15.728100776672363, 17.258129119873047, 18.788156509399414, 20.31818389892578, 21.84821319580078, 23.37824058532715, 24.908267974853516, 26.438295364379883, 27.96832275390625, 29.498348236083984, 31.02837562561035, 32.55840301513672, 34.08843231201172, 35.61845779418945, 37.14848709106445, 38.67851257324219, 40.20854187011719, 41.73857116699219, 43.26860046386719, 44.79862594604492, 46.32865524291992, 47.858680725097656, 49.388710021972656, 50.918739318847656, 52.44876480102539, 53.978790283203125, 55.508819580078125, 57.03884506225586, 58.56887435913086, 60.098899841308594, 61.628929138183594, 63.158958435058594, 64.6889877319336, 66.2190170288086, 67.7490463256836, 69.2790756225586, 70.80909729003906, 72.33912658691406, 73.86915588378906, 75.39918518066406, 76.92921447753906, 78.45923614501953]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 11.0, 8.0, 13.0, 15.0, 16.0, 23.0, 23.0, 34.0, 24.0, 31.0, 43.0, 43.0, 39.0, 32.0, 43.0, 43.0, 43.0, 47.0, 43.0, 38.0, 37.0, 39.0, 44.0, 27.0, 25.0, 37.0, 26.0, 32.0, 22.0, 23.0, 12.0, 9.0, 6.0, 8.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.346771240234375, -47.77830123901367, -46.2098274230957, -44.641357421875, -43.07288360595703, -41.50441360473633, -39.93593978881836, -38.367469787597656, -36.79899597167969, -35.230525970458984, -33.662052154541016, -32.09358215332031, -30.525108337402344, -28.956636428833008, -27.388164520263672, -25.81969451904297, -24.251222610473633, -22.682750701904297, -21.11427879333496, -19.545806884765625, -17.97733497619629, -16.408863067626953, -14.840392112731934, -13.271920204162598, -11.703448295593262, -10.134976387023926, -8.56650447845459, -6.998033046722412, -5.429561138153076, -3.8610892295837402, -2.2926177978515625, -0.7241458892822266, 0.8443260192871094, 2.4127979278564453, 3.981269598007202, 5.549741268157959, 7.118213176727295, 8.686685562133789, 10.255156517028809, 11.823628425598145, 13.39210033416748, 14.960572242736816, 16.529043197631836, 18.097515106201172, 19.665987014770508, 21.234458923339844, 22.80293083190918, 24.371402740478516, 25.93987464904785, 27.508346557617188, 29.076818466186523, 30.64529037475586, 32.21376037597656, 33.78223419189453, 35.350704193115234, 36.9191780090332, 38.487648010253906, 40.05611801147461, 41.62459182739258, 43.19306182861328, 44.76153564453125, 46.33000564575195, 47.89847946166992, 49.466949462890625, 51.035423278808594]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 1.0, 4.0, 5.0, 6.0, 5.0, 7.0, 8.0, 16.0, 12.0, 16.0, 15.0, 23.0, 23.0, 30.0, 16.0, 29.0, 43.0, 33.0, 43.0, 42.0, 45.0, 35.0, 46.0, 50.0, 50.0, 37.0, 46.0, 36.0, 27.0, 38.0, 25.0, 27.0, 18.0, 16.0, 21.0, 13.0, 16.0, 16.0, 15.0, 8.0, 11.0, 5.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.65625, -8.4005126953125, -8.144775390625, -7.8890380859375, -7.63330078125, -7.3775634765625, -7.121826171875, -6.8660888671875, -6.6103515625, -6.3546142578125, -6.098876953125, -5.8431396484375, -5.58740234375, -5.3316650390625, -5.075927734375, -4.8201904296875, -4.564453125, -4.3087158203125, -4.052978515625, -3.7972412109375, -3.54150390625, -3.2857666015625, -3.030029296875, -2.7742919921875, -2.5185546875, -2.2628173828125, -2.007080078125, -1.7513427734375, -1.49560546875, -1.2398681640625, -0.984130859375, -0.7283935546875, -0.47265625, -0.2169189453125, 0.038818359375, 0.2945556640625, 0.55029296875, 0.8060302734375, 1.061767578125, 1.3175048828125, 1.5732421875, 1.8289794921875, 2.084716796875, 2.3404541015625, 2.59619140625, 2.8519287109375, 3.107666015625, 3.3634033203125, 3.619140625, 3.8748779296875, 4.130615234375, 4.3863525390625, 4.64208984375, 4.8978271484375, 5.153564453125, 5.4093017578125, 5.6650390625, 5.9207763671875, 6.176513671875, 6.4322509765625, 6.68798828125, 6.9437255859375, 7.199462890625, 7.4552001953125, 7.7109375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 13.0, 13.0, 17.0, 40.0, 59.0, 80.0, 140.0, 231.0, 391.0, 598.0, 908.0, 1407.0, 2177.0, 3303.0, 5104.0, 7582.0, 11370.0, 17269.0, 25071.0, 36484.0, 51128.0, 69953.0, 89201.0, 106523.0, 117036.0, 114674.0, 101388.0, 81782.0, 62422.0, 45048.0, 31755.0, 21840.0, 14627.0, 9901.0, 6641.0, 4297.0, 2899.0, 1801.0, 1189.0, 794.0, 509.0, 333.0, 216.0, 130.0, 80.0, 59.0, 24.0, 20.0, 12.0, 8.0, 10.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.0703125, -1.0386581420898438, -1.0070037841796875, -0.9753494262695312, -0.943695068359375, -0.9120407104492188, -0.8803863525390625, -0.8487319946289062, -0.81707763671875, -0.7854232788085938, -0.7537689208984375, -0.7221145629882812, -0.690460205078125, -0.6588058471679688, -0.6271514892578125, -0.5954971313476562, -0.5638427734375, -0.5321884155273438, -0.5005340576171875, -0.46887969970703125, -0.437225341796875, -0.40557098388671875, -0.3739166259765625, -0.34226226806640625, -0.31060791015625, -0.27895355224609375, -0.2472991943359375, -0.21564483642578125, -0.183990478515625, -0.15233612060546875, -0.1206817626953125, -0.08902740478515625, -0.057373046875, -0.02571868896484375, 0.0059356689453125, 0.03759002685546875, 0.069244384765625, 0.10089874267578125, 0.1325531005859375, 0.16420745849609375, 0.19586181640625, 0.22751617431640625, 0.2591705322265625, 0.29082489013671875, 0.322479248046875, 0.35413360595703125, 0.3857879638671875, 0.41744232177734375, 0.4490966796875, 0.48075103759765625, 0.5124053955078125, 0.5440597534179688, 0.575714111328125, 0.6073684692382812, 0.6390228271484375, 0.6706771850585938, 0.70233154296875, 0.7339859008789062, 0.7656402587890625, 0.7972946166992188, 0.828948974609375, 0.8606033325195312, 0.8922576904296875, 0.9239120483398438, 0.95556640625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 6.0, 11.0, 13.0, 16.0, 16.0, 14.0, 23.0, 26.0, 31.0, 17.0, 36.0, 34.0, 31.0, 26.0, 31.0, 50.0, 44.0, 55.0, 1058.0, 34.0, 31.0, 40.0, 43.0, 47.0, 26.0, 28.0, 35.0, 31.0, 17.0, 24.0, 21.0, 18.0, 12.0, 12.0, 10.0, 11.0, 5.0, 6.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.23175048828125, -5.0533447265625, -4.87493896484375, -4.696533203125, -4.51812744140625, -4.3397216796875, -4.16131591796875, -3.98291015625, -3.80450439453125, -3.6260986328125, -3.44769287109375, -3.269287109375, -3.09088134765625, -2.9124755859375, -2.73406982421875, -2.5556640625, -2.37725830078125, -2.1988525390625, -2.02044677734375, -1.842041015625, -1.66363525390625, -1.4852294921875, -1.30682373046875, -1.12841796875, -0.95001220703125, -0.7716064453125, -0.59320068359375, -0.414794921875, -0.23638916015625, -0.0579833984375, 0.12042236328125, 0.298828125, 0.47723388671875, 0.6556396484375, 0.83404541015625, 1.012451171875, 1.19085693359375, 1.3692626953125, 1.54766845703125, 1.72607421875, 1.90447998046875, 2.0828857421875, 2.26129150390625, 2.439697265625, 2.61810302734375, 2.7965087890625, 2.97491455078125, 3.1533203125, 3.33172607421875, 3.5101318359375, 3.68853759765625, 3.866943359375, 4.04534912109375, 4.2237548828125, 4.40216064453125, 4.58056640625, 4.75897216796875, 4.9373779296875, 5.11578369140625, 5.294189453125, 5.47259521484375, 5.6510009765625, 5.82940673828125, 6.0078125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 9.0, 19.0, 15.0, 28.0, 67.0, 67.0, 112.0, 195.0, 264.0, 387.0, 538.0, 762.0, 1023.0, 1543.0, 2200.0, 3150.0, 4478.0, 6367.0, 8923.0, 13028.0, 18722.0, 27523.0, 102154.0, 1805813.0, 31063.0, 20750.0, 14475.0, 9973.0, 7065.0, 4868.0, 3452.0, 2469.0, 1733.0, 1207.0, 831.0, 569.0, 381.0, 281.0, 166.0, 140.0, 101.0, 71.0, 46.0, 30.0, 26.0, 32.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.771240234375, -1.71044921875, -1.649658203125, -1.5888671875, -1.528076171875, -1.46728515625, -1.406494140625, -1.345703125, -1.284912109375, -1.22412109375, -1.163330078125, -1.1025390625, -1.041748046875, -0.98095703125, -0.920166015625, -0.859375, -0.798583984375, -0.73779296875, -0.677001953125, -0.6162109375, -0.555419921875, -0.49462890625, -0.433837890625, -0.373046875, -0.312255859375, -0.25146484375, -0.190673828125, -0.1298828125, -0.069091796875, -0.00830078125, 0.052490234375, 0.11328125, 0.174072265625, 0.23486328125, 0.295654296875, 0.3564453125, 0.417236328125, 0.47802734375, 0.538818359375, 0.599609375, 0.660400390625, 0.72119140625, 0.781982421875, 0.8427734375, 0.903564453125, 0.96435546875, 1.025146484375, 1.0859375, 1.146728515625, 1.20751953125, 1.268310546875, 1.3291015625, 1.389892578125, 1.45068359375, 1.511474609375, 1.572265625, 1.633056640625, 1.69384765625, 1.754638671875, 1.8154296875, 1.876220703125, 1.93701171875, 1.997802734375, 2.05859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 14.0, 10.0, 7.0, 13.0, 46.0, 36.0, 39.0, 55.0, 88.0, 83.0, 93.0, 108.0, 78.0, 70.0, 48.0, 41.0, 31.0, 26.0, 20.0, 18.0, 14.0, 7.0, 10.0, 1.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0633544921875, -0.06109428405761719, -0.058834075927734375, -0.05657386779785156, -0.05431365966796875, -0.05205345153808594, -0.049793243408203125, -0.04753303527832031, -0.0452728271484375, -0.04301261901855469, -0.040752410888671875, -0.03849220275878906, -0.03623199462890625, -0.03397178649902344, -0.031711578369140625, -0.029451370239257812, -0.027191162109375, -0.024930953979492188, -0.022670745849609375, -0.020410537719726562, -0.01815032958984375, -0.015890121459960938, -0.013629913330078125, -0.011369705200195312, -0.0091094970703125, -0.0068492889404296875, -0.004589080810546875, -0.0023288726806640625, -6.866455078125e-05, 0.0021915435791015625, 0.004451751708984375, 0.0067119598388671875, 0.00897216796875, 0.011232376098632812, 0.013492584228515625, 0.015752792358398438, 0.01801300048828125, 0.020273208618164062, 0.022533416748046875, 0.024793624877929688, 0.0270538330078125, 0.029314041137695312, 0.031574249267578125, 0.03383445739746094, 0.03609466552734375, 0.03835487365722656, 0.040615081787109375, 0.04287528991699219, 0.045135498046875, 0.04739570617675781, 0.049655914306640625, 0.05191612243652344, 0.05417633056640625, 0.05643653869628906, 0.058696746826171875, 0.06095695495605469, 0.0632171630859375, 0.06547737121582031, 0.06773757934570312, 0.06999778747558594, 0.07225799560546875, 0.07451820373535156, 0.07677841186523438, 0.07903861999511719, 0.081298828125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 10.0, 2.0, 8.0, 9.0, 17.0, 24.0, 16.0, 32.0, 44.0, 83.0, 141.0, 232.0, 777.0, 508339.0, 537393.0, 771.0, 262.0, 130.0, 72.0, 56.0, 44.0, 19.0, 9.0, 13.0, 10.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.923828125, -1.870391845703125, -1.81695556640625, -1.763519287109375, -1.7100830078125, -1.656646728515625, -1.60321044921875, -1.549774169921875, -1.496337890625, -1.442901611328125, -1.38946533203125, -1.336029052734375, -1.2825927734375, -1.229156494140625, -1.17572021484375, -1.122283935546875, -1.06884765625, -1.015411376953125, -0.96197509765625, -0.908538818359375, -0.8551025390625, -0.801666259765625, -0.74822998046875, -0.694793701171875, -0.641357421875, -0.587921142578125, -0.53448486328125, -0.481048583984375, -0.4276123046875, -0.374176025390625, -0.32073974609375, -0.267303466796875, -0.2138671875, -0.160430908203125, -0.10699462890625, -0.053558349609375, -0.0001220703125, 0.053314208984375, 0.10675048828125, 0.160186767578125, 0.213623046875, 0.267059326171875, 0.32049560546875, 0.373931884765625, 0.4273681640625, 0.480804443359375, 0.53424072265625, 0.587677001953125, 0.64111328125, 0.694549560546875, 0.74798583984375, 0.801422119140625, 0.8548583984375, 0.908294677734375, 0.96173095703125, 1.015167236328125, 1.068603515625, 1.122039794921875, 1.17547607421875, 1.228912353515625, 1.2823486328125, 1.335784912109375, 1.38922119140625, 1.442657470703125, 1.49609375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 29.0, 818.0, 157.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4877595901489258, -1.4528619050979614, -1.4179643392562866, -1.3830666542053223, -1.3481690883636475, -1.313271403312683, -1.2783737182617188, -1.243476152420044, -1.2085784673690796, -1.1736807823181152, -1.1387832164764404, -1.103885531425476, -1.0689879655838013, -1.034090280532837, -0.9991926550865173, -0.9642950296401978, -0.9293974041938782, -0.8944997787475586, -0.859602153301239, -0.8247045278549194, -0.7898068428039551, -0.7549092173576355, -0.7200115919113159, -0.6851139664649963, -0.6502163410186768, -0.6153187155723572, -0.5804210901260376, -0.5455234050750732, -0.5106257796287537, -0.4757281541824341, -0.4408305287361145, -0.4059329032897949, -0.3710351586341858, -0.3361375331878662, -0.30123987793922424, -0.26634225249290466, -0.2314446121454239, -0.19654697179794312, -0.16164934635162354, -0.12675170600414276, -0.09185406565666199, -0.05695642903447151, -0.022058792412281036, 0.01283884048461914, 0.047736480832099915, 0.08263412117958069, 0.11753174662590027, 0.15242938697338104, 0.18732702732086182, 0.2222246676683426, 0.25712230801582336, 0.29201993346214294, 0.3269175887107849, 0.3618152141571045, 0.3967128396034241, 0.43161046504974365, 0.4665081202983856, 0.5014057755470276, 0.5363034009933472, 0.5712010264396667, 0.6060986518859863, 0.6409963369369507, 0.6758939027786255, 0.7107915878295898, 0.7456892132759094]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 0.0, 10.0, 10.0, 9.0, 18.0, 15.0, 17.0, 15.0, 19.0, 29.0, 27.0, 20.0, 35.0, 33.0, 31.0, 33.0, 41.0, 38.0, 46.0, 48.0, 41.0, 40.0, 41.0, 42.0, 41.0, 35.0, 36.0, 27.0, 29.0, 30.0, 23.0, 23.0, 20.0, 15.0, 7.0, 9.0, 12.0, 11.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-0.13878577947616577, -0.13512594997882843, -0.1314661204814911, -0.12780629098415375, -0.1241464614868164, -0.12048663198947906, -0.11682680249214172, -0.11316697299480438, -0.10950714349746704, -0.1058473140001297, -0.10218748450279236, -0.09852765500545502, -0.09486782550811768, -0.09120799601078033, -0.087548166513443, -0.08388833701610565, -0.08022850751876831, -0.07656867802143097, -0.07290884852409363, -0.06924901902675629, -0.06558918952941895, -0.061929360032081604, -0.05826953053474426, -0.05460970103740692, -0.05094987154006958, -0.04729004204273224, -0.0436302125453949, -0.039970383048057556, -0.036310553550720215, -0.032650724053382874, -0.028990894556045532, -0.02533106505870819, -0.02167123556137085, -0.01801140606403351, -0.014351576566696167, -0.010691747069358826, -0.007031917572021484, -0.003372088074684143, 0.00028774142265319824, 0.0039475709199905396, 0.007607400417327881, 0.011267229914665222, 0.014927059412002563, 0.018586888909339905, 0.022246718406677246, 0.025906547904014587, 0.02956637740135193, 0.03322620689868927, 0.03688603639602661, 0.04054586589336395, 0.044205695390701294, 0.047865524888038635, 0.05152535438537598, 0.05518518388271332, 0.05884501338005066, 0.062504842877388, 0.06616467237472534, 0.06982450187206268, 0.07348433136940002, 0.07714416086673737, 0.08080399036407471, 0.08446381986141205, 0.08812364935874939, 0.09178347885608673, 0.09544330835342407]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 4.0, 6.0, 10.0, 12.0, 18.0, 19.0, 16.0, 12.0, 18.0, 16.0, 22.0, 33.0, 30.0, 39.0, 26.0, 31.0, 44.0, 37.0, 44.0, 49.0, 36.0, 39.0, 29.0, 46.0, 37.0, 30.0, 31.0, 30.0, 20.0, 29.0, 29.0, 21.0, 22.0, 9.0, 17.0, 14.0, 12.0, 11.0, 7.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.015625, -7.77239990234375, -7.5291748046875, -7.28594970703125, -7.042724609375, -6.79949951171875, -6.5562744140625, -6.31304931640625, -6.06982421875, -5.82659912109375, -5.5833740234375, -5.34014892578125, -5.096923828125, -4.85369873046875, -4.6104736328125, -4.36724853515625, -4.1240234375, -3.88079833984375, -3.6375732421875, -3.39434814453125, -3.151123046875, -2.90789794921875, -2.6646728515625, -2.42144775390625, -2.17822265625, -1.93499755859375, -1.6917724609375, -1.44854736328125, -1.205322265625, -0.96209716796875, -0.7188720703125, -0.47564697265625, -0.232421875, 0.01080322265625, 0.2540283203125, 0.49725341796875, 0.740478515625, 0.98370361328125, 1.2269287109375, 1.47015380859375, 1.71337890625, 1.95660400390625, 2.1998291015625, 2.44305419921875, 2.686279296875, 2.92950439453125, 3.1727294921875, 3.41595458984375, 3.6591796875, 3.90240478515625, 4.1456298828125, 4.38885498046875, 4.632080078125, 4.87530517578125, 5.1185302734375, 5.36175537109375, 5.60498046875, 5.84820556640625, 6.0914306640625, 6.33465576171875, 6.577880859375, 6.82110595703125, 7.0643310546875, 7.30755615234375, 7.55078125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 10.0, 5.0, 6.0, 17.0, 17.0, 19.0, 33.0, 29.0, 48.0, 48.0, 69.0, 113.0, 192.0, 319.0, 596.0, 1243.0, 2722.0, 5368.0, 11356.0, 24372.0, 60453.0, 166070.0, 378603.0, 245679.0, 87383.0, 34109.0, 15227.0, 7345.0, 3520.0, 1645.0, 804.0, 393.0, 216.0, 148.0, 74.0, 79.0, 44.0, 34.0, 31.0, 28.0, 12.0, 14.0, 13.0, 13.0, 9.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-10.34375, -10.02734375, -9.7109375, -9.39453125, -9.078125, -8.76171875, -8.4453125, -8.12890625, -7.8125, -7.49609375, -7.1796875, -6.86328125, -6.546875, -6.23046875, -5.9140625, -5.59765625, -5.28125, -4.96484375, -4.6484375, -4.33203125, -4.015625, -3.69921875, -3.3828125, -3.06640625, -2.75, -2.43359375, -2.1171875, -1.80078125, -1.484375, -1.16796875, -0.8515625, -0.53515625, -0.21875, 0.09765625, 0.4140625, 0.73046875, 1.046875, 1.36328125, 1.6796875, 1.99609375, 2.3125, 2.62890625, 2.9453125, 3.26171875, 3.578125, 3.89453125, 4.2109375, 4.52734375, 4.84375, 5.16015625, 5.4765625, 5.79296875, 6.109375, 6.42578125, 6.7421875, 7.05859375, 7.375, 7.69140625, 8.0078125, 8.32421875, 8.640625, 8.95703125, 9.2734375, 9.58984375, 9.90625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 10.0, 6.0, 7.0, 14.0, 7.0, 12.0, 10.0, 20.0, 21.0, 24.0, 29.0, 35.0, 31.0, 34.0, 47.0, 48.0, 81.0, 144.0, 304.0, 1376.0, 219.0, 117.0, 68.0, 45.0, 40.0, 41.0, 29.0, 29.0, 18.0, 25.0, 26.0, 18.0, 21.0, 15.0, 12.0, 8.0, 8.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.640625, -21.892578125, -21.14453125, -20.396484375, -19.6484375, -18.900390625, -18.15234375, -17.404296875, -16.65625, -15.908203125, -15.16015625, -14.412109375, -13.6640625, -12.916015625, -12.16796875, -11.419921875, -10.671875, -9.923828125, -9.17578125, -8.427734375, -7.6796875, -6.931640625, -6.18359375, -5.435546875, -4.6875, -3.939453125, -3.19140625, -2.443359375, -1.6953125, -0.947265625, -0.19921875, 0.548828125, 1.296875, 2.044921875, 2.79296875, 3.541015625, 4.2890625, 5.037109375, 5.78515625, 6.533203125, 7.28125, 8.029296875, 8.77734375, 9.525390625, 10.2734375, 11.021484375, 11.76953125, 12.517578125, 13.265625, 14.013671875, 14.76171875, 15.509765625, 16.2578125, 17.005859375, 17.75390625, 18.501953125, 19.25, 19.998046875, 20.74609375, 21.494140625, 22.2421875, 22.990234375, 23.73828125, 24.486328125, 25.234375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 8.0, 5.0, 9.0, 10.0, 9.0, 11.0, 19.0, 20.0, 26.0, 27.0, 31.0, 47.0, 68.0, 80.0, 124.0, 147.0, 245.0, 419.0, 875.0, 3901.0, 45694.0, 2396969.0, 674586.0, 18522.0, 2098.0, 648.0, 317.0, 212.0, 137.0, 95.0, 64.0, 62.0, 44.0, 33.0, 27.0, 15.0, 22.0, 19.0, 6.0, 9.0, 8.0, 9.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-39.25, -38.0546875, -36.859375, -35.6640625, -34.46875, -33.2734375, -32.078125, -30.8828125, -29.6875, -28.4921875, -27.296875, -26.1015625, -24.90625, -23.7109375, -22.515625, -21.3203125, -20.125, -18.9296875, -17.734375, -16.5390625, -15.34375, -14.1484375, -12.953125, -11.7578125, -10.5625, -9.3671875, -8.171875, -6.9765625, -5.78125, -4.5859375, -3.390625, -2.1953125, -1.0, 0.1953125, 1.390625, 2.5859375, 3.78125, 4.9765625, 6.171875, 7.3671875, 8.5625, 9.7578125, 10.953125, 12.1484375, 13.34375, 14.5390625, 15.734375, 16.9296875, 18.125, 19.3203125, 20.515625, 21.7109375, 22.90625, 24.1015625, 25.296875, 26.4921875, 27.6875, 28.8828125, 30.078125, 31.2734375, 32.46875, 33.6640625, 34.859375, 36.0546875, 37.25]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 42.0, 265.0, 487.0, 203.0, 15.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.82203674316406, -97.54124450683594, -92.26045227050781, -86.97966003417969, -81.69886779785156, -76.41807556152344, -71.13727569580078, -65.85648345947266, -60.57569122314453, -55.294898986816406, -50.01410675048828, -44.73331069946289, -39.452518463134766, -34.17172622680664, -28.890932083129883, -23.610137939453125, -18.329345703125, -13.048552513122559, -7.767759323120117, -2.486966133117676, 2.7938270568847656, 8.07461929321289, 13.355413436889648, 18.636207580566406, 23.91699981689453, 29.197792053222656, 34.47858428955078, 39.75938034057617, 45.0401725769043, 50.32096481323242, 55.60176086425781, 60.88255310058594, 66.163330078125, 71.44412231445312, 76.72491455078125, 82.00570678710938, 87.2864990234375, 92.56729125976562, 97.84809112548828, 103.1288833618164, 108.40967559814453, 113.69046783447266, 118.97126007080078, 124.2520523071289, 129.53285217285156, 134.8136444091797, 140.0944366455078, 145.37522888183594, 150.65602111816406, 155.9368133544922, 161.2176055908203, 166.49839782714844, 171.77919006347656, 177.0599822998047, 182.3407745361328, 187.62158203125, 192.90237426757812, 198.18316650390625, 203.46395874023438, 208.7447509765625, 214.02554321289062, 219.30633544921875, 224.58712768554688, 229.867919921875, 235.14871215820312]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 9.0, 13.0, 5.0, 17.0, 12.0, 12.0, 10.0, 22.0, 23.0, 18.0, 33.0, 37.0, 27.0, 36.0, 37.0, 33.0, 42.0, 64.0, 44.0, 47.0, 51.0, 31.0, 37.0, 48.0, 40.0, 36.0, 32.0, 28.0, 26.0, 23.0, 27.0, 12.0, 14.0, 11.0, 12.0, 10.0, 2.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.95936584472656, -69.91117095947266, -67.86297607421875, -65.81478118896484, -63.76658630371094, -61.71839141845703, -59.67019271850586, -57.62199783325195, -55.57380294799805, -53.52560806274414, -51.477413177490234, -49.42921829223633, -47.381019592285156, -45.33282470703125, -43.284629821777344, -41.23643493652344, -39.18824005126953, -37.140045166015625, -35.09185028076172, -33.04365539550781, -30.995458602905273, -28.947263717651367, -26.899066925048828, -24.850872039794922, -22.802677154541016, -20.75448226928711, -18.706287384033203, -16.658090591430664, -14.609895706176758, -12.561700820922852, -10.513504981994629, -8.465309143066406, -6.417110443115234, -4.36891508102417, -2.3207197189331055, -0.272524356842041, 1.7756710052490234, 3.8238658905029297, 5.872061729431152, 7.920257568359375, 9.968452453613281, 12.016647338867188, 14.06484317779541, 16.113039016723633, 18.16123390197754, 20.209428787231445, 22.257625579833984, 24.30582046508789, 26.354015350341797, 28.402210235595703, 30.45040512084961, 32.498600006103516, 34.54679870605469, 36.594993591308594, 38.6431884765625, 40.691383361816406, 42.73957824707031, 44.78777313232422, 46.835968017578125, 48.88416290283203, 50.93235778808594, 52.980552673339844, 55.028751373291016, 57.07694625854492, 59.12514114379883]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 3.0, 7.0, 5.0, 10.0, 12.0, 14.0, 20.0, 28.0, 23.0, 18.0, 37.0, 25.0, 22.0, 35.0, 38.0, 38.0, 41.0, 40.0, 53.0, 56.0, 36.0, 45.0, 41.0, 41.0, 51.0, 35.0, 32.0, 31.0, 23.0, 23.0, 21.0, 22.0, 18.0, 14.0, 12.0, 3.0, 7.0, 8.0, 9.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.4505615234375, -9.158935546875, -8.8673095703125, -8.57568359375, -8.2840576171875, -7.992431640625, -7.7008056640625, -7.4091796875, -7.1175537109375, -6.825927734375, -6.5343017578125, -6.24267578125, -5.9510498046875, -5.659423828125, -5.3677978515625, -5.076171875, -4.7845458984375, -4.492919921875, -4.2012939453125, -3.90966796875, -3.6180419921875, -3.326416015625, -3.0347900390625, -2.7431640625, -2.4515380859375, -2.159912109375, -1.8682861328125, -1.57666015625, -1.2850341796875, -0.993408203125, -0.7017822265625, -0.41015625, -0.1185302734375, 0.173095703125, 0.4647216796875, 0.75634765625, 1.0479736328125, 1.339599609375, 1.6312255859375, 1.9228515625, 2.2144775390625, 2.506103515625, 2.7977294921875, 3.08935546875, 3.3809814453125, 3.672607421875, 3.9642333984375, 4.255859375, 4.5474853515625, 4.839111328125, 5.1307373046875, 5.42236328125, 5.7139892578125, 6.005615234375, 6.2972412109375, 6.5888671875, 6.8804931640625, 7.172119140625, 7.4637451171875, 7.75537109375, 8.0469970703125, 8.338623046875, 8.6302490234375, 8.921875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 8.0, 11.0, 11.0, 25.0, 27.0, 38.0, 57.0, 91.0, 162.0, 437.0, 1459.0, 6166.0, 33681.0, 209503.0, 1179643.0, 2066714.0, 581793.0, 94116.0, 15663.0, 3172.0, 830.0, 277.0, 140.0, 73.0, 44.0, 33.0, 28.0, 16.0, 14.0, 3.0, 12.0, 10.0, 0.0, 2.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.015625, -15.503662109375, -14.99169921875, -14.479736328125, -13.9677734375, -13.455810546875, -12.94384765625, -12.431884765625, -11.919921875, -11.407958984375, -10.89599609375, -10.384033203125, -9.8720703125, -9.360107421875, -8.84814453125, -8.336181640625, -7.82421875, -7.312255859375, -6.80029296875, -6.288330078125, -5.7763671875, -5.264404296875, -4.75244140625, -4.240478515625, -3.728515625, -3.216552734375, -2.70458984375, -2.192626953125, -1.6806640625, -1.168701171875, -0.65673828125, -0.144775390625, 0.3671875, 0.879150390625, 1.39111328125, 1.903076171875, 2.4150390625, 2.927001953125, 3.43896484375, 3.950927734375, 4.462890625, 4.974853515625, 5.48681640625, 5.998779296875, 6.5107421875, 7.022705078125, 7.53466796875, 8.046630859375, 8.55859375, 9.070556640625, 9.58251953125, 10.094482421875, 10.6064453125, 11.118408203125, 11.63037109375, 12.142333984375, 12.654296875, 13.166259765625, 13.67822265625, 14.190185546875, 14.7021484375, 15.214111328125, 15.72607421875, 16.238037109375, 16.75]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 14.0, 13.0, 20.0, 20.0, 33.0, 52.0, 53.0, 67.0, 92.0, 139.0, 176.0, 240.0, 287.0, 338.0, 348.0, 382.0, 357.0, 290.0, 268.0, 199.0, 163.0, 123.0, 102.0, 70.0, 64.0, 36.0, 32.0, 27.0, 16.0, 10.0, 4.0, 7.0, 5.0, 6.0, 7.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.424072265625, -12.05126953125, -11.678466796875, -11.3056640625, -10.932861328125, -10.56005859375, -10.187255859375, -9.814453125, -9.441650390625, -9.06884765625, -8.696044921875, -8.3232421875, -7.950439453125, -7.57763671875, -7.204833984375, -6.83203125, -6.459228515625, -6.08642578125, -5.713623046875, -5.3408203125, -4.968017578125, -4.59521484375, -4.222412109375, -3.849609375, -3.476806640625, -3.10400390625, -2.731201171875, -2.3583984375, -1.985595703125, -1.61279296875, -1.239990234375, -0.8671875, -0.494384765625, -0.12158203125, 0.251220703125, 0.6240234375, 0.996826171875, 1.36962890625, 1.742431640625, 2.115234375, 2.488037109375, 2.86083984375, 3.233642578125, 3.6064453125, 3.979248046875, 4.35205078125, 4.724853515625, 5.09765625, 5.470458984375, 5.84326171875, 6.216064453125, 6.5888671875, 6.961669921875, 7.33447265625, 7.707275390625, 8.080078125, 8.452880859375, 8.82568359375, 9.198486328125, 9.5712890625, 9.944091796875, 10.31689453125, 10.689697265625, 11.0625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 5.0, 6.0, 7.0, 15.0, 15.0, 19.0, 31.0, 53.0, 63.0, 95.0, 119.0, 170.0, 259.0, 394.0, 741.0, 2161.0, 15021.0, 193731.0, 2411298.0, 1461599.0, 96604.0, 8533.0, 1545.0, 643.0, 382.0, 222.0, 156.0, 98.0, 90.0, 45.0, 39.0, 38.0, 25.0, 16.0, 11.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.625, -24.70556640625, -23.7861328125, -22.86669921875, -21.947265625, -21.02783203125, -20.1083984375, -19.18896484375, -18.26953125, -17.35009765625, -16.4306640625, -15.51123046875, -14.591796875, -13.67236328125, -12.7529296875, -11.83349609375, -10.9140625, -9.99462890625, -9.0751953125, -8.15576171875, -7.236328125, -6.31689453125, -5.3974609375, -4.47802734375, -3.55859375, -2.63916015625, -1.7197265625, -0.80029296875, 0.119140625, 1.03857421875, 1.9580078125, 2.87744140625, 3.796875, 4.71630859375, 5.6357421875, 6.55517578125, 7.474609375, 8.39404296875, 9.3134765625, 10.23291015625, 11.15234375, 12.07177734375, 12.9912109375, 13.91064453125, 14.830078125, 15.74951171875, 16.6689453125, 17.58837890625, 18.5078125, 19.42724609375, 20.3466796875, 21.26611328125, 22.185546875, 23.10498046875, 24.0244140625, 24.94384765625, 25.86328125, 26.78271484375, 27.7021484375, 28.62158203125, 29.541015625, 30.46044921875, 31.3798828125, 32.29931640625, 33.21875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 39.0, 151.0, 370.0, 280.0, 137.0, 25.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-287.2916259765625, -281.28759765625, -275.2835998535156, -269.2795715332031, -263.2755432128906, -257.2715148925781, -251.26751708984375, -245.26348876953125, -239.25946044921875, -233.2554473876953, -227.2514190673828, -221.24740600585938, -215.24337768554688, -209.23936462402344, -203.2353515625, -197.2313232421875, -191.22731018066406, -185.22329711914062, -179.21926879882812, -173.2152557373047, -167.2112274169922, -161.20721435546875, -155.20318603515625, -149.1991729736328, -143.19515991210938, -137.19114685058594, -131.18711853027344, -125.18310546875, -119.1790771484375, -113.17506408691406, -107.1710433959961, -101.16702270507812, -95.16297912597656, -89.1589584350586, -83.15493774414062, -77.15092468261719, -71.14689636230469, -65.14288330078125, -59.13886260986328, -53.13484191894531, -47.130821228027344, -41.126800537109375, -35.122779846191406, -29.118762969970703, -23.114742279052734, -17.110721588134766, -11.106704711914062, -5.102684020996094, 0.901336669921875, 6.905356407165527, 12.90937614440918, 18.913394927978516, 24.917415618896484, 30.921436309814453, 36.925453186035156, 42.929473876953125, 48.933494567871094, 54.93751525878906, 60.94153594970703, 66.945556640625, 72.94956970214844, 78.95359802246094, 84.95761108398438, 90.96163177490234, 96.96565246582031]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 6.0, 6.0, 5.0, 8.0, 4.0, 10.0, 15.0, 16.0, 8.0, 15.0, 22.0, 19.0, 19.0, 25.0, 26.0, 37.0, 32.0, 20.0, 32.0, 29.0, 45.0, 42.0, 45.0, 45.0, 28.0, 38.0, 34.0, 43.0, 32.0, 35.0, 31.0, 32.0, 26.0, 21.0, 28.0, 21.0, 15.0, 16.0, 9.0, 10.0, 14.0, 6.0, 8.0, 7.0, 7.0, 9.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-36.17174530029297, -35.01424789428711, -33.856746673583984, -32.699249267578125, -31.541751861572266, -30.384252548217773, -29.22675323486328, -28.069255828857422, -26.911758422851562, -25.75425910949707, -24.59676170349121, -23.43926239013672, -22.28176498413086, -21.124265670776367, -19.966766357421875, -18.809268951416016, -17.651769638061523, -16.49427032470703, -15.336772918701172, -14.17927360534668, -13.02177619934082, -11.864276885986328, -10.706778526306152, -9.549280166625977, -8.3917818069458, -7.234283447265625, -6.076785087585449, -4.919286251068115, -3.7617878913879395, -2.6042895317077637, -1.4467906951904297, -0.2892923355102539, 0.8682060241699219, 2.0257043838500977, 3.1832029819488525, 4.340701580047607, 5.498199939727783, 6.655698299407959, 7.813197135925293, 8.970695495605469, 10.128193855285645, 11.28569221496582, 12.443190574645996, 13.600688934326172, 14.758188247680664, 15.915685653686523, 17.073184967041016, 18.230682373046875, 19.388181686401367, 20.54568099975586, 21.70317840576172, 22.86067771911621, 24.01817512512207, 25.175674438476562, 26.333171844482422, 27.490671157836914, 28.648170471191406, 29.8056697845459, 30.963167190551758, 32.12066650390625, 33.27816390991211, 34.43566131591797, 35.593162536621094, 36.75065994262695, 37.90815734863281]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 9.0, 10.0, 8.0, 5.0, 14.0, 11.0, 18.0, 12.0, 26.0, 17.0, 29.0, 40.0, 30.0, 37.0, 34.0, 39.0, 35.0, 46.0, 53.0, 46.0, 34.0, 51.0, 58.0, 31.0, 30.0, 35.0, 38.0, 34.0, 31.0, 21.0, 22.0, 16.0, 20.0, 11.0, 12.0, 5.0, 6.0, 8.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.7734375, -9.4884033203125, -9.203369140625, -8.9183349609375, -8.63330078125, -8.3482666015625, -8.063232421875, -7.7781982421875, -7.4931640625, -7.2081298828125, -6.923095703125, -6.6380615234375, -6.35302734375, -6.0679931640625, -5.782958984375, -5.4979248046875, -5.212890625, -4.9278564453125, -4.642822265625, -4.3577880859375, -4.07275390625, -3.7877197265625, -3.502685546875, -3.2176513671875, -2.9326171875, -2.6475830078125, -2.362548828125, -2.0775146484375, -1.79248046875, -1.5074462890625, -1.222412109375, -0.9373779296875, -0.65234375, -0.3673095703125, -0.082275390625, 0.2027587890625, 0.48779296875, 0.7728271484375, 1.057861328125, 1.3428955078125, 1.6279296875, 1.9129638671875, 2.197998046875, 2.4830322265625, 2.76806640625, 3.0531005859375, 3.338134765625, 3.6231689453125, 3.908203125, 4.1932373046875, 4.478271484375, 4.7633056640625, 5.04833984375, 5.3333740234375, 5.618408203125, 5.9034423828125, 6.1884765625, 6.4735107421875, 6.758544921875, 7.0435791015625, 7.32861328125, 7.6136474609375, 7.898681640625, 8.1837158203125, 8.46875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 10.0, 21.0, 40.0, 50.0, 107.0, 143.0, 230.0, 335.0, 587.0, 855.0, 1395.0, 2228.0, 3660.0, 5684.0, 9174.0, 14177.0, 21641.0, 32456.0, 47801.0, 67248.0, 89381.0, 111348.0, 126006.0, 124641.0, 108089.0, 85842.0, 63566.0, 44992.0, 30649.0, 20380.0, 13316.0, 8338.0, 5235.0, 3437.0, 2114.0, 1323.0, 755.0, 477.0, 303.0, 186.0, 123.0, 83.0, 56.0, 29.0, 18.0, 9.0, 10.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.11328125, -1.0804595947265625, -1.047637939453125, -1.0148162841796875, -0.98199462890625, -0.9491729736328125, -0.916351318359375, -0.8835296630859375, -0.8507080078125, -0.8178863525390625, -0.785064697265625, -0.7522430419921875, -0.71942138671875, -0.6865997314453125, -0.653778076171875, -0.6209564208984375, -0.588134765625, -0.5553131103515625, -0.522491455078125, -0.4896697998046875, -0.45684814453125, -0.4240264892578125, -0.391204833984375, -0.3583831787109375, -0.3255615234375, -0.2927398681640625, -0.259918212890625, -0.2270965576171875, -0.19427490234375, -0.1614532470703125, -0.128631591796875, -0.0958099365234375, -0.06298828125, -0.0301666259765625, 0.002655029296875, 0.0354766845703125, 0.06829833984375, 0.1011199951171875, 0.133941650390625, 0.1667633056640625, 0.1995849609375, 0.2324066162109375, 0.265228271484375, 0.2980499267578125, 0.33087158203125, 0.3636932373046875, 0.396514892578125, 0.4293365478515625, 0.462158203125, 0.4949798583984375, 0.527801513671875, 0.5606231689453125, 0.59344482421875, 0.6262664794921875, 0.659088134765625, 0.6919097900390625, 0.7247314453125, 0.7575531005859375, 0.790374755859375, 0.8231964111328125, 0.85601806640625, 0.8888397216796875, 0.921661376953125, 0.9544830322265625, 0.9873046875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 3.0, 7.0, 6.0, 5.0, 4.0, 16.0, 12.0, 19.0, 13.0, 14.0, 19.0, 18.0, 27.0, 31.0, 28.0, 31.0, 35.0, 36.0, 29.0, 44.0, 33.0, 40.0, 1055.0, 27.0, 34.0, 34.0, 35.0, 32.0, 31.0, 40.0, 24.0, 28.0, 34.0, 25.0, 16.0, 19.0, 15.0, 11.0, 15.0, 19.0, 10.0, 7.0, 11.0, 3.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0], "bins": [-5.87890625, -5.709716796875, -5.54052734375, -5.371337890625, -5.2021484375, -5.032958984375, -4.86376953125, -4.694580078125, -4.525390625, -4.356201171875, -4.18701171875, -4.017822265625, -3.8486328125, -3.679443359375, -3.51025390625, -3.341064453125, -3.171875, -3.002685546875, -2.83349609375, -2.664306640625, -2.4951171875, -2.325927734375, -2.15673828125, -1.987548828125, -1.818359375, -1.649169921875, -1.47998046875, -1.310791015625, -1.1416015625, -0.972412109375, -0.80322265625, -0.634033203125, -0.46484375, -0.295654296875, -0.12646484375, 0.042724609375, 0.2119140625, 0.381103515625, 0.55029296875, 0.719482421875, 0.888671875, 1.057861328125, 1.22705078125, 1.396240234375, 1.5654296875, 1.734619140625, 1.90380859375, 2.072998046875, 2.2421875, 2.411376953125, 2.58056640625, 2.749755859375, 2.9189453125, 3.088134765625, 3.25732421875, 3.426513671875, 3.595703125, 3.764892578125, 3.93408203125, 4.103271484375, 4.2724609375, 4.441650390625, 4.61083984375, 4.780029296875, 4.94921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 12.0, 23.0, 34.0, 40.0, 55.0, 76.0, 115.0, 200.0, 268.0, 396.0, 596.0, 812.0, 1127.0, 1660.0, 2325.0, 3308.0, 4671.0, 6721.0, 9681.0, 13069.0, 18959.0, 27902.0, 121880.0, 1782740.0, 30891.0, 20652.0, 14348.0, 10218.0, 7344.0, 5128.0, 3524.0, 2538.0, 1785.0, 1194.0, 839.0, 583.0, 419.0, 292.0, 201.0, 157.0, 102.0, 73.0, 66.0, 37.0, 26.0, 11.0, 18.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8359375, -1.778778076171875, -1.72161865234375, -1.664459228515625, -1.6072998046875, -1.550140380859375, -1.49298095703125, -1.435821533203125, -1.378662109375, -1.321502685546875, -1.26434326171875, -1.207183837890625, -1.1500244140625, -1.092864990234375, -1.03570556640625, -0.978546142578125, -0.92138671875, -0.864227294921875, -0.80706787109375, -0.749908447265625, -0.6927490234375, -0.635589599609375, -0.57843017578125, -0.521270751953125, -0.464111328125, -0.406951904296875, -0.34979248046875, -0.292633056640625, -0.2354736328125, -0.178314208984375, -0.12115478515625, -0.063995361328125, -0.0068359375, 0.050323486328125, 0.10748291015625, 0.164642333984375, 0.2218017578125, 0.278961181640625, 0.33612060546875, 0.393280029296875, 0.450439453125, 0.507598876953125, 0.56475830078125, 0.621917724609375, 0.6790771484375, 0.736236572265625, 0.79339599609375, 0.850555419921875, 0.90771484375, 0.964874267578125, 1.02203369140625, 1.079193115234375, 1.1363525390625, 1.193511962890625, 1.25067138671875, 1.307830810546875, 1.364990234375, 1.422149658203125, 1.47930908203125, 1.536468505859375, 1.5936279296875, 1.650787353515625, 1.70794677734375, 1.765106201171875, 1.822265625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 9.0, 12.0, 14.0, 18.0, 20.0, 24.0, 25.0, 21.0, 41.0, 46.0, 53.0, 49.0, 68.0, 59.0, 62.0, 60.0, 63.0, 58.0, 46.0, 35.0, 39.0, 26.0, 23.0, 23.0, 17.0, 10.0, 11.0, 4.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04791259765625, -0.04625654220581055, -0.044600486755371094, -0.04294443130493164, -0.04128837585449219, -0.039632320404052734, -0.03797626495361328, -0.03632020950317383, -0.034664154052734375, -0.03300809860229492, -0.03135204315185547, -0.029695987701416016, -0.028039932250976562, -0.02638387680053711, -0.024727821350097656, -0.023071765899658203, -0.02141571044921875, -0.019759654998779297, -0.018103599548339844, -0.01644754409790039, -0.014791488647460938, -0.013135433197021484, -0.011479377746582031, -0.009823322296142578, -0.008167266845703125, -0.006511211395263672, -0.004855155944824219, -0.0031991004943847656, -0.0015430450439453125, 0.00011301040649414062, 0.0017690658569335938, 0.003425121307373047, 0.0050811767578125, 0.006737232208251953, 0.008393287658691406, 0.01004934310913086, 0.011705398559570312, 0.013361454010009766, 0.015017509460449219, 0.016673564910888672, 0.018329620361328125, 0.019985675811767578, 0.02164173126220703, 0.023297786712646484, 0.024953842163085938, 0.02660989761352539, 0.028265953063964844, 0.029922008514404297, 0.03157806396484375, 0.0332341194152832, 0.034890174865722656, 0.03654623031616211, 0.03820228576660156, 0.039858341217041016, 0.04151439666748047, 0.04317045211791992, 0.044826507568359375, 0.04648256301879883, 0.04813861846923828, 0.049794673919677734, 0.05145072937011719, 0.05310678482055664, 0.054762840270996094, 0.05641889572143555, 0.058074951171875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 10.0, 11.0, 10.0, 14.0, 16.0, 20.0, 27.0, 32.0, 39.0, 59.0, 67.0, 126.0, 186.0, 296.0, 814.0, 51667.0, 992600.0, 1461.0, 399.0, 187.0, 143.0, 85.0, 46.0, 41.0, 37.0, 29.0, 27.0, 23.0, 13.0, 12.0, 4.0, 9.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3173828125, -1.2809906005859375, -1.244598388671875, -1.2082061767578125, -1.17181396484375, -1.1354217529296875, -1.099029541015625, -1.0626373291015625, -1.0262451171875, -0.9898529052734375, -0.953460693359375, -0.9170684814453125, -0.88067626953125, -0.8442840576171875, -0.807891845703125, -0.7714996337890625, -0.735107421875, -0.6987152099609375, -0.662322998046875, -0.6259307861328125, -0.58953857421875, -0.5531463623046875, -0.516754150390625, -0.4803619384765625, -0.4439697265625, -0.4075775146484375, -0.371185302734375, -0.3347930908203125, -0.29840087890625, -0.2620086669921875, -0.225616455078125, -0.1892242431640625, -0.15283203125, -0.1164398193359375, -0.080047607421875, -0.0436553955078125, -0.00726318359375, 0.0291290283203125, 0.065521240234375, 0.1019134521484375, 0.1383056640625, 0.1746978759765625, 0.211090087890625, 0.2474822998046875, 0.28387451171875, 0.3202667236328125, 0.356658935546875, 0.3930511474609375, 0.429443359375, 0.4658355712890625, 0.502227783203125, 0.5386199951171875, 0.57501220703125, 0.6114044189453125, 0.647796630859375, 0.6841888427734375, 0.7205810546875, 0.7569732666015625, 0.793365478515625, 0.8297576904296875, 0.86614990234375, 0.9025421142578125, 0.938934326171875, 0.9753265380859375, 1.01171875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 436.0, 550.0, 21.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5149092674255371, -0.49349889159202576, -0.4720885455608368, -0.45067816972732544, -0.4292678236961365, -0.4078574478626251, -0.38644707202911377, -0.3650367259979248, -0.34362637996673584, -0.3222160041332245, -0.3008056581020355, -0.27939528226852417, -0.2579849362373352, -0.23657456040382385, -0.2151641994714737, -0.19375383853912354, -0.17234346270561218, -0.15093310177326202, -0.12952274084091187, -0.10811237245798111, -0.08670201152563095, -0.06529165059328079, -0.04388128221035004, -0.022470921277999878, -0.0010605603456497192, 0.02034980244934559, 0.0417601652443409, 0.06317052990198135, 0.08458089083433151, 0.10599125176668167, 0.12740162014961243, 0.14881198108196259, 0.17022234201431274, 0.1916327029466629, 0.21304306387901306, 0.23445343971252441, 0.2558637857437134, 0.27727416157722473, 0.2986845374107361, 0.32009488344192505, 0.341505229473114, 0.36291560530662537, 0.38432595133781433, 0.4057363271713257, 0.42714667320251465, 0.448557049036026, 0.46996742486953735, 0.4913777709007263, 0.5127881765365601, 0.534198522567749, 0.5556089282035828, 0.5770192742347717, 0.5984296202659607, 0.6198399662971497, 0.6412503719329834, 0.6626607179641724, 0.6840710639953613, 0.7054814100265503, 0.726891815662384, 0.748302161693573, 0.769712507724762, 0.7911228537559509, 0.8125332593917847, 0.8339436054229736, 0.8553539514541626]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 10.0, 7.0, 8.0, 8.0, 18.0, 17.0, 22.0, 34.0, 31.0, 25.0, 34.0, 41.0, 34.0, 48.0, 45.0, 64.0, 47.0, 44.0, 49.0, 59.0, 45.0, 43.0, 34.0, 39.0, 29.0, 34.0, 20.0, 16.0, 16.0, 18.0, 13.0, 11.0, 10.0, 8.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.14089655876159668, -0.1370643824338913, -0.1332322210073471, -0.12940004467964172, -0.12556788325309753, -0.12173570692539215, -0.11790353059768677, -0.11407136172056198, -0.1102391928434372, -0.10640702396631241, -0.10257485508918762, -0.09874267876148224, -0.09491050988435745, -0.09107834100723267, -0.08724616467952728, -0.0834139958024025, -0.07958182692527771, -0.07574965804815292, -0.07191748917102814, -0.06808531284332275, -0.06425314396619797, -0.06042097508907318, -0.056588802486658096, -0.05275662988424301, -0.048924461007118225, -0.04509229212999344, -0.041260119527578354, -0.03742794692516327, -0.03359577804803848, -0.029763607308268547, -0.02593143656849861, -0.022099265828728676, -0.01826709508895874, -0.014434924349188805, -0.010602753609418869, -0.006770582869648933, -0.002938412129878998, 0.0008937586098909378, 0.004725929349660873, 0.008558100089430809, 0.012390270829200745, 0.01622244156897068, 0.020054612308740616, 0.02388678304851055, 0.027718953788280487, 0.03155112266540527, 0.03538329526782036, 0.03921546787023544, 0.04304763674736023, 0.046879805624485016, 0.0507119782269001, 0.054544150829315186, 0.05837631970643997, 0.06220848858356476, 0.06604066491127014, 0.06987283378839493, 0.07370500266551971, 0.0775371715426445, 0.08136934041976929, 0.08520151674747467, 0.08903368562459946, 0.09286585450172424, 0.09669803082942963, 0.10053019970655441, 0.1043623685836792]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 9.0, 11.0, 5.0, 9.0, 11.0, 10.0, 13.0, 21.0, 14.0, 27.0, 22.0, 39.0, 24.0, 34.0, 32.0, 41.0, 45.0, 38.0, 43.0, 46.0, 54.0, 42.0, 46.0, 40.0, 47.0, 37.0, 31.0, 27.0, 36.0, 31.0, 27.0, 12.0, 20.0, 12.0, 15.0, 5.0, 16.0, 5.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0], "bins": [-10.53125, -10.2371826171875, -9.943115234375, -9.6490478515625, -9.35498046875, -9.0609130859375, -8.766845703125, -8.4727783203125, -8.1787109375, -7.8846435546875, -7.590576171875, -7.2965087890625, -7.00244140625, -6.7083740234375, -6.414306640625, -6.1202392578125, -5.826171875, -5.5321044921875, -5.238037109375, -4.9439697265625, -4.64990234375, -4.3558349609375, -4.061767578125, -3.7677001953125, -3.4736328125, -3.1795654296875, -2.885498046875, -2.5914306640625, -2.29736328125, -2.0032958984375, -1.709228515625, -1.4151611328125, -1.12109375, -0.8270263671875, -0.532958984375, -0.2388916015625, 0.05517578125, 0.3492431640625, 0.643310546875, 0.9373779296875, 1.2314453125, 1.5255126953125, 1.819580078125, 2.1136474609375, 2.40771484375, 2.7017822265625, 2.995849609375, 3.2899169921875, 3.583984375, 3.8780517578125, 4.172119140625, 4.4661865234375, 4.76025390625, 5.0543212890625, 5.348388671875, 5.6424560546875, 5.9365234375, 6.2305908203125, 6.524658203125, 6.8187255859375, 7.11279296875, 7.4068603515625, 7.700927734375, 7.9949951171875, 8.2890625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 11.0, 7.0, 16.0, 18.0, 36.0, 43.0, 47.0, 63.0, 119.0, 170.0, 292.0, 606.0, 1429.0, 3425.0, 8411.0, 22898.0, 77910.0, 461692.0, 374349.0, 63992.0, 19712.0, 7625.0, 3069.0, 1304.0, 542.0, 294.0, 157.0, 84.0, 76.0, 41.0, 23.0, 29.0, 19.0, 12.0, 6.0, 6.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.08544921875, -16.5146484375, -15.94384765625, -15.373046875, -14.80224609375, -14.2314453125, -13.66064453125, -13.08984375, -12.51904296875, -11.9482421875, -11.37744140625, -10.806640625, -10.23583984375, -9.6650390625, -9.09423828125, -8.5234375, -7.95263671875, -7.3818359375, -6.81103515625, -6.240234375, -5.66943359375, -5.0986328125, -4.52783203125, -3.95703125, -3.38623046875, -2.8154296875, -2.24462890625, -1.673828125, -1.10302734375, -0.5322265625, 0.03857421875, 0.609375, 1.18017578125, 1.7509765625, 2.32177734375, 2.892578125, 3.46337890625, 4.0341796875, 4.60498046875, 5.17578125, 5.74658203125, 6.3173828125, 6.88818359375, 7.458984375, 8.02978515625, 8.6005859375, 9.17138671875, 9.7421875, 10.31298828125, 10.8837890625, 11.45458984375, 12.025390625, 12.59619140625, 13.1669921875, 13.73779296875, 14.30859375, 14.87939453125, 15.4501953125, 16.02099609375, 16.591796875, 17.16259765625, 17.7333984375, 18.30419921875, 18.875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 11.0, 8.0, 11.0, 9.0, 11.0, 19.0, 18.0, 30.0, 22.0, 29.0, 40.0, 54.0, 47.0, 63.0, 87.0, 132.0, 350.0, 1418.0, 176.0, 88.0, 61.0, 44.0, 49.0, 34.0, 38.0, 33.0, 18.0, 30.0, 22.0, 11.0, 14.0, 12.0, 13.0, 12.0, 6.0, 9.0, 4.0, 3.0, 4.0, 3.0], "bins": [-33.125, -32.318115234375, -31.51123046875, -30.704345703125, -29.8974609375, -29.090576171875, -28.28369140625, -27.476806640625, -26.669921875, -25.863037109375, -25.05615234375, -24.249267578125, -23.4423828125, -22.635498046875, -21.82861328125, -21.021728515625, -20.21484375, -19.407958984375, -18.60107421875, -17.794189453125, -16.9873046875, -16.180419921875, -15.37353515625, -14.566650390625, -13.759765625, -12.952880859375, -12.14599609375, -11.339111328125, -10.5322265625, -9.725341796875, -8.91845703125, -8.111572265625, -7.3046875, -6.497802734375, -5.69091796875, -4.884033203125, -4.0771484375, -3.270263671875, -2.46337890625, -1.656494140625, -0.849609375, -0.042724609375, 0.76416015625, 1.571044921875, 2.3779296875, 3.184814453125, 3.99169921875, 4.798583984375, 5.60546875, 6.412353515625, 7.21923828125, 8.026123046875, 8.8330078125, 9.639892578125, 10.44677734375, 11.253662109375, 12.060546875, 12.867431640625, 13.67431640625, 14.481201171875, 15.2880859375, 16.094970703125, 16.90185546875, 17.708740234375, 18.515625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 10.0, 11.0, 13.0, 14.0, 30.0, 31.0, 39.0, 43.0, 66.0, 90.0, 110.0, 166.0, 288.0, 516.0, 1659.0, 12914.0, 482822.0, 2608533.0, 33439.0, 3164.0, 725.0, 339.0, 209.0, 117.0, 100.0, 76.0, 46.0, 29.0, 26.0, 16.0, 18.0, 13.0, 8.0, 11.0, 3.0, 6.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.875, -45.37158203125, -43.8681640625, -42.36474609375, -40.861328125, -39.35791015625, -37.8544921875, -36.35107421875, -34.84765625, -33.34423828125, -31.8408203125, -30.33740234375, -28.833984375, -27.33056640625, -25.8271484375, -24.32373046875, -22.8203125, -21.31689453125, -19.8134765625, -18.31005859375, -16.806640625, -15.30322265625, -13.7998046875, -12.29638671875, -10.79296875, -9.28955078125, -7.7861328125, -6.28271484375, -4.779296875, -3.27587890625, -1.7724609375, -0.26904296875, 1.234375, 2.73779296875, 4.2412109375, 5.74462890625, 7.248046875, 8.75146484375, 10.2548828125, 11.75830078125, 13.26171875, 14.76513671875, 16.2685546875, 17.77197265625, 19.275390625, 20.77880859375, 22.2822265625, 23.78564453125, 25.2890625, 26.79248046875, 28.2958984375, 29.79931640625, 31.302734375, 32.80615234375, 34.3095703125, 35.81298828125, 37.31640625, 38.81982421875, 40.3232421875, 41.82666015625, 43.330078125, 44.83349609375, 46.3369140625, 47.84033203125, 49.34375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 36.0, 121.0, 227.0, 320.0, 206.0, 68.0, 24.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.579010009765625, -34.550235748291016, -31.521461486816406, -28.492687225341797, -25.463912963867188, -22.435138702392578, -19.40636444091797, -16.37759017944336, -13.34881591796875, -10.32004165649414, -7.291267395019531, -4.262493133544922, -1.2337188720703125, 1.7950553894042969, 4.823829650878906, 7.852603912353516, 10.881378173828125, 13.910152435302734, 16.938926696777344, 19.967700958251953, 22.996475219726562, 26.025249481201172, 29.05402374267578, 32.08279800415039, 35.111572265625, 38.14034652709961, 41.16912078857422, 44.19789505004883, 47.22666931152344, 50.25544357299805, 53.284217834472656, 56.312992095947266, 59.341766357421875, 62.370540618896484, 65.3993148803711, 68.42808532714844, 71.45686340332031, 74.48564147949219, 77.51441192626953, 80.54318237304688, 83.57196044921875, 86.60073852539062, 89.62950897216797, 92.65827941894531, 95.68705749511719, 98.71583557128906, 101.7446060180664, 104.77337646484375, 107.80215454101562, 110.8309326171875, 113.85970306396484, 116.88847351074219, 119.91725158691406, 122.94602966308594, 125.97480010986328, 129.00357055664062, 132.0323486328125, 135.06112670898438, 138.08990478515625, 141.11866760253906, 144.14744567871094, 147.1762237548828, 150.20498657226562, 153.2337646484375, 156.26254272460938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 5.0, 6.0, 8.0, 13.0, 11.0, 12.0, 15.0, 14.0, 19.0, 22.0, 31.0, 27.0, 25.0, 28.0, 44.0, 33.0, 26.0, 27.0, 26.0, 25.0, 31.0, 40.0, 44.0, 48.0, 28.0, 38.0, 31.0, 25.0, 32.0, 24.0, 35.0, 20.0, 22.0, 24.0, 23.0, 11.0, 17.0, 15.0, 11.0, 13.0, 10.0, 2.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-54.21595001220703, -52.552249908447266, -50.8885498046875, -49.22484588623047, -47.5611457824707, -45.89744567871094, -44.233741760253906, -42.57004165649414, -40.906341552734375, -39.24264144897461, -37.578941345214844, -35.91523742675781, -34.25153732299805, -32.58783721923828, -30.924135208129883, -29.260433197021484, -27.59673309326172, -25.933032989501953, -24.269330978393555, -22.605628967285156, -20.94192886352539, -19.278228759765625, -17.614526748657227, -15.950825691223145, -14.287124633789062, -12.62342357635498, -10.959722518920898, -9.296021461486816, -7.632320404052734, -5.968619346618652, -4.30491828918457, -2.6412172317504883, -0.9775161743164062, 0.6861848831176758, 2.349885940551758, 4.01358699798584, 5.677288055419922, 7.340989112854004, 9.004690170288086, 10.668391227722168, 12.33209228515625, 13.995793342590332, 15.659494400024414, 17.323196411132812, 18.986896514892578, 20.650596618652344, 22.314298629760742, 23.97800064086914, 25.641700744628906, 27.305400848388672, 28.96910285949707, 30.63280487060547, 32.296504974365234, 33.960205078125, 35.62390899658203, 37.2876091003418, 38.95130920410156, 40.61500930786133, 42.278709411621094, 43.942413330078125, 45.60611343383789, 47.269813537597656, 48.93351745605469, 50.59721755981445, 52.26091766357422]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 7.0, 4.0, 11.0, 10.0, 7.0, 11.0, 13.0, 21.0, 20.0, 20.0, 28.0, 28.0, 30.0, 42.0, 31.0, 37.0, 42.0, 45.0, 38.0, 39.0, 50.0, 40.0, 36.0, 57.0, 30.0, 33.0, 44.0, 41.0, 27.0, 32.0, 19.0, 21.0, 20.0, 8.0, 11.0, 8.0, 7.0, 5.0, 5.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-10.8203125, -10.52740478515625, -10.2344970703125, -9.94158935546875, -9.648681640625, -9.35577392578125, -9.0628662109375, -8.76995849609375, -8.47705078125, -8.18414306640625, -7.8912353515625, -7.59832763671875, -7.305419921875, -7.01251220703125, -6.7196044921875, -6.42669677734375, -6.1337890625, -5.84088134765625, -5.5479736328125, -5.25506591796875, -4.962158203125, -4.66925048828125, -4.3763427734375, -4.08343505859375, -3.79052734375, -3.49761962890625, -3.2047119140625, -2.91180419921875, -2.618896484375, -2.32598876953125, -2.0330810546875, -1.74017333984375, -1.447265625, -1.15435791015625, -0.8614501953125, -0.56854248046875, -0.275634765625, 0.01727294921875, 0.3101806640625, 0.60308837890625, 0.89599609375, 1.18890380859375, 1.4818115234375, 1.77471923828125, 2.067626953125, 2.36053466796875, 2.6534423828125, 2.94635009765625, 3.2392578125, 3.53216552734375, 3.8250732421875, 4.11798095703125, 4.410888671875, 4.70379638671875, 4.9967041015625, 5.28961181640625, 5.58251953125, 5.87542724609375, 6.1683349609375, 6.46124267578125, 6.754150390625, 7.04705810546875, 7.3399658203125, 7.63287353515625, 7.92578125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 2.0, 12.0, 5.0, 11.0, 12.0, 24.0, 17.0, 39.0, 69.0, 81.0, 124.0, 228.0, 379.0, 800.0, 2118.0, 6559.0, 24144.0, 101229.0, 421134.0, 1363800.0, 1551990.0, 544501.0, 132816.0, 31382.0, 8213.0, 2532.0, 948.0, 452.0, 244.0, 132.0, 65.0, 74.0, 35.0, 26.0, 25.0, 16.0, 12.0, 5.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.0078125, -11.62158203125, -11.2353515625, -10.84912109375, -10.462890625, -10.07666015625, -9.6904296875, -9.30419921875, -8.91796875, -8.53173828125, -8.1455078125, -7.75927734375, -7.373046875, -6.98681640625, -6.6005859375, -6.21435546875, -5.828125, -5.44189453125, -5.0556640625, -4.66943359375, -4.283203125, -3.89697265625, -3.5107421875, -3.12451171875, -2.73828125, -2.35205078125, -1.9658203125, -1.57958984375, -1.193359375, -0.80712890625, -0.4208984375, -0.03466796875, 0.3515625, 0.73779296875, 1.1240234375, 1.51025390625, 1.896484375, 2.28271484375, 2.6689453125, 3.05517578125, 3.44140625, 3.82763671875, 4.2138671875, 4.60009765625, 4.986328125, 5.37255859375, 5.7587890625, 6.14501953125, 6.53125, 6.91748046875, 7.3037109375, 7.68994140625, 8.076171875, 8.46240234375, 8.8486328125, 9.23486328125, 9.62109375, 10.00732421875, 10.3935546875, 10.77978515625, 11.166015625, 11.55224609375, 11.9384765625, 12.32470703125, 12.7109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 8.0, 15.0, 25.0, 13.0, 29.0, 35.0, 48.0, 67.0, 106.0, 103.0, 150.0, 179.0, 204.0, 299.0, 322.0, 345.0, 365.0, 339.0, 296.0, 255.0, 197.0, 158.0, 120.0, 91.0, 61.0, 54.0, 35.0, 45.0, 18.0, 13.0, 16.0, 12.0, 12.0, 2.0, 7.0, 4.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-12.875, -12.5189208984375, -12.162841796875, -11.8067626953125, -11.45068359375, -11.0946044921875, -10.738525390625, -10.3824462890625, -10.0263671875, -9.6702880859375, -9.314208984375, -8.9581298828125, -8.60205078125, -8.2459716796875, -7.889892578125, -7.5338134765625, -7.177734375, -6.8216552734375, -6.465576171875, -6.1094970703125, -5.75341796875, -5.3973388671875, -5.041259765625, -4.6851806640625, -4.3291015625, -3.9730224609375, -3.616943359375, -3.2608642578125, -2.90478515625, -2.5487060546875, -2.192626953125, -1.8365478515625, -1.48046875, -1.1243896484375, -0.768310546875, -0.4122314453125, -0.05615234375, 0.2999267578125, 0.656005859375, 1.0120849609375, 1.3681640625, 1.7242431640625, 2.080322265625, 2.4364013671875, 2.79248046875, 3.1485595703125, 3.504638671875, 3.8607177734375, 4.216796875, 4.5728759765625, 4.928955078125, 5.2850341796875, 5.64111328125, 5.9971923828125, 6.353271484375, 6.7093505859375, 7.0654296875, 7.4215087890625, 7.777587890625, 8.1336669921875, 8.48974609375, 8.8458251953125, 9.201904296875, 9.5579833984375, 9.9140625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 1.0, 4.0, 7.0, 5.0, 7.0, 9.0, 16.0, 24.0, 37.0, 45.0, 61.0, 84.0, 95.0, 176.0, 261.0, 400.0, 694.0, 1888.0, 11038.0, 147221.0, 2399870.0, 1538960.0, 83016.0, 7179.0, 1470.0, 632.0, 322.0, 219.0, 148.0, 119.0, 72.0, 58.0, 28.0, 27.0, 28.0, 18.0, 13.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.359375, -26.378662109375, -25.39794921875, -24.417236328125, -23.4365234375, -22.455810546875, -21.47509765625, -20.494384765625, -19.513671875, -18.532958984375, -17.55224609375, -16.571533203125, -15.5908203125, -14.610107421875, -13.62939453125, -12.648681640625, -11.66796875, -10.687255859375, -9.70654296875, -8.725830078125, -7.7451171875, -6.764404296875, -5.78369140625, -4.802978515625, -3.822265625, -2.841552734375, -1.86083984375, -0.880126953125, 0.1005859375, 1.081298828125, 2.06201171875, 3.042724609375, 4.0234375, 5.004150390625, 5.98486328125, 6.965576171875, 7.9462890625, 8.927001953125, 9.90771484375, 10.888427734375, 11.869140625, 12.849853515625, 13.83056640625, 14.811279296875, 15.7919921875, 16.772705078125, 17.75341796875, 18.734130859375, 19.71484375, 20.695556640625, 21.67626953125, 22.656982421875, 23.6376953125, 24.618408203125, 25.59912109375, 26.579833984375, 27.560546875, 28.541259765625, 29.52197265625, 30.502685546875, 31.4833984375, 32.464111328125, 33.44482421875, 34.425537109375, 35.40625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 60.0, 586.0, 332.0, 33.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.62297058105469, -90.15222930908203, -78.68148803710938, -67.21073913574219, -55.7400016784668, -44.26926040649414, -32.79851531982422, -21.327774047851562, -9.857032775878906, 1.6137094497680664, 13.084451675415039, 24.555194854736328, 36.025936126708984, 47.49667739868164, 58.96742248535156, 70.43816375732422, 81.90890502929688, 93.37964630126953, 104.85038757324219, 116.32113647460938, 127.7918701171875, 139.2626190185547, 150.73336791992188, 162.2041015625, 173.67483520507812, 185.1455841064453, 196.61631774902344, 208.08706665039062, 219.55780029296875, 231.02854919433594, 242.49929809570312, 253.97003173828125, 265.4407653808594, 276.9114990234375, 288.38226318359375, 299.8529968261719, 311.32373046875, 322.7944641113281, 334.2652282714844, 345.7359619140625, 357.2066955566406, 368.67742919921875, 380.148193359375, 391.6189270019531, 403.08966064453125, 414.5603942871094, 426.0311584472656, 437.50189208984375, 448.97265625, 460.4433898925781, 471.9141540527344, 483.3848876953125, 494.8556213378906, 506.32635498046875, 517.797119140625, 529.267822265625, 540.7385864257812, 552.2093505859375, 563.6800537109375, 575.1508178710938, 586.62158203125, 598.09228515625, 609.5630493164062, 621.0338134765625, 632.5045166015625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 5.0, 10.0, 14.0, 12.0, 16.0, 18.0, 20.0, 22.0, 26.0, 31.0, 25.0, 27.0, 30.0, 41.0, 34.0, 45.0, 50.0, 44.0, 44.0, 46.0, 40.0, 37.0, 45.0, 38.0, 28.0, 32.0, 25.0, 35.0, 24.0, 22.0, 14.0, 8.0, 17.0, 18.0, 10.0, 7.0, 6.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.23480987548828, -38.83597183227539, -37.4371337890625, -36.038291931152344, -34.63945388793945, -33.24061584472656, -31.84177589416504, -30.442935943603516, -29.044097900390625, -27.645259857177734, -26.24641990661621, -24.847579956054688, -23.448741912841797, -22.049903869628906, -20.651063919067383, -19.25222396850586, -17.85338592529297, -16.454547882080078, -15.055707931518555, -13.656868934631348, -12.25802993774414, -10.859190940856934, -9.460351943969727, -8.06151294708252, -6.6626739501953125, -5.2638349533081055, -3.8649959564208984, -2.4661569595336914, -1.0673179626464844, 0.33152103424072266, 1.7303600311279297, 3.1291990280151367, 4.528034210205078, 5.926873207092285, 7.325712203979492, 8.7245512008667, 10.123390197753906, 11.522229194641113, 12.92106819152832, 14.319907188415527, 15.718746185302734, 17.117584228515625, 18.51642417907715, 19.915264129638672, 21.314102172851562, 22.712940216064453, 24.111780166625977, 25.5106201171875, 26.90945816040039, 28.30829620361328, 29.707136154174805, 31.105976104736328, 32.50481414794922, 33.90365219116211, 35.302490234375, 36.701332092285156, 38.10017013549805, 39.49900817871094, 40.897850036621094, 42.296688079833984, 43.695526123046875, 45.094364166259766, 46.493202209472656, 47.89204406738281, 49.2908821105957]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 6.0, 9.0, 9.0, 12.0, 11.0, 22.0, 14.0, 18.0, 21.0, 15.0, 18.0, 38.0, 30.0, 41.0, 26.0, 51.0, 43.0, 42.0, 45.0, 36.0, 47.0, 32.0, 31.0, 29.0, 39.0, 42.0, 42.0, 32.0, 26.0, 26.0, 34.0, 14.0, 12.0, 11.0, 4.0, 7.0, 7.0, 11.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.265625, -8.00537109375, -7.7451171875, -7.48486328125, -7.224609375, -6.96435546875, -6.7041015625, -6.44384765625, -6.18359375, -5.92333984375, -5.6630859375, -5.40283203125, -5.142578125, -4.88232421875, -4.6220703125, -4.36181640625, -4.1015625, -3.84130859375, -3.5810546875, -3.32080078125, -3.060546875, -2.80029296875, -2.5400390625, -2.27978515625, -2.01953125, -1.75927734375, -1.4990234375, -1.23876953125, -0.978515625, -0.71826171875, -0.4580078125, -0.19775390625, 0.0625, 0.32275390625, 0.5830078125, 0.84326171875, 1.103515625, 1.36376953125, 1.6240234375, 1.88427734375, 2.14453125, 2.40478515625, 2.6650390625, 2.92529296875, 3.185546875, 3.44580078125, 3.7060546875, 3.96630859375, 4.2265625, 4.48681640625, 4.7470703125, 5.00732421875, 5.267578125, 5.52783203125, 5.7880859375, 6.04833984375, 6.30859375, 6.56884765625, 6.8291015625, 7.08935546875, 7.349609375, 7.60986328125, 7.8701171875, 8.13037109375, 8.390625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 14.0, 9.0, 20.0, 37.0, 44.0, 80.0, 102.0, 198.0, 293.0, 425.0, 609.0, 862.0, 1409.0, 2053.0, 3116.0, 4690.0, 7024.0, 10188.0, 15017.0, 21710.0, 30820.0, 43139.0, 57677.0, 74228.0, 90615.0, 104439.0, 109799.0, 104276.0, 91303.0, 74631.0, 57656.0, 42869.0, 30965.0, 21723.0, 15224.0, 10169.0, 7059.0, 4616.0, 3192.0, 2075.0, 1451.0, 927.0, 642.0, 389.0, 245.0, 180.0, 119.0, 89.0, 55.0, 32.0, 19.0, 16.0, 10.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.84521484375, -0.8175048828125, -0.789794921875, -0.7620849609375, -0.734375, -0.7066650390625, -0.678955078125, -0.6512451171875, -0.62353515625, -0.5958251953125, -0.568115234375, -0.5404052734375, -0.5126953125, -0.4849853515625, -0.457275390625, -0.4295654296875, -0.40185546875, -0.3741455078125, -0.346435546875, -0.3187255859375, -0.291015625, -0.2633056640625, -0.235595703125, -0.2078857421875, -0.18017578125, -0.1524658203125, -0.124755859375, -0.0970458984375, -0.0693359375, -0.0416259765625, -0.013916015625, 0.0137939453125, 0.04150390625, 0.0692138671875, 0.096923828125, 0.1246337890625, 0.15234375, 0.1800537109375, 0.207763671875, 0.2354736328125, 0.26318359375, 0.2908935546875, 0.318603515625, 0.3463134765625, 0.3740234375, 0.4017333984375, 0.429443359375, 0.4571533203125, 0.48486328125, 0.5125732421875, 0.540283203125, 0.5679931640625, 0.595703125, 0.6234130859375, 0.651123046875, 0.6788330078125, 0.70654296875, 0.7342529296875, 0.761962890625, 0.7896728515625, 0.8173828125, 0.8450927734375, 0.872802734375, 0.9005126953125, 0.92822265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 9.0, 15.0, 7.0, 17.0, 13.0, 16.0, 21.0, 18.0, 26.0, 20.0, 25.0, 26.0, 34.0, 34.0, 33.0, 31.0, 31.0, 30.0, 1055.0, 30.0, 44.0, 39.0, 39.0, 38.0, 34.0, 22.0, 34.0, 25.0, 23.0, 25.0, 23.0, 25.0, 19.0, 21.0, 17.0, 10.0, 12.0, 10.0, 9.0, 4.0, 3.0, 9.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-4.70703125, -4.55987548828125, -4.4127197265625, -4.26556396484375, -4.118408203125, -3.97125244140625, -3.8240966796875, -3.67694091796875, -3.52978515625, -3.38262939453125, -3.2354736328125, -3.08831787109375, -2.941162109375, -2.79400634765625, -2.6468505859375, -2.49969482421875, -2.3525390625, -2.20538330078125, -2.0582275390625, -1.91107177734375, -1.763916015625, -1.61676025390625, -1.4696044921875, -1.32244873046875, -1.17529296875, -1.02813720703125, -0.8809814453125, -0.73382568359375, -0.586669921875, -0.43951416015625, -0.2923583984375, -0.14520263671875, 0.001953125, 0.14910888671875, 0.2962646484375, 0.44342041015625, 0.590576171875, 0.73773193359375, 0.8848876953125, 1.03204345703125, 1.17919921875, 1.32635498046875, 1.4735107421875, 1.62066650390625, 1.767822265625, 1.91497802734375, 2.0621337890625, 2.20928955078125, 2.3564453125, 2.50360107421875, 2.6507568359375, 2.79791259765625, 2.945068359375, 3.09222412109375, 3.2393798828125, 3.38653564453125, 3.53369140625, 3.68084716796875, 3.8280029296875, 3.97515869140625, 4.122314453125, 4.26947021484375, 4.4166259765625, 4.56378173828125, 4.7109375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 3.0, 9.0, 8.0, 16.0, 9.0, 16.0, 29.0, 62.0, 81.0, 111.0, 170.0, 231.0, 328.0, 469.0, 613.0, 872.0, 1187.0, 1644.0, 2257.0, 2997.0, 4159.0, 5772.0, 7670.0, 10539.0, 14558.0, 19949.0, 28489.0, 1670347.0, 226580.0, 26916.0, 19156.0, 13903.0, 10365.0, 7477.0, 5565.0, 4047.0, 2945.0, 2047.0, 1602.0, 1149.0, 805.0, 569.0, 418.0, 298.0, 218.0, 137.0, 94.0, 71.0, 63.0, 38.0, 26.0, 19.0, 12.0, 10.0, 5.0, 1.0, 2.0, 5.0, 2.0, 1.0], "bins": [-1.5615234375, -1.51263427734375, -1.4637451171875, -1.41485595703125, -1.365966796875, -1.31707763671875, -1.2681884765625, -1.21929931640625, -1.17041015625, -1.12152099609375, -1.0726318359375, -1.02374267578125, -0.974853515625, -0.92596435546875, -0.8770751953125, -0.82818603515625, -0.779296875, -0.73040771484375, -0.6815185546875, -0.63262939453125, -0.583740234375, -0.53485107421875, -0.4859619140625, -0.43707275390625, -0.38818359375, -0.33929443359375, -0.2904052734375, -0.24151611328125, -0.192626953125, -0.14373779296875, -0.0948486328125, -0.04595947265625, 0.0029296875, 0.05181884765625, 0.1007080078125, 0.14959716796875, 0.198486328125, 0.24737548828125, 0.2962646484375, 0.34515380859375, 0.39404296875, 0.44293212890625, 0.4918212890625, 0.54071044921875, 0.589599609375, 0.63848876953125, 0.6873779296875, 0.73626708984375, 0.78515625, 0.83404541015625, 0.8829345703125, 0.93182373046875, 0.980712890625, 1.02960205078125, 1.0784912109375, 1.12738037109375, 1.17626953125, 1.22515869140625, 1.2740478515625, 1.32293701171875, 1.371826171875, 1.42071533203125, 1.4696044921875, 1.51849365234375, 1.5673828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 3.0, 7.0, 8.0, 10.0, 19.0, 27.0, 24.0, 39.0, 76.0, 90.0, 105.0, 118.0, 105.0, 87.0, 65.0, 61.0, 37.0, 23.0, 15.0, 10.0, 8.0, 7.0, 4.0, 2.0, 1.0, 6.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04852294921875, -0.046990394592285156, -0.04545783996582031, -0.04392528533935547, -0.042392730712890625, -0.04086017608642578, -0.03932762145996094, -0.037795066833496094, -0.03626251220703125, -0.034729957580566406, -0.03319740295410156, -0.03166484832763672, -0.030132293701171875, -0.02859973907470703, -0.027067184448242188, -0.025534629821777344, -0.0240020751953125, -0.022469520568847656, -0.020936965942382812, -0.01940441131591797, -0.017871856689453125, -0.01633930206298828, -0.014806747436523438, -0.013274192810058594, -0.01174163818359375, -0.010209083557128906, -0.008676528930664062, -0.007143974304199219, -0.005611419677734375, -0.004078865051269531, -0.0025463104248046875, -0.0010137557983398438, 0.000518798828125, 0.0020513534545898438, 0.0035839080810546875, 0.005116462707519531, 0.006649017333984375, 0.008181571960449219, 0.009714126586914062, 0.011246681213378906, 0.01277923583984375, 0.014311790466308594, 0.015844345092773438, 0.01737689971923828, 0.018909454345703125, 0.02044200897216797, 0.021974563598632812, 0.023507118225097656, 0.0250396728515625, 0.026572227478027344, 0.028104782104492188, 0.02963733673095703, 0.031169891357421875, 0.03270244598388672, 0.03423500061035156, 0.035767555236816406, 0.03730010986328125, 0.038832664489746094, 0.04036521911621094, 0.04189777374267578, 0.043430328369140625, 0.04496288299560547, 0.04649543762207031, 0.048027992248535156, 0.049560546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 1.0, 7.0, 10.0, 8.0, 8.0, 17.0, 32.0, 28.0, 80.0, 121.0, 184.0, 502.0, 12856.0, 1032255.0, 1603.0, 340.0, 169.0, 109.0, 52.0, 40.0, 32.0, 11.0, 8.0, 7.0, 11.0, 5.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1396484375, -1.104400634765625, -1.06915283203125, -1.033905029296875, -0.9986572265625, -0.963409423828125, -0.92816162109375, -0.892913818359375, -0.857666015625, -0.822418212890625, -0.78717041015625, -0.751922607421875, -0.7166748046875, -0.681427001953125, -0.64617919921875, -0.610931396484375, -0.57568359375, -0.540435791015625, -0.50518798828125, -0.469940185546875, -0.4346923828125, -0.399444580078125, -0.36419677734375, -0.328948974609375, -0.293701171875, -0.258453369140625, -0.22320556640625, -0.187957763671875, -0.1527099609375, -0.117462158203125, -0.08221435546875, -0.046966552734375, -0.01171875, 0.023529052734375, 0.05877685546875, 0.094024658203125, 0.1292724609375, 0.164520263671875, 0.19976806640625, 0.235015869140625, 0.270263671875, 0.305511474609375, 0.34075927734375, 0.376007080078125, 0.4112548828125, 0.446502685546875, 0.48175048828125, 0.516998291015625, 0.55224609375, 0.587493896484375, 0.62274169921875, 0.657989501953125, 0.6932373046875, 0.728485107421875, 0.76373291015625, 0.798980712890625, 0.834228515625, 0.869476318359375, 0.90472412109375, 0.939971923828125, 0.9752197265625, 1.010467529296875, 1.04571533203125, 1.080963134765625, 1.1162109375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 15.0, 74.0, 516.0, 342.0, 50.0, 10.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.34927070140838623, -0.33952271938323975, -0.32977473735809326, -0.32002678513526917, -0.3102788031101227, -0.3005308210849762, -0.2907828390598297, -0.2810348570346832, -0.27128690481185913, -0.26153892278671265, -0.25179094076156616, -0.24204297363758087, -0.23229500651359558, -0.2225470244884491, -0.2127990424633026, -0.20305106043815613, -0.19330307841300964, -0.18355509638786316, -0.17380712926387787, -0.16405914723873138, -0.1543111801147461, -0.1445631980895996, -0.13481521606445312, -0.12506723403930664, -0.11531926691532135, -0.10557129234075546, -0.09582331776618958, -0.08607533574104309, -0.0763273611664772, -0.06657938659191132, -0.05683140829205513, -0.047083429992198944, -0.03733545541763306, -0.02758747898042202, -0.017839502543210983, -0.008091526105999947, 0.00165645033121109, 0.011404424905776978, 0.021152403205633163, 0.03090038150548935, 0.04064835608005524, 0.050396330654621124, 0.06014430895447731, 0.0698922872543335, 0.07964026182889938, 0.08938823640346527, 0.09913621842861176, 0.10888419300317764, 0.11863216757774353, 0.12838014960289001, 0.1381281167268753, 0.1478760987520218, 0.15762406587600708, 0.16737204790115356, 0.17712002992630005, 0.18686801195144653, 0.19661597907543182, 0.2063639611005783, 0.2161119282245636, 0.22585991024971008, 0.23560789227485657, 0.24535585939884186, 0.25510382652282715, 0.26485180854797363, 0.2745997905731201]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 8.0, 12.0, 12.0, 17.0, 16.0, 18.0, 30.0, 32.0, 37.0, 30.0, 49.0, 43.0, 47.0, 40.0, 55.0, 36.0, 49.0, 45.0, 57.0, 46.0, 40.0, 40.0, 36.0, 30.0, 30.0, 25.0, 24.0, 24.0, 15.0, 13.0, 15.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06502461433410645, -0.06309106945991516, -0.06115752086043358, -0.059223972260951996, -0.05729042738676071, -0.05535688251256943, -0.053423333913087845, -0.05148978531360626, -0.04955624043941498, -0.047622695565223694, -0.04568914696574211, -0.04375559836626053, -0.041822053492069244, -0.03988850861787796, -0.03795496001839638, -0.036021411418914795, -0.03408786654472351, -0.03215432167053223, -0.030220773071050644, -0.02828722633421421, -0.026353679597377777, -0.024420132860541344, -0.02248658612370491, -0.020553039386868477, -0.018619492650032043, -0.01668594591319561, -0.014752399176359177, -0.012818852439522743, -0.01088530570268631, -0.008951758965849876, -0.007018212229013443, -0.00508466549217701, -0.003151118755340576, -0.0012175720185041428, 0.0007159747183322906, 0.002649521455168724, 0.0045830681920051575, 0.006516614928841591, 0.008450161665678024, 0.010383708402514458, 0.012317255139350891, 0.014250801876187325, 0.016184348613023758, 0.01811789534986019, 0.020051442086696625, 0.021984988823533058, 0.02391853556036949, 0.025852082297205925, 0.02778562903404236, 0.029719175770878792, 0.031652722507715225, 0.03358627110719681, 0.03551981598138809, 0.037453360855579376, 0.03938690945506096, 0.04132045805454254, 0.043254002928733826, 0.04518754780292511, 0.04712109640240669, 0.049054645001888275, 0.05098818987607956, 0.052921734750270844, 0.054855283349752426, 0.05678883194923401, 0.05872237682342529]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 3.0, 6.0, 8.0, 16.0, 5.0, 13.0, 24.0, 20.0, 17.0, 20.0, 33.0, 31.0, 35.0, 38.0, 26.0, 36.0, 31.0, 50.0, 51.0, 34.0, 34.0, 38.0, 43.0, 47.0, 33.0, 42.0, 27.0, 33.0, 22.0, 29.0, 21.0, 30.0, 10.0, 17.0, 12.0, 10.0, 7.0, 9.0, 3.0, 1.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.887451171875, -7.62646484375, -7.365478515625, -7.1044921875, -6.843505859375, -6.58251953125, -6.321533203125, -6.060546875, -5.799560546875, -5.53857421875, -5.277587890625, -5.0166015625, -4.755615234375, -4.49462890625, -4.233642578125, -3.97265625, -3.711669921875, -3.45068359375, -3.189697265625, -2.9287109375, -2.667724609375, -2.40673828125, -2.145751953125, -1.884765625, -1.623779296875, -1.36279296875, -1.101806640625, -0.8408203125, -0.579833984375, -0.31884765625, -0.057861328125, 0.203125, 0.464111328125, 0.72509765625, 0.986083984375, 1.2470703125, 1.508056640625, 1.76904296875, 2.030029296875, 2.291015625, 2.552001953125, 2.81298828125, 3.073974609375, 3.3349609375, 3.595947265625, 3.85693359375, 4.117919921875, 4.37890625, 4.639892578125, 4.90087890625, 5.161865234375, 5.4228515625, 5.683837890625, 5.94482421875, 6.205810546875, 6.466796875, 6.727783203125, 6.98876953125, 7.249755859375, 7.5107421875, 7.771728515625, 8.03271484375, 8.293701171875, 8.5546875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 7.0, 19.0, 18.0, 37.0, 56.0, 67.0, 114.0, 186.0, 290.0, 466.0, 764.0, 1375.0, 2218.0, 3789.0, 6749.0, 12782.0, 25841.0, 52486.0, 114482.0, 253493.0, 299212.0, 142707.0, 65576.0, 31193.0, 15462.0, 8201.0, 4532.0, 2497.0, 1540.0, 906.0, 514.0, 363.0, 204.0, 153.0, 85.0, 64.0, 35.0, 24.0, 14.0, 13.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.111572265625, -7.80126953125, -7.490966796875, -7.1806640625, -6.870361328125, -6.56005859375, -6.249755859375, -5.939453125, -5.629150390625, -5.31884765625, -5.008544921875, -4.6982421875, -4.387939453125, -4.07763671875, -3.767333984375, -3.45703125, -3.146728515625, -2.83642578125, -2.526123046875, -2.2158203125, -1.905517578125, -1.59521484375, -1.284912109375, -0.974609375, -0.664306640625, -0.35400390625, -0.043701171875, 0.2666015625, 0.576904296875, 0.88720703125, 1.197509765625, 1.5078125, 1.818115234375, 2.12841796875, 2.438720703125, 2.7490234375, 3.059326171875, 3.36962890625, 3.679931640625, 3.990234375, 4.300537109375, 4.61083984375, 4.921142578125, 5.2314453125, 5.541748046875, 5.85205078125, 6.162353515625, 6.47265625, 6.782958984375, 7.09326171875, 7.403564453125, 7.7138671875, 8.024169921875, 8.33447265625, 8.644775390625, 8.955078125, 9.265380859375, 9.57568359375, 9.885986328125, 10.1962890625, 10.506591796875, 10.81689453125, 11.127197265625, 11.4375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 13.0, 7.0, 19.0, 20.0, 18.0, 21.0, 30.0, 21.0, 37.0, 32.0, 43.0, 61.0, 66.0, 83.0, 143.0, 296.0, 1403.0, 172.0, 129.0, 78.0, 51.0, 44.0, 44.0, 27.0, 32.0, 23.0, 21.0, 16.0, 10.0, 11.0, 16.0, 12.0, 12.0, 7.0, 8.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.578125, -26.773193359375, -25.96826171875, -25.163330078125, -24.3583984375, -23.553466796875, -22.74853515625, -21.943603515625, -21.138671875, -20.333740234375, -19.52880859375, -18.723876953125, -17.9189453125, -17.114013671875, -16.30908203125, -15.504150390625, -14.69921875, -13.894287109375, -13.08935546875, -12.284423828125, -11.4794921875, -10.674560546875, -9.86962890625, -9.064697265625, -8.259765625, -7.454833984375, -6.64990234375, -5.844970703125, -5.0400390625, -4.235107421875, -3.43017578125, -2.625244140625, -1.8203125, -1.015380859375, -0.21044921875, 0.594482421875, 1.3994140625, 2.204345703125, 3.00927734375, 3.814208984375, 4.619140625, 5.424072265625, 6.22900390625, 7.033935546875, 7.8388671875, 8.643798828125, 9.44873046875, 10.253662109375, 11.05859375, 11.863525390625, 12.66845703125, 13.473388671875, 14.2783203125, 15.083251953125, 15.88818359375, 16.693115234375, 17.498046875, 18.302978515625, 19.10791015625, 19.912841796875, 20.7177734375, 21.522705078125, 22.32763671875, 23.132568359375, 23.9375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 5.0, 10.0, 12.0, 16.0, 25.0, 27.0, 44.0, 81.0, 118.0, 165.0, 227.0, 394.0, 855.0, 3319.0, 25528.0, 583282.0, 2446190.0, 75397.0, 7253.0, 1359.0, 506.0, 309.0, 176.0, 123.0, 75.0, 68.0, 36.0, 23.0, 14.0, 15.0, 13.0, 12.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-40.53125, -39.44189453125, -38.3525390625, -37.26318359375, -36.173828125, -35.08447265625, -33.9951171875, -32.90576171875, -31.81640625, -30.72705078125, -29.6376953125, -28.54833984375, -27.458984375, -26.36962890625, -25.2802734375, -24.19091796875, -23.1015625, -22.01220703125, -20.9228515625, -19.83349609375, -18.744140625, -17.65478515625, -16.5654296875, -15.47607421875, -14.38671875, -13.29736328125, -12.2080078125, -11.11865234375, -10.029296875, -8.93994140625, -7.8505859375, -6.76123046875, -5.671875, -4.58251953125, -3.4931640625, -2.40380859375, -1.314453125, -0.22509765625, 0.8642578125, 1.95361328125, 3.04296875, 4.13232421875, 5.2216796875, 6.31103515625, 7.400390625, 8.48974609375, 9.5791015625, 10.66845703125, 11.7578125, 12.84716796875, 13.9365234375, 15.02587890625, 16.115234375, 17.20458984375, 18.2939453125, 19.38330078125, 20.47265625, 21.56201171875, 22.6513671875, 23.74072265625, 24.830078125, 25.91943359375, 27.0087890625, 28.09814453125, 29.1875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 22.0, 328.0, 585.0, 78.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-393.34136962890625, -385.01788330078125, -376.69439697265625, -368.3708801269531, -360.0473937988281, -351.7239074707031, -343.4004211425781, -335.0769348144531, -326.75341796875, -318.429931640625, -310.1064453125, -301.7829284667969, -293.4594421386719, -285.1359558105469, -276.8124694824219, -268.4889831542969, -260.1654968261719, -251.84201049804688, -243.5185089111328, -235.1950225830078, -226.87152099609375, -218.54803466796875, -210.22454833984375, -201.90106201171875, -193.5775604248047, -185.2540740966797, -176.93057250976562, -168.60708618164062, -160.28359985351562, -151.96009826660156, -143.63661193847656, -135.3131103515625, -126.98965454101562, -118.6661605834961, -110.34266662597656, -102.01918029785156, -93.69568634033203, -85.3721923828125, -77.0487060546875, -68.72521209716797, -60.40171813964844, -52.078224182128906, -43.75473403930664, -35.431243896484375, -27.107749938964844, -18.784255981445312, -10.460765838623047, -2.1372756958007812, 6.18621826171875, 14.509710311889648, 22.833202362060547, 31.156694412231445, 39.480186462402344, 47.803680419921875, 56.12717056274414, 64.4506607055664, 72.77415466308594, 81.09764862060547, 89.421142578125, 97.74462890625, 106.06812286376953, 114.39161682128906, 122.71510314941406, 131.03860473632812, 139.36209106445312]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 5.0, 5.0, 5.0, 11.0, 12.0, 13.0, 10.0, 16.0, 16.0, 30.0, 29.0, 30.0, 25.0, 23.0, 34.0, 32.0, 40.0, 48.0, 34.0, 40.0, 42.0, 47.0, 45.0, 39.0, 37.0, 41.0, 33.0, 27.0, 38.0, 38.0, 27.0, 20.0, 18.0, 16.0, 9.0, 6.0, 10.0, 11.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.95024871826172, -56.25326156616211, -54.5562744140625, -52.85928726196289, -51.16230010986328, -49.46531295776367, -47.76832580566406, -46.07134246826172, -44.374351501464844, -42.677364349365234, -40.980377197265625, -39.283390045166016, -37.586402893066406, -35.8894157409668, -34.19242858886719, -32.495445251464844, -30.798458099365234, -29.101470947265625, -27.404483795166016, -25.707496643066406, -24.010509490966797, -22.313522338867188, -20.61653709411621, -18.9195499420166, -17.222562789916992, -15.525575637817383, -13.828588485717773, -12.13160228729248, -10.434615135192871, -8.737627983093262, -7.040641784667969, -5.343654632568359, -3.6466636657714844, -1.949676752090454, -0.25268983840942383, 1.4442968368530273, 3.1412839889526367, 4.838271141052246, 6.535257339477539, 8.232244491577148, 9.929231643676758, 11.626218795776367, 13.323205947875977, 15.02019214630127, 16.717178344726562, 18.414165496826172, 20.11115264892578, 21.80813980102539, 23.505126953125, 25.20211410522461, 26.89910125732422, 28.596088409423828, 30.293075561523438, 31.990062713623047, 33.687049865722656, 35.384033203125, 37.081024169921875, 38.778011322021484, 40.474998474121094, 42.1719856262207, 43.86897277832031, 45.56595993041992, 47.26294708251953, 48.959930419921875, 50.656917572021484]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 10.0, 12.0, 12.0, 10.0, 12.0, 11.0, 17.0, 18.0, 24.0, 16.0, 33.0, 24.0, 27.0, 35.0, 33.0, 44.0, 28.0, 36.0, 26.0, 31.0, 56.0, 29.0, 37.0, 38.0, 27.0, 51.0, 32.0, 24.0, 17.0, 37.0, 27.0, 15.0, 19.0, 21.0, 18.0, 16.0, 10.0, 10.0, 7.0, 6.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.390625, -7.14453125, -6.8984375, -6.65234375, -6.40625, -6.16015625, -5.9140625, -5.66796875, -5.421875, -5.17578125, -4.9296875, -4.68359375, -4.4375, -4.19140625, -3.9453125, -3.69921875, -3.453125, -3.20703125, -2.9609375, -2.71484375, -2.46875, -2.22265625, -1.9765625, -1.73046875, -1.484375, -1.23828125, -0.9921875, -0.74609375, -0.5, -0.25390625, -0.0078125, 0.23828125, 0.484375, 0.73046875, 0.9765625, 1.22265625, 1.46875, 1.71484375, 1.9609375, 2.20703125, 2.453125, 2.69921875, 2.9453125, 3.19140625, 3.4375, 3.68359375, 3.9296875, 4.17578125, 4.421875, 4.66796875, 4.9140625, 5.16015625, 5.40625, 5.65234375, 5.8984375, 6.14453125, 6.390625, 6.63671875, 6.8828125, 7.12890625, 7.375, 7.62109375, 7.8671875, 8.11328125, 8.359375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 5.0, 15.0, 8.0, 13.0, 12.0, 17.0, 13.0, 24.0, 27.0, 41.0, 36.0, 43.0, 72.0, 88.0, 208.0, 468.0, 2582.0, 32156.0, 764173.0, 3097181.0, 281387.0, 13393.0, 1429.0, 314.0, 142.0, 86.0, 70.0, 56.0, 44.0, 34.0, 21.0, 10.0, 15.0, 24.0, 11.0, 14.0, 14.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.125, -30.21875, -29.3125, -28.40625, -27.5, -26.59375, -25.6875, -24.78125, -23.875, -22.96875, -22.0625, -21.15625, -20.25, -19.34375, -18.4375, -17.53125, -16.625, -15.71875, -14.8125, -13.90625, -13.0, -12.09375, -11.1875, -10.28125, -9.375, -8.46875, -7.5625, -6.65625, -5.75, -4.84375, -3.9375, -3.03125, -2.125, -1.21875, -0.3125, 0.59375, 1.5, 2.40625, 3.3125, 4.21875, 5.125, 6.03125, 6.9375, 7.84375, 8.75, 9.65625, 10.5625, 11.46875, 12.375, 13.28125, 14.1875, 15.09375, 16.0, 16.90625, 17.8125, 18.71875, 19.625, 20.53125, 21.4375, 22.34375, 23.25, 24.15625, 25.0625, 25.96875, 26.875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 15.0, 5.0, 17.0, 26.0, 32.0, 37.0, 45.0, 72.0, 82.0, 125.0, 168.0, 220.0, 272.0, 360.0, 395.0, 394.0, 370.0, 298.0, 277.0, 228.0, 137.0, 125.0, 92.0, 81.0, 40.0, 50.0, 27.0, 14.0, 21.0, 9.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.1920166015625, -8.829345703125, -8.4666748046875, -8.10400390625, -7.7413330078125, -7.378662109375, -7.0159912109375, -6.6533203125, -6.2906494140625, -5.927978515625, -5.5653076171875, -5.20263671875, -4.8399658203125, -4.477294921875, -4.1146240234375, -3.751953125, -3.3892822265625, -3.026611328125, -2.6639404296875, -2.30126953125, -1.9385986328125, -1.575927734375, -1.2132568359375, -0.8505859375, -0.4879150390625, -0.125244140625, 0.2374267578125, 0.60009765625, 0.9627685546875, 1.325439453125, 1.6881103515625, 2.05078125, 2.4134521484375, 2.776123046875, 3.1387939453125, 3.50146484375, 3.8641357421875, 4.226806640625, 4.5894775390625, 4.9521484375, 5.3148193359375, 5.677490234375, 6.0401611328125, 6.40283203125, 6.7655029296875, 7.128173828125, 7.4908447265625, 7.853515625, 8.2161865234375, 8.578857421875, 8.9415283203125, 9.30419921875, 9.6668701171875, 10.029541015625, 10.3922119140625, 10.7548828125, 11.1175537109375, 11.480224609375, 11.8428955078125, 12.20556640625, 12.5682373046875, 12.930908203125, 13.2935791015625, 13.65625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 7.0, 6.0, 13.0, 13.0, 21.0, 19.0, 26.0, 55.0, 70.0, 103.0, 138.0, 252.0, 535.0, 1682.0, 8979.0, 76707.0, 978910.0, 2781811.0, 309759.0, 29009.0, 4127.0, 1032.0, 401.0, 216.0, 140.0, 69.0, 54.0, 30.0, 22.0, 12.0, 11.0, 12.0, 5.0, 5.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -27.173828125, -26.33203125, -25.490234375, -24.6484375, -23.806640625, -22.96484375, -22.123046875, -21.28125, -20.439453125, -19.59765625, -18.755859375, -17.9140625, -17.072265625, -16.23046875, -15.388671875, -14.546875, -13.705078125, -12.86328125, -12.021484375, -11.1796875, -10.337890625, -9.49609375, -8.654296875, -7.8125, -6.970703125, -6.12890625, -5.287109375, -4.4453125, -3.603515625, -2.76171875, -1.919921875, -1.078125, -0.236328125, 0.60546875, 1.447265625, 2.2890625, 3.130859375, 3.97265625, 4.814453125, 5.65625, 6.498046875, 7.33984375, 8.181640625, 9.0234375, 9.865234375, 10.70703125, 11.548828125, 12.390625, 13.232421875, 14.07421875, 14.916015625, 15.7578125, 16.599609375, 17.44140625, 18.283203125, 19.125, 19.966796875, 20.80859375, 21.650390625, 22.4921875, 23.333984375, 24.17578125, 25.017578125, 25.859375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 54.0, 258.0, 419.0, 219.0, 53.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-324.8886413574219, -318.44683837890625, -312.0050354003906, -305.563232421875, -299.1214294433594, -292.67962646484375, -286.2378234863281, -279.7960205078125, -273.354248046875, -266.9124450683594, -260.47064208984375, -254.02883911132812, -247.5870361328125, -241.14523315429688, -234.7034454345703, -228.2616424560547, -221.81982421875, -215.37802124023438, -208.93621826171875, -202.49441528320312, -196.0526123046875, -189.61080932617188, -183.1690216064453, -176.7272186279297, -170.28541564941406, -163.84361267089844, -157.4018096923828, -150.9600067138672, -144.51821899414062, -138.076416015625, -131.63461303710938, -125.19281005859375, -118.75100708007812, -112.3092041015625, -105.86740112304688, -99.42560577392578, -92.98380279541016, -86.54199981689453, -80.10020446777344, -73.65840148925781, -67.21659851074219, -60.77479553222656, -54.3329963684082, -47.891197204589844, -41.44939422607422, -35.007591247558594, -28.565792083740234, -22.123992919921875, -15.68218994140625, -9.240388870239258, -2.7985877990722656, 3.6432132720947266, 10.085014343261719, 16.526817321777344, 22.968616485595703, 29.410415649414062, 35.85221862792969, 42.29402160644531, 48.73582077026367, 55.17761993408203, 61.619422912597656, 68.06122589111328, 74.50302124023438, 80.94482421875, 87.38662719726562]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 16.0, 15.0, 17.0, 11.0, 13.0, 19.0, 22.0, 22.0, 25.0, 26.0, 31.0, 34.0, 30.0, 46.0, 40.0, 37.0, 38.0, 38.0, 40.0, 25.0, 46.0, 40.0, 34.0, 35.0, 36.0, 34.0, 32.0, 23.0, 25.0, 16.0, 13.0, 14.0, 10.0, 22.0, 10.0, 11.0, 9.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-39.89580535888672, -38.642818450927734, -37.389827728271484, -36.1368408203125, -34.883853912353516, -33.630863189697266, -32.37787628173828, -31.124887466430664, -29.871898651123047, -28.61890983581543, -27.365922927856445, -26.112934112548828, -24.85994529724121, -23.606956481933594, -22.35396957397461, -21.100980758666992, -19.847993850708008, -18.59500503540039, -17.342018127441406, -16.08902931213379, -14.836040496826172, -13.583052635192871, -12.33006477355957, -11.077075958251953, -9.824088096618652, -8.571100234985352, -7.318111419677734, -6.065123558044434, -4.812135219573975, -3.5591468811035156, -2.306159019470215, -1.0531702041625977, 0.19981765747070312, 1.4528058767318726, 2.705794095993042, 3.958782196044922, 5.211770534515381, 6.46475887298584, 7.717746734619141, 8.970735549926758, 10.223723411560059, 11.47671127319336, 12.729700088500977, 13.982687950134277, 15.235675811767578, 16.488664627075195, 17.741653442382812, 18.994640350341797, 20.247629165649414, 21.50061798095703, 22.753604888916016, 24.006593704223633, 25.25958251953125, 26.512569427490234, 27.76555824279785, 29.01854705810547, 30.271533966064453, 31.52452278137207, 32.77751159667969, 34.03049850463867, 35.283485412597656, 36.536476135253906, 37.78946304321289, 39.042449951171875, 40.295440673828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 10.0, 12.0, 16.0, 12.0, 11.0, 20.0, 18.0, 24.0, 24.0, 29.0, 28.0, 35.0, 40.0, 35.0, 33.0, 40.0, 42.0, 34.0, 41.0, 44.0, 44.0, 35.0, 39.0, 27.0, 34.0, 27.0, 30.0, 34.0, 23.0, 24.0, 18.0, 20.0, 14.0, 12.0, 10.0, 14.0, 12.0, 9.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.4453125, -9.1783447265625, -8.911376953125, -8.6444091796875, -8.37744140625, -8.1104736328125, -7.843505859375, -7.5765380859375, -7.3095703125, -7.0426025390625, -6.775634765625, -6.5086669921875, -6.24169921875, -5.9747314453125, -5.707763671875, -5.4407958984375, -5.173828125, -4.9068603515625, -4.639892578125, -4.3729248046875, -4.10595703125, -3.8389892578125, -3.572021484375, -3.3050537109375, -3.0380859375, -2.7711181640625, -2.504150390625, -2.2371826171875, -1.97021484375, -1.7032470703125, -1.436279296875, -1.1693115234375, -0.90234375, -0.6353759765625, -0.368408203125, -0.1014404296875, 0.16552734375, 0.4324951171875, 0.699462890625, 0.9664306640625, 1.2333984375, 1.5003662109375, 1.767333984375, 2.0343017578125, 2.30126953125, 2.5682373046875, 2.835205078125, 3.1021728515625, 3.369140625, 3.6361083984375, 3.903076171875, 4.1700439453125, 4.43701171875, 4.7039794921875, 4.970947265625, 5.2379150390625, 5.5048828125, 5.7718505859375, 6.038818359375, 6.3057861328125, 6.57275390625, 6.8397216796875, 7.106689453125, 7.3736572265625, 7.640625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 17.0, 20.0, 29.0, 36.0, 58.0, 100.0, 166.0, 284.0, 467.0, 736.0, 1158.0, 1928.0, 2984.0, 4775.0, 7395.0, 11721.0, 17831.0, 27083.0, 39535.0, 56679.0, 76825.0, 98680.0, 116577.0, 123408.0, 115816.0, 97666.0, 75894.0, 56155.0, 39184.0, 26384.0, 17332.0, 11474.0, 7401.0, 4758.0, 3014.0, 1929.0, 1192.0, 740.0, 436.0, 288.0, 146.0, 96.0, 61.0, 38.0, 21.0, 15.0, 7.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.974853515625, -0.94287109375, -0.910888671875, -0.87890625, -0.846923828125, -0.81494140625, -0.782958984375, -0.7509765625, -0.718994140625, -0.68701171875, -0.655029296875, -0.623046875, -0.591064453125, -0.55908203125, -0.527099609375, -0.4951171875, -0.463134765625, -0.43115234375, -0.399169921875, -0.3671875, -0.335205078125, -0.30322265625, -0.271240234375, -0.2392578125, -0.207275390625, -0.17529296875, -0.143310546875, -0.111328125, -0.079345703125, -0.04736328125, -0.015380859375, 0.0166015625, 0.048583984375, 0.08056640625, 0.112548828125, 0.14453125, 0.176513671875, 0.20849609375, 0.240478515625, 0.2724609375, 0.304443359375, 0.33642578125, 0.368408203125, 0.400390625, 0.432373046875, 0.46435546875, 0.496337890625, 0.5283203125, 0.560302734375, 0.59228515625, 0.624267578125, 0.65625, 0.688232421875, 0.72021484375, 0.752197265625, 0.7841796875, 0.816162109375, 0.84814453125, 0.880126953125, 0.912109375, 0.944091796875, 0.97607421875, 1.008056640625, 1.0400390625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 14.0, 5.0, 3.0, 9.0, 10.0, 10.0, 15.0, 16.0, 24.0, 21.0, 27.0, 30.0, 31.0, 48.0, 39.0, 44.0, 42.0, 41.0, 1063.0, 49.0, 44.0, 48.0, 45.0, 51.0, 56.0, 39.0, 38.0, 25.0, 22.0, 17.0, 22.0, 10.0, 20.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.60223388671875, -5.3997802734375, -5.19732666015625, -4.994873046875, -4.79241943359375, -4.5899658203125, -4.38751220703125, -4.18505859375, -3.98260498046875, -3.7801513671875, -3.57769775390625, -3.375244140625, -3.17279052734375, -2.9703369140625, -2.76788330078125, -2.5654296875, -2.36297607421875, -2.1605224609375, -1.95806884765625, -1.755615234375, -1.55316162109375, -1.3507080078125, -1.14825439453125, -0.94580078125, -0.74334716796875, -0.5408935546875, -0.33843994140625, -0.135986328125, 0.06646728515625, 0.2689208984375, 0.47137451171875, 0.673828125, 0.87628173828125, 1.0787353515625, 1.28118896484375, 1.483642578125, 1.68609619140625, 1.8885498046875, 2.09100341796875, 2.29345703125, 2.49591064453125, 2.6983642578125, 2.90081787109375, 3.103271484375, 3.30572509765625, 3.5081787109375, 3.71063232421875, 3.9130859375, 4.11553955078125, 4.3179931640625, 4.52044677734375, 4.722900390625, 4.92535400390625, 5.1278076171875, 5.33026123046875, 5.53271484375, 5.73516845703125, 5.9376220703125, 6.14007568359375, 6.342529296875, 6.54498291015625, 6.7474365234375, 6.94989013671875, 7.15234375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 13.0, 23.0, 25.0, 42.0, 42.0, 84.0, 123.0, 169.0, 234.0, 369.0, 543.0, 790.0, 1088.0, 1655.0, 2316.0, 3465.0, 5065.0, 7307.0, 10397.0, 14877.0, 21817.0, 32655.0, 1847367.0, 60603.0, 26683.0, 18462.0, 12595.0, 8842.0, 5986.0, 4200.0, 2892.0, 2014.0, 1388.0, 951.0, 679.0, 446.0, 285.0, 212.0, 128.0, 109.0, 57.0, 48.0, 31.0, 14.0, 13.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7216796875, -1.6638336181640625, -1.605987548828125, -1.5481414794921875, -1.49029541015625, -1.4324493408203125, -1.374603271484375, -1.3167572021484375, -1.2589111328125, -1.2010650634765625, -1.143218994140625, -1.0853729248046875, -1.02752685546875, -0.9696807861328125, -0.911834716796875, -0.8539886474609375, -0.796142578125, -0.7382965087890625, -0.680450439453125, -0.6226043701171875, -0.56475830078125, -0.5069122314453125, -0.449066162109375, -0.3912200927734375, -0.3333740234375, -0.2755279541015625, -0.217681884765625, -0.1598358154296875, -0.10198974609375, -0.0441436767578125, 0.013702392578125, 0.0715484619140625, 0.12939453125, 0.1872406005859375, 0.245086669921875, 0.3029327392578125, 0.36077880859375, 0.4186248779296875, 0.476470947265625, 0.5343170166015625, 0.5921630859375, 0.6500091552734375, 0.707855224609375, 0.7657012939453125, 0.82354736328125, 0.8813934326171875, 0.939239501953125, 0.9970855712890625, 1.054931640625, 1.1127777099609375, 1.170623779296875, 1.2284698486328125, 1.28631591796875, 1.3441619873046875, 1.402008056640625, 1.4598541259765625, 1.5177001953125, 1.5755462646484375, 1.633392333984375, 1.6912384033203125, 1.74908447265625, 1.8069305419921875, 1.864776611328125, 1.9226226806640625, 1.98046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 3.0, 8.0, 14.0, 9.0, 15.0, 22.0, 15.0, 36.0, 37.0, 60.0, 64.0, 103.0, 81.0, 79.0, 91.0, 77.0, 70.0, 52.0, 35.0, 34.0, 23.0, 13.0, 10.0, 10.0, 11.0, 3.0, 10.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.037933349609375, -0.03672075271606445, -0.035508155822753906, -0.03429555892944336, -0.03308296203613281, -0.031870365142822266, -0.03065776824951172, -0.029445171356201172, -0.028232574462890625, -0.027019977569580078, -0.02580738067626953, -0.024594783782958984, -0.023382186889648438, -0.02216958999633789, -0.020956993103027344, -0.019744396209716797, -0.01853179931640625, -0.017319202423095703, -0.016106605529785156, -0.01489400863647461, -0.013681411743164062, -0.012468814849853516, -0.011256217956542969, -0.010043621063232422, -0.008831024169921875, -0.007618427276611328, -0.006405830383300781, -0.005193233489990234, -0.0039806365966796875, -0.0027680397033691406, -0.0015554428100585938, -0.0003428459167480469, 0.0008697509765625, 0.002082347869873047, 0.0032949447631835938, 0.004507541656494141, 0.0057201385498046875, 0.006932735443115234, 0.008145332336425781, 0.009357929229736328, 0.010570526123046875, 0.011783123016357422, 0.012995719909667969, 0.014208316802978516, 0.015420913696289062, 0.01663351058959961, 0.017846107482910156, 0.019058704376220703, 0.02027130126953125, 0.021483898162841797, 0.022696495056152344, 0.02390909194946289, 0.025121688842773438, 0.026334285736083984, 0.02754688262939453, 0.028759479522705078, 0.029972076416015625, 0.031184673309326172, 0.03239727020263672, 0.033609867095947266, 0.03482246398925781, 0.03603506088256836, 0.037247657775878906, 0.03846025466918945, 0.0396728515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 14.0, 11.0, 12.0, 27.0, 25.0, 33.0, 61.0, 94.0, 140.0, 219.0, 381.0, 1121.0, 107359.0, 934974.0, 2777.0, 502.0, 293.0, 151.0, 98.0, 56.0, 45.0, 35.0, 18.0, 20.0, 18.0, 12.0, 8.0, 8.0, 6.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74755859375, -0.7250289916992188, -0.7024993896484375, -0.6799697875976562, -0.657440185546875, -0.6349105834960938, -0.6123809814453125, -0.5898513793945312, -0.56732177734375, -0.5447921752929688, -0.5222625732421875, -0.49973297119140625, -0.477203369140625, -0.45467376708984375, -0.4321441650390625, -0.40961456298828125, -0.3870849609375, -0.36455535888671875, -0.3420257568359375, -0.31949615478515625, -0.296966552734375, -0.27443695068359375, -0.2519073486328125, -0.22937774658203125, -0.20684814453125, -0.18431854248046875, -0.1617889404296875, -0.13925933837890625, -0.116729736328125, -0.09420013427734375, -0.0716705322265625, -0.04914093017578125, -0.026611328125, -0.00408172607421875, 0.0184478759765625, 0.04097747802734375, 0.063507080078125, 0.08603668212890625, 0.1085662841796875, 0.13109588623046875, 0.15362548828125, 0.17615509033203125, 0.1986846923828125, 0.22121429443359375, 0.243743896484375, 0.26627349853515625, 0.2888031005859375, 0.31133270263671875, 0.3338623046875, 0.35639190673828125, 0.3789215087890625, 0.40145111083984375, 0.423980712890625, 0.44651031494140625, 0.4690399169921875, 0.49156951904296875, 0.51409912109375, 0.5366287231445312, 0.5591583251953125, 0.5816879272460938, 0.604217529296875, 0.6267471313476562, 0.6492767333984375, 0.6718063354492188, 0.6943359375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 78.0, 597.0, 303.0, 26.0, 4.0], "bins": [-0.684520423412323, -0.6732665300369263, -0.6620125770568848, -0.650758683681488, -0.6395047903060913, -0.6282508373260498, -0.6169969439506531, -0.6057430505752563, -0.5944890975952148, -0.5832352042198181, -0.5719812512397766, -0.5607273578643799, -0.5494734644889832, -0.5382195115089417, -0.5269656181335449, -0.5157117247581482, -0.5044578313827515, -0.49320390820503235, -0.4819500148296356, -0.4706960916519165, -0.4594421684741974, -0.44818827509880066, -0.43693435192108154, -0.4256804585456848, -0.4144265055656433, -0.4031725823879242, -0.39191868901252747, -0.38066476583480835, -0.36941084265708923, -0.3581569492816925, -0.3469030261039734, -0.33564913272857666, -0.32439517974853516, -0.31314125657081604, -0.3018873631954193, -0.2906334400177002, -0.2793795168399811, -0.26812562346458435, -0.25687170028686523, -0.2456177920103073, -0.2343638837337494, -0.22310997545719147, -0.21185605227947235, -0.20060214400291443, -0.1893482357263565, -0.17809432744979858, -0.16684040427207947, -0.15558649599552155, -0.14433258771896362, -0.1330786794424057, -0.12182476371526718, -0.11057084798812866, -0.09931693971157074, -0.08806302398443222, -0.0768091082572937, -0.06555519998073578, -0.05430128052830696, -0.04304736852645874, -0.03179345279932022, -0.020539540797472, -0.00928562879562378, 0.0019682832062244415, 0.01322219893336296, 0.024476107209920883, 0.0357300229370594]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 5.0, 5.0, 10.0, 9.0, 8.0, 14.0, 23.0, 14.0, 12.0, 24.0, 23.0, 26.0, 36.0, 28.0, 30.0, 30.0, 42.0, 50.0, 49.0, 42.0, 51.0, 41.0, 41.0, 50.0, 24.0, 46.0, 41.0, 33.0, 23.0, 24.0, 17.0, 19.0, 18.0, 16.0, 14.0, 12.0, 11.0, 7.0, 4.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03651696443557739, -0.03536229580640793, -0.034207627177238464, -0.0330529548227787, -0.03189828619360924, -0.030743617564439774, -0.02958894707262516, -0.028434276580810547, -0.027279607951641083, -0.02612493932247162, -0.024970268830657005, -0.023815598338842392, -0.022660929709672928, -0.021506261080503464, -0.02035159058868885, -0.019196920096874237, -0.018042251467704773, -0.01688758283853531, -0.015732912346720695, -0.014578242786228657, -0.013423573225736618, -0.01226890366524458, -0.01111423410475254, -0.009959564544260502, -0.008804894983768463, -0.007650225423276424, -0.006495555862784386, -0.005340886302292347, -0.004186216741800308, -0.0030315471813082695, -0.0018768776208162308, -0.000722208060324192, 0.0004324615001678467, 0.0015871310606598854, 0.002741800621151924, 0.003896470181643963, 0.005051139742136002, 0.00620580930262804, 0.007360478863120079, 0.008515148423612118, 0.009669817984104156, 0.010824487544596195, 0.011979157105088234, 0.013133826665580273, 0.014288496226072311, 0.01544316578656435, 0.01659783534705639, 0.017752505838871002, 0.018907174468040466, 0.02006184309720993, 0.021216513589024544, 0.022371184080839157, 0.02352585271000862, 0.024680521339178085, 0.0258351918309927, 0.026989862322807312, 0.028144530951976776, 0.02929919958114624, 0.030453870072960854, 0.03160854056477547, 0.03276320919394493, 0.033917877823114395, 0.03507255017757416, 0.03622721880674362, 0.037381887435913086]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 9.0, 6.0, 7.0, 17.0, 13.0, 14.0, 18.0, 18.0, 18.0, 18.0, 23.0, 29.0, 32.0, 43.0, 35.0, 42.0, 37.0, 31.0, 33.0, 34.0, 49.0, 29.0, 38.0, 32.0, 32.0, 30.0, 30.0, 32.0, 15.0, 26.0, 31.0, 24.0, 21.0, 19.0, 19.0, 15.0, 10.0, 13.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-8.1953125, -7.948974609375, -7.70263671875, -7.456298828125, -7.2099609375, -6.963623046875, -6.71728515625, -6.470947265625, -6.224609375, -5.978271484375, -5.73193359375, -5.485595703125, -5.2392578125, -4.992919921875, -4.74658203125, -4.500244140625, -4.25390625, -4.007568359375, -3.76123046875, -3.514892578125, -3.2685546875, -3.022216796875, -2.77587890625, -2.529541015625, -2.283203125, -2.036865234375, -1.79052734375, -1.544189453125, -1.2978515625, -1.051513671875, -0.80517578125, -0.558837890625, -0.3125, -0.066162109375, 0.18017578125, 0.426513671875, 0.6728515625, 0.919189453125, 1.16552734375, 1.411865234375, 1.658203125, 1.904541015625, 2.15087890625, 2.397216796875, 2.6435546875, 2.889892578125, 3.13623046875, 3.382568359375, 3.62890625, 3.875244140625, 4.12158203125, 4.367919921875, 4.6142578125, 4.860595703125, 5.10693359375, 5.353271484375, 5.599609375, 5.845947265625, 6.09228515625, 6.338623046875, 6.5849609375, 6.831298828125, 7.07763671875, 7.323974609375, 7.5703125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 8.0, 5.0, 6.0, 7.0, 18.0, 20.0, 27.0, 47.0, 75.0, 104.0, 165.0, 298.0, 564.0, 1154.0, 2215.0, 4765.0, 11015.0, 26082.0, 64075.0, 168789.0, 362265.0, 247989.0, 93139.0, 37257.0, 15544.0, 6680.0, 3102.0, 1384.0, 756.0, 390.0, 233.0, 134.0, 75.0, 44.0, 35.0, 28.0, 16.0, 13.0, 13.0, 8.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.794189453125, -12.37744140625, -11.960693359375, -11.5439453125, -11.127197265625, -10.71044921875, -10.293701171875, -9.876953125, -9.460205078125, -9.04345703125, -8.626708984375, -8.2099609375, -7.793212890625, -7.37646484375, -6.959716796875, -6.54296875, -6.126220703125, -5.70947265625, -5.292724609375, -4.8759765625, -4.459228515625, -4.04248046875, -3.625732421875, -3.208984375, -2.792236328125, -2.37548828125, -1.958740234375, -1.5419921875, -1.125244140625, -0.70849609375, -0.291748046875, 0.125, 0.541748046875, 0.95849609375, 1.375244140625, 1.7919921875, 2.208740234375, 2.62548828125, 3.042236328125, 3.458984375, 3.875732421875, 4.29248046875, 4.709228515625, 5.1259765625, 5.542724609375, 5.95947265625, 6.376220703125, 6.79296875, 7.209716796875, 7.62646484375, 8.043212890625, 8.4599609375, 8.876708984375, 9.29345703125, 9.710205078125, 10.126953125, 10.543701171875, 10.96044921875, 11.377197265625, 11.7939453125, 12.210693359375, 12.62744140625, 13.044189453125, 13.4609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 8.0, 17.0, 10.0, 11.0, 19.0, 24.0, 26.0, 24.0, 44.0, 38.0, 55.0, 64.0, 91.0, 109.0, 178.0, 1323.0, 262.0, 177.0, 118.0, 74.0, 54.0, 50.0, 40.0, 48.0, 33.0, 33.0, 18.0, 21.0, 17.0, 12.0, 10.0, 3.0, 4.0, 8.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.34375, -24.595458984375, -23.84716796875, -23.098876953125, -22.3505859375, -21.602294921875, -20.85400390625, -20.105712890625, -19.357421875, -18.609130859375, -17.86083984375, -17.112548828125, -16.3642578125, -15.615966796875, -14.86767578125, -14.119384765625, -13.37109375, -12.622802734375, -11.87451171875, -11.126220703125, -10.3779296875, -9.629638671875, -8.88134765625, -8.133056640625, -7.384765625, -6.636474609375, -5.88818359375, -5.139892578125, -4.3916015625, -3.643310546875, -2.89501953125, -2.146728515625, -1.3984375, -0.650146484375, 0.09814453125, 0.846435546875, 1.5947265625, 2.343017578125, 3.09130859375, 3.839599609375, 4.587890625, 5.336181640625, 6.08447265625, 6.832763671875, 7.5810546875, 8.329345703125, 9.07763671875, 9.825927734375, 10.57421875, 11.322509765625, 12.07080078125, 12.819091796875, 13.5673828125, 14.315673828125, 15.06396484375, 15.812255859375, 16.560546875, 17.308837890625, 18.05712890625, 18.805419921875, 19.5537109375, 20.302001953125, 21.05029296875, 21.798583984375, 22.546875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 11.0, 11.0, 20.0, 26.0, 20.0, 27.0, 52.0, 71.0, 91.0, 143.0, 229.0, 335.0, 578.0, 1308.0, 7328.0, 134574.0, 2812635.0, 176573.0, 8705.0, 1341.0, 563.0, 339.0, 224.0, 145.0, 121.0, 62.0, 44.0, 33.0, 26.0, 23.0, 11.0, 6.0, 3.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.625, -40.3837890625, -39.142578125, -37.9013671875, -36.66015625, -35.4189453125, -34.177734375, -32.9365234375, -31.6953125, -30.4541015625, -29.212890625, -27.9716796875, -26.73046875, -25.4892578125, -24.248046875, -23.0068359375, -21.765625, -20.5244140625, -19.283203125, -18.0419921875, -16.80078125, -15.5595703125, -14.318359375, -13.0771484375, -11.8359375, -10.5947265625, -9.353515625, -8.1123046875, -6.87109375, -5.6298828125, -4.388671875, -3.1474609375, -1.90625, -0.6650390625, 0.576171875, 1.8173828125, 3.05859375, 4.2998046875, 5.541015625, 6.7822265625, 8.0234375, 9.2646484375, 10.505859375, 11.7470703125, 12.98828125, 14.2294921875, 15.470703125, 16.7119140625, 17.953125, 19.1943359375, 20.435546875, 21.6767578125, 22.91796875, 24.1591796875, 25.400390625, 26.6416015625, 27.8828125, 29.1240234375, 30.365234375, 31.6064453125, 32.84765625, 34.0888671875, 35.330078125, 36.5712890625, 37.8125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 149.0, 694.0, 163.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.33709716796875, -451.2255859375, -442.11407470703125, -433.0025634765625, -423.89105224609375, -414.779541015625, -405.66802978515625, -396.5565490722656, -387.4450378417969, -378.3335266113281, -369.2220153808594, -360.1105041503906, -350.9989929199219, -341.88751220703125, -332.7760009765625, -323.66448974609375, -314.552978515625, -305.44146728515625, -296.3299560546875, -287.21844482421875, -278.10693359375, -268.99542236328125, -259.8839111328125, -250.7724151611328, -241.660888671875, -232.54937744140625, -223.4378662109375, -214.32635498046875, -205.21485900878906, -196.1033477783203, -186.99183654785156, -177.8803253173828, -168.768798828125, -159.65728759765625, -150.5457763671875, -141.43426513671875, -132.32276916503906, -123.21125793457031, -114.09974670410156, -104.98823547363281, -95.87673950195312, -86.76522827148438, -77.65372467041016, -68.5422134399414, -59.43070602416992, -50.31919860839844, -41.20768737792969, -32.0961799621582, -22.98467254638672, -13.873164176940918, -4.761655807495117, 4.349853515625, 13.461360931396484, 22.57286834716797, 31.68437957763672, 40.7958869934082, 49.90739440917969, 59.01890182495117, 68.13040924072266, 77.2419204711914, 86.35342407226562, 95.46493530273438, 104.57644653320312, 113.68795776367188, 122.7994613647461]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 11.0, 5.0, 16.0, 12.0, 16.0, 22.0, 19.0, 16.0, 19.0, 20.0, 22.0, 35.0, 34.0, 38.0, 34.0, 41.0, 33.0, 32.0, 26.0, 43.0, 38.0, 41.0, 21.0, 49.0, 32.0, 34.0, 34.0, 34.0, 26.0, 17.0, 29.0, 26.0, 23.0, 9.0, 13.0, 10.0, 6.0, 11.0, 4.0, 5.0, 9.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-46.05925750732422, -44.5831413269043, -43.10702133178711, -41.63090515136719, -40.15478515625, -38.67866897583008, -37.202552795410156, -35.72643280029297, -34.25031280517578, -32.77419662475586, -31.298076629638672, -29.82196044921875, -28.345840454101562, -26.86972427368164, -25.393606185913086, -23.91748809814453, -22.44137191772461, -20.965253829956055, -19.4891357421875, -18.013019561767578, -16.53689956665039, -15.060782432556152, -13.584665298461914, -12.10854721069336, -10.632429122924805, -9.15631103515625, -7.6801934242248535, -6.204075813293457, -4.727957725524902, -3.2518396377563477, -1.7757225036621094, -0.2996044158935547, 1.176513671875, 2.6526315212249756, 4.128749370574951, 5.604866981506348, 7.080985069274902, 8.557103157043457, 10.033220291137695, 11.50933837890625, 12.985456466674805, 14.46157455444336, 15.937692642211914, 17.41381072998047, 18.88992691040039, 20.366046905517578, 21.8421630859375, 23.318281173706055, 24.79439926147461, 26.270517349243164, 27.74663543701172, 29.22275161743164, 30.698871612548828, 32.17498779296875, 33.65110778808594, 35.12722396850586, 36.60334014892578, 38.0794563293457, 39.55557632446289, 41.03169250488281, 42.5078125, 43.98392868041992, 45.460044860839844, 46.93616485595703, 48.41228485107422]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 1.0, 5.0, 6.0, 4.0, 3.0, 10.0, 7.0, 11.0, 26.0, 21.0, 22.0, 20.0, 36.0, 29.0, 24.0, 43.0, 37.0, 42.0, 30.0, 44.0, 44.0, 34.0, 47.0, 44.0, 30.0, 46.0, 42.0, 50.0, 27.0, 27.0, 21.0, 25.0, 23.0, 27.0, 15.0, 19.0, 8.0, 14.0, 12.0, 2.0, 12.0, 3.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.1807861328125, -8.900634765625, -8.6204833984375, -8.34033203125, -8.0601806640625, -7.780029296875, -7.4998779296875, -7.2197265625, -6.9395751953125, -6.659423828125, -6.3792724609375, -6.09912109375, -5.8189697265625, -5.538818359375, -5.2586669921875, -4.978515625, -4.6983642578125, -4.418212890625, -4.1380615234375, -3.85791015625, -3.5777587890625, -3.297607421875, -3.0174560546875, -2.7373046875, -2.4571533203125, -2.177001953125, -1.8968505859375, -1.61669921875, -1.3365478515625, -1.056396484375, -0.7762451171875, -0.49609375, -0.2159423828125, 0.064208984375, 0.3443603515625, 0.62451171875, 0.9046630859375, 1.184814453125, 1.4649658203125, 1.7451171875, 2.0252685546875, 2.305419921875, 2.5855712890625, 2.86572265625, 3.1458740234375, 3.426025390625, 3.7061767578125, 3.986328125, 4.2664794921875, 4.546630859375, 4.8267822265625, 5.10693359375, 5.3870849609375, 5.667236328125, 5.9473876953125, 6.2275390625, 6.5076904296875, 6.787841796875, 7.0679931640625, 7.34814453125, 7.6282958984375, 7.908447265625, 8.1885986328125, 8.46875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 11.0, 20.0, 22.0, 18.0, 33.0, 34.0, 54.0, 63.0, 78.0, 124.0, 185.0, 213.0, 307.0, 446.0, 1871.0, 1308914.0, 2877137.0, 2967.0, 491.0, 334.0, 257.0, 181.0, 107.0, 82.0, 72.0, 52.0, 29.0, 30.0, 20.0, 21.0, 22.0, 19.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0], "bins": [-90.125, -87.693359375, -85.26171875, -82.830078125, -80.3984375, -77.966796875, -75.53515625, -73.103515625, -70.671875, -68.240234375, -65.80859375, -63.376953125, -60.9453125, -58.513671875, -56.08203125, -53.650390625, -51.21875, -48.787109375, -46.35546875, -43.923828125, -41.4921875, -39.060546875, -36.62890625, -34.197265625, -31.765625, -29.333984375, -26.90234375, -24.470703125, -22.0390625, -19.607421875, -17.17578125, -14.744140625, -12.3125, -9.880859375, -7.44921875, -5.017578125, -2.5859375, -0.154296875, 2.27734375, 4.708984375, 7.140625, 9.572265625, 12.00390625, 14.435546875, 16.8671875, 19.298828125, 21.73046875, 24.162109375, 26.59375, 29.025390625, 31.45703125, 33.888671875, 36.3203125, 38.751953125, 41.18359375, 43.615234375, 46.046875, 48.478515625, 50.91015625, 53.341796875, 55.7734375, 58.205078125, 60.63671875, 63.068359375, 65.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 10.0, 13.0, 9.0, 15.0, 22.0, 33.0, 46.0, 45.0, 60.0, 113.0, 125.0, 180.0, 265.0, 349.0, 444.0, 459.0, 437.0, 374.0, 274.0, 197.0, 159.0, 117.0, 67.0, 50.0, 36.0, 37.0, 40.0, 16.0, 19.0, 17.0, 12.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.59375, -10.2237548828125, -9.853759765625, -9.4837646484375, -9.11376953125, -8.7437744140625, -8.373779296875, -8.0037841796875, -7.6337890625, -7.2637939453125, -6.893798828125, -6.5238037109375, -6.15380859375, -5.7838134765625, -5.413818359375, -5.0438232421875, -4.673828125, -4.3038330078125, -3.933837890625, -3.5638427734375, -3.19384765625, -2.8238525390625, -2.453857421875, -2.0838623046875, -1.7138671875, -1.3438720703125, -0.973876953125, -0.6038818359375, -0.23388671875, 0.1361083984375, 0.506103515625, 0.8760986328125, 1.24609375, 1.6160888671875, 1.986083984375, 2.3560791015625, 2.72607421875, 3.0960693359375, 3.466064453125, 3.8360595703125, 4.2060546875, 4.5760498046875, 4.946044921875, 5.3160400390625, 5.68603515625, 6.0560302734375, 6.426025390625, 6.7960205078125, 7.166015625, 7.5360107421875, 7.906005859375, 8.2760009765625, 8.64599609375, 9.0159912109375, 9.385986328125, 9.7559814453125, 10.1259765625, 10.4959716796875, 10.865966796875, 11.2359619140625, 11.60595703125, 11.9759521484375, 12.345947265625, 12.7159423828125, 13.0859375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 4.0, 9.0, 7.0, 12.0, 15.0, 17.0, 23.0, 29.0, 36.0, 39.0, 81.0, 125.0, 236.0, 464.0, 2064.0, 27714.0, 904821.0, 3153011.0, 98661.0, 5403.0, 741.0, 291.0, 144.0, 87.0, 67.0, 53.0, 33.0, 22.0, 13.0, 11.0, 9.0, 5.0, 6.0, 10.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6875, -34.46533203125, -33.2431640625, -32.02099609375, -30.798828125, -29.57666015625, -28.3544921875, -27.13232421875, -25.91015625, -24.68798828125, -23.4658203125, -22.24365234375, -21.021484375, -19.79931640625, -18.5771484375, -17.35498046875, -16.1328125, -14.91064453125, -13.6884765625, -12.46630859375, -11.244140625, -10.02197265625, -8.7998046875, -7.57763671875, -6.35546875, -5.13330078125, -3.9111328125, -2.68896484375, -1.466796875, -0.24462890625, 0.9775390625, 2.19970703125, 3.421875, 4.64404296875, 5.8662109375, 7.08837890625, 8.310546875, 9.53271484375, 10.7548828125, 11.97705078125, 13.19921875, 14.42138671875, 15.6435546875, 16.86572265625, 18.087890625, 19.31005859375, 20.5322265625, 21.75439453125, 22.9765625, 24.19873046875, 25.4208984375, 26.64306640625, 27.865234375, 29.08740234375, 30.3095703125, 31.53173828125, 32.75390625, 33.97607421875, 35.1982421875, 36.42041015625, 37.642578125, 38.86474609375, 40.0869140625, 41.30908203125, 42.53125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 27.0, 128.0, 328.0, 341.0, 156.0, 31.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-292.38720703125, -287.0774230957031, -281.76763916015625, -276.4578552246094, -271.1480712890625, -265.8382873535156, -260.52850341796875, -255.2187042236328, -249.90892028808594, -244.59913635253906, -239.2893524169922, -233.9795684814453, -228.66976928710938, -223.3599853515625, -218.05020141601562, -212.74041748046875, -207.43063354492188, -202.120849609375, -196.81106567382812, -191.50128173828125, -186.19149780273438, -180.88169860839844, -175.57191467285156, -170.2621307373047, -164.9523468017578, -159.64256286621094, -154.33277893066406, -149.0229949951172, -143.71319580078125, -138.40341186523438, -133.0936279296875, -127.78384399414062, -122.47406005859375, -117.16427612304688, -111.8544921875, -106.5447006225586, -101.23491668701172, -95.92513275146484, -90.61534118652344, -85.30555725097656, -79.99577331542969, -74.68598937988281, -69.37620544433594, -64.06641387939453, -58.756629943847656, -53.44684600830078, -48.13705825805664, -42.8272705078125, -37.517486572265625, -32.20770263671875, -26.89791488647461, -21.5881290435791, -16.278343200683594, -10.968557357788086, -5.658771514892578, -0.3489837646484375, 4.9608001708984375, 10.270586013793945, 15.580371856689453, 20.89015769958496, 26.19994354248047, 31.509729385375977, 36.819515228271484, 42.129302978515625, 47.4390869140625]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 11.0, 5.0, 20.0, 18.0, 27.0, 23.0, 33.0, 21.0, 37.0, 41.0, 39.0, 36.0, 43.0, 43.0, 46.0, 49.0, 45.0, 42.0, 48.0, 45.0, 42.0, 50.0, 33.0, 27.0, 25.0, 24.0, 26.0, 23.0, 14.0, 13.0, 15.0, 8.0, 10.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.999176025390625, -42.53871536254883, -41.0782585144043, -39.6177978515625, -38.15734100341797, -36.69688034057617, -35.236419677734375, -33.775962829589844, -32.31550598144531, -30.85504722595215, -29.394588470458984, -27.934127807617188, -26.473670959472656, -25.01321029663086, -23.552751541137695, -22.09229278564453, -20.631832122802734, -19.17137336730957, -17.710914611816406, -16.25045394897461, -14.789996147155762, -13.329537391662598, -11.869077682495117, -10.408618927001953, -8.948160171508789, -7.487701416015625, -6.027242183685303, -4.5667829513549805, -3.1063241958618164, -1.6458654403686523, -0.18540573120117188, 1.2750530242919922, 2.735515594482422, 4.195974349975586, 5.656433582305908, 7.1168928146362305, 8.577351570129395, 10.037810325622559, 11.498270034790039, 12.958728790283203, 14.419187545776367, 15.879646301269531, 17.340105056762695, 18.80056381225586, 20.261024475097656, 21.721481323242188, 23.181941986083984, 24.64240074157715, 26.102859497070312, 27.563318252563477, 29.02377700805664, 30.484237670898438, 31.94469451904297, 33.405155181884766, 34.86561584472656, 36.326072692871094, 37.786529541015625, 39.24699020385742, 40.70744705200195, 42.16790771484375, 43.62836456298828, 45.08882522583008, 46.549285888671875, 48.009742736816406, 49.4702033996582]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 4.0, 8.0, 11.0, 11.0, 10.0, 9.0, 17.0, 15.0, 23.0, 13.0, 19.0, 24.0, 20.0, 21.0, 19.0, 34.0, 42.0, 31.0, 45.0, 37.0, 30.0, 33.0, 41.0, 48.0, 21.0, 27.0, 38.0, 30.0, 24.0, 42.0, 29.0, 28.0, 19.0, 29.0, 23.0, 12.0, 18.0, 10.0, 15.0, 8.0, 9.0, 3.0, 9.0, 16.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.61328125, -7.37799072265625, -7.1427001953125, -6.90740966796875, -6.672119140625, -6.43682861328125, -6.2015380859375, -5.96624755859375, -5.73095703125, -5.49566650390625, -5.2603759765625, -5.02508544921875, -4.789794921875, -4.55450439453125, -4.3192138671875, -4.08392333984375, -3.8486328125, -3.61334228515625, -3.3780517578125, -3.14276123046875, -2.907470703125, -2.67218017578125, -2.4368896484375, -2.20159912109375, -1.96630859375, -1.73101806640625, -1.4957275390625, -1.26043701171875, -1.025146484375, -0.78985595703125, -0.5545654296875, -0.31927490234375, -0.083984375, 0.15130615234375, 0.3865966796875, 0.62188720703125, 0.857177734375, 1.09246826171875, 1.3277587890625, 1.56304931640625, 1.79833984375, 2.03363037109375, 2.2689208984375, 2.50421142578125, 2.739501953125, 2.97479248046875, 3.2100830078125, 3.44537353515625, 3.6806640625, 3.91595458984375, 4.1512451171875, 4.38653564453125, 4.621826171875, 4.85711669921875, 5.0924072265625, 5.32769775390625, 5.56298828125, 5.79827880859375, 6.0335693359375, 6.26885986328125, 6.504150390625, 6.73944091796875, 6.9747314453125, 7.21002197265625, 7.4453125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 7.0, 2.0, 4.0, 6.0, 25.0, 45.0, 56.0, 65.0, 99.0, 147.0, 242.0, 374.0, 587.0, 798.0, 1206.0, 1817.0, 2746.0, 4102.0, 6171.0, 8844.0, 13184.0, 18763.0, 27250.0, 37698.0, 51576.0, 67741.0, 84556.0, 99759.0, 109261.0, 107199.0, 96192.0, 81402.0, 63677.0, 48042.0, 35171.0, 25169.0, 17377.0, 11948.0, 8222.0, 5539.0, 3750.0, 2563.0, 1724.0, 1156.0, 742.0, 512.0, 339.0, 242.0, 174.0, 103.0, 66.0, 44.0, 32.0, 20.0, 13.0, 5.0, 5.0, 7.0, 2.0, 3.0], "bins": [-0.9287109375, -0.9004745483398438, -0.8722381591796875, -0.8440017700195312, -0.815765380859375, -0.7875289916992188, -0.7592926025390625, -0.7310562133789062, -0.70281982421875, -0.6745834350585938, -0.6463470458984375, -0.6181106567382812, -0.589874267578125, -0.5616378784179688, -0.5334014892578125, -0.5051651000976562, -0.4769287109375, -0.44869232177734375, -0.4204559326171875, -0.39221954345703125, -0.363983154296875, -0.33574676513671875, -0.3075103759765625, -0.27927398681640625, -0.25103759765625, -0.22280120849609375, -0.1945648193359375, -0.16632843017578125, -0.138092041015625, -0.10985565185546875, -0.0816192626953125, -0.05338287353515625, -0.025146484375, 0.00308990478515625, 0.0313262939453125, 0.05956268310546875, 0.087799072265625, 0.11603546142578125, 0.1442718505859375, 0.17250823974609375, 0.20074462890625, 0.22898101806640625, 0.2572174072265625, 0.28545379638671875, 0.313690185546875, 0.34192657470703125, 0.3701629638671875, 0.39839935302734375, 0.4266357421875, 0.45487213134765625, 0.4831085205078125, 0.5113449096679688, 0.539581298828125, 0.5678176879882812, 0.5960540771484375, 0.6242904663085938, 0.65252685546875, 0.6807632446289062, 0.7089996337890625, 0.7372360229492188, 0.765472412109375, 0.7937088012695312, 0.8219451904296875, 0.8501815795898438, 0.87841796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 11.0, 9.0, 7.0, 13.0, 18.0, 19.0, 19.0, 15.0, 17.0, 26.0, 29.0, 39.0, 46.0, 39.0, 36.0, 52.0, 43.0, 44.0, 1065.0, 39.0, 46.0, 63.0, 40.0, 43.0, 38.0, 39.0, 32.0, 27.0, 21.0, 15.0, 13.0, 8.0, 16.0, 8.0, 8.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.13177490234375, -5.9354248046875, -5.73907470703125, -5.542724609375, -5.34637451171875, -5.1500244140625, -4.95367431640625, -4.75732421875, -4.56097412109375, -4.3646240234375, -4.16827392578125, -3.971923828125, -3.77557373046875, -3.5792236328125, -3.38287353515625, -3.1865234375, -2.99017333984375, -2.7938232421875, -2.59747314453125, -2.401123046875, -2.20477294921875, -2.0084228515625, -1.81207275390625, -1.61572265625, -1.41937255859375, -1.2230224609375, -1.02667236328125, -0.830322265625, -0.63397216796875, -0.4376220703125, -0.24127197265625, -0.044921875, 0.15142822265625, 0.3477783203125, 0.54412841796875, 0.740478515625, 0.93682861328125, 1.1331787109375, 1.32952880859375, 1.52587890625, 1.72222900390625, 1.9185791015625, 2.11492919921875, 2.311279296875, 2.50762939453125, 2.7039794921875, 2.90032958984375, 3.0966796875, 3.29302978515625, 3.4893798828125, 3.68572998046875, 3.882080078125, 4.07843017578125, 4.2747802734375, 4.47113037109375, 4.66748046875, 4.86383056640625, 5.0601806640625, 5.25653076171875, 5.452880859375, 5.64923095703125, 5.8455810546875, 6.04193115234375, 6.23828125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 12.0, 17.0, 22.0, 30.0, 46.0, 85.0, 118.0, 180.0, 273.0, 436.0, 586.0, 826.0, 1324.0, 2075.0, 2848.0, 4482.0, 6588.0, 9737.0, 14543.0, 21201.0, 32735.0, 1828055.0, 85279.0, 28178.0, 18499.0, 12741.0, 8608.0, 5739.0, 3749.0, 2751.0, 1834.0, 1175.0, 777.0, 529.0, 318.0, 231.0, 162.0, 99.0, 71.0, 52.0, 47.0, 25.0, 15.0, 14.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8017578125, -1.7392730712890625, -1.676788330078125, -1.6143035888671875, -1.55181884765625, -1.4893341064453125, -1.426849365234375, -1.3643646240234375, -1.3018798828125, -1.2393951416015625, -1.176910400390625, -1.1144256591796875, -1.05194091796875, -0.9894561767578125, -0.926971435546875, -0.8644866943359375, -0.802001953125, -0.7395172119140625, -0.677032470703125, -0.6145477294921875, -0.55206298828125, -0.4895782470703125, -0.427093505859375, -0.3646087646484375, -0.3021240234375, -0.2396392822265625, -0.177154541015625, -0.1146697998046875, -0.05218505859375, 0.0102996826171875, 0.072784423828125, 0.1352691650390625, 0.19775390625, 0.2602386474609375, 0.322723388671875, 0.3852081298828125, 0.44769287109375, 0.5101776123046875, 0.572662353515625, 0.6351470947265625, 0.6976318359375, 0.7601165771484375, 0.822601318359375, 0.8850860595703125, 0.94757080078125, 1.0100555419921875, 1.072540283203125, 1.1350250244140625, 1.197509765625, 1.2599945068359375, 1.322479248046875, 1.3849639892578125, 1.44744873046875, 1.5099334716796875, 1.572418212890625, 1.6349029541015625, 1.6973876953125, 1.7598724365234375, 1.822357177734375, 1.8848419189453125, 1.94732666015625, 2.0098114013671875, 2.072296142578125, 2.1347808837890625, 2.197265625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 6.0, 2.0, 8.0, 10.0, 9.0, 12.0, 15.0, 17.0, 21.0, 23.0, 29.0, 29.0, 60.0, 77.0, 79.0, 81.0, 67.0, 72.0, 77.0, 53.0, 37.0, 35.0, 26.0, 25.0, 16.0, 13.0, 11.0, 16.0, 10.0, 9.0, 10.0, 8.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06622314453125, -0.06443405151367188, -0.06264495849609375, -0.060855865478515625, -0.0590667724609375, -0.057277679443359375, -0.05548858642578125, -0.053699493408203125, -0.051910400390625, -0.050121307373046875, -0.04833221435546875, -0.046543121337890625, -0.0447540283203125, -0.042964935302734375, -0.04117584228515625, -0.039386749267578125, -0.03759765625, -0.035808563232421875, -0.03401947021484375, -0.032230377197265625, -0.0304412841796875, -0.028652191162109375, -0.02686309814453125, -0.025074005126953125, -0.023284912109375, -0.021495819091796875, -0.01970672607421875, -0.017917633056640625, -0.0161285400390625, -0.014339447021484375, -0.01255035400390625, -0.010761260986328125, -0.00897216796875, -0.007183074951171875, -0.00539398193359375, -0.003604888916015625, -0.0018157958984375, -2.6702880859375e-05, 0.00176239013671875, 0.003551483154296875, 0.005340576171875, 0.007129669189453125, 0.00891876220703125, 0.010707855224609375, 0.0124969482421875, 0.014286041259765625, 0.01607513427734375, 0.017864227294921875, 0.0196533203125, 0.021442413330078125, 0.02323150634765625, 0.025020599365234375, 0.0268096923828125, 0.028598785400390625, 0.03038787841796875, 0.032176971435546875, 0.033966064453125, 0.035755157470703125, 0.03754425048828125, 0.039333343505859375, 0.0411224365234375, 0.042911529541015625, 0.04470062255859375, 0.046489715576171875, 0.04827880859375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 9.0, 4.0, 13.0, 14.0, 15.0, 17.0, 23.0, 32.0, 32.0, 43.0, 48.0, 70.0, 96.0, 146.0, 251.0, 427.0, 729.0, 7423.0, 1032911.0, 4370.0, 713.0, 397.0, 205.0, 153.0, 101.0, 68.0, 54.0, 29.0, 24.0, 24.0, 14.0, 19.0, 12.0, 10.0, 13.0, 7.0, 10.0, 7.0, 7.0, 5.0, 0.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9226455688476562, -0.8877716064453125, -0.8528976440429688, -0.818023681640625, -0.7831497192382812, -0.7482757568359375, -0.7134017944335938, -0.67852783203125, -0.6436538696289062, -0.6087799072265625, -0.5739059448242188, -0.539031982421875, -0.5041580200195312, -0.4692840576171875, -0.43441009521484375, -0.3995361328125, -0.36466217041015625, -0.3297882080078125, -0.29491424560546875, -0.260040283203125, -0.22516632080078125, -0.1902923583984375, -0.15541839599609375, -0.12054443359375, -0.08567047119140625, -0.0507965087890625, -0.01592254638671875, 0.018951416015625, 0.05382537841796875, 0.0886993408203125, 0.12357330322265625, 0.158447265625, 0.19332122802734375, 0.2281951904296875, 0.26306915283203125, 0.297943115234375, 0.33281707763671875, 0.3676910400390625, 0.40256500244140625, 0.43743896484375, 0.47231292724609375, 0.5071868896484375, 0.5420608520507812, 0.576934814453125, 0.6118087768554688, 0.6466827392578125, 0.6815567016601562, 0.7164306640625, 0.7513046264648438, 0.7861785888671875, 0.8210525512695312, 0.855926513671875, 0.8908004760742188, 0.9256744384765625, 0.9605484008789062, 0.99542236328125, 1.0302963256835938, 1.0651702880859375, 1.1000442504882812, 1.134918212890625, 1.1697921752929688, 1.2046661376953125, 1.2395401000976562, 1.2744140625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 12.0, 440.0, 545.0, 11.0, 3.0, 0.0, 1.0], "bins": [-1.2427388429641724, -1.2216887474060059, -1.2006386518478394, -1.1795885562896729, -1.1585384607315063, -1.1374883651733398, -1.1164381504058838, -1.0953881740570068, -1.0743379592895508, -1.0532878637313843, -1.0322377681732178, -1.0111876726150513, -0.99013751745224, -0.9690874218940735, -0.948037326335907, -0.9269872307777405, -0.9059371948242188, -0.8848870992660522, -0.8638370037078857, -0.8427869081497192, -0.821736752986908, -0.8006866574287415, -0.779636561870575, -0.7585864663124084, -0.7375363111495972, -0.7164862155914307, -0.6954361200332642, -0.6743860244750977, -0.6533358693122864, -0.6322857737541199, -0.6112356781959534, -0.5901855826377869, -0.5691354870796204, -0.5480853915214539, -0.5270352959632874, -0.5059851408004761, -0.48493507504463196, -0.46388494968414307, -0.44283485412597656, -0.42178475856781006, -0.40073466300964355, -0.37968456745147705, -0.35863444209098816, -0.33758434653282166, -0.31653425097465515, -0.29548412561416626, -0.27443403005599976, -0.25338393449783325, -0.23233380913734436, -0.21128369867801666, -0.19023360311985016, -0.16918349266052246, -0.14813339710235596, -0.12708328664302826, -0.10603317618370056, -0.08498308062553406, -0.06393297761678696, -0.042882874608039856, -0.021832767874002457, -0.0007826611399650574, 0.020267441868782043, 0.041317544877529144, 0.06236765533685684, 0.08341775089502335, 0.10446786135435104]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 4.0, 4.0, 10.0, 10.0, 14.0, 16.0, 17.0, 24.0, 27.0, 19.0, 30.0, 40.0, 52.0, 41.0, 39.0, 38.0, 42.0, 56.0, 45.0, 46.0, 45.0, 38.0, 37.0, 41.0, 42.0, 37.0, 35.0, 27.0, 14.0, 24.0, 13.0, 14.0, 8.0, 11.0, 9.0, 2.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1104973554611206, -0.10671819746494293, -0.10293903946876526, -0.09915988147258759, -0.09538072347640991, -0.09160156548023224, -0.08782241493463516, -0.08404325693845749, -0.08026409894227982, -0.07648494094610214, -0.07270578294992447, -0.0689266249537468, -0.06514747440814972, -0.06136831268668175, -0.05758915841579437, -0.0538100004196167, -0.050030842423439026, -0.04625168442726135, -0.04247252643108368, -0.038693372160196304, -0.03491421416401863, -0.031135056167840958, -0.027355900034308434, -0.02357674390077591, -0.019797585904598236, -0.016018427908420563, -0.012239271774888039, -0.00846011471003294, -0.004680957645177841, -0.0009017996490001678, 0.0028773564845323563, 0.00665651261806488, 0.010435670614242554, 0.014214827679097652, 0.01799398474395275, 0.021773140877485275, 0.02555229887366295, 0.029331456869840622, 0.033110611140728, 0.03688976913690567, 0.040668927133083344, 0.04444808512926102, 0.04822724312543869, 0.052006397396326065, 0.05578555539250374, 0.05956471338868141, 0.06334386765956879, 0.06712302565574646, 0.07090218365192413, 0.0746813416481018, 0.07846049964427948, 0.08223965764045715, 0.08601881563663483, 0.0897979736328125, 0.09357712417840958, 0.09735628217458725, 0.10113544017076492, 0.1049145981669426, 0.10869375616312027, 0.11247291415929794, 0.11625206470489502, 0.12003122270107269, 0.12381038069725037, 0.12758953869342804, 0.1313686966896057]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 10.0, 7.0, 15.0, 11.0, 17.0, 10.0, 23.0, 19.0, 21.0, 25.0, 37.0, 30.0, 34.0, 32.0, 39.0, 35.0, 48.0, 36.0, 53.0, 43.0, 35.0, 44.0, 36.0, 35.0, 45.0, 33.0, 31.0, 24.0, 19.0, 18.0, 16.0, 16.0, 21.0, 13.0, 9.0, 15.0, 8.0, 6.0, 8.0, 3.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.5078125, -8.239013671875, -7.97021484375, -7.701416015625, -7.4326171875, -7.163818359375, -6.89501953125, -6.626220703125, -6.357421875, -6.088623046875, -5.81982421875, -5.551025390625, -5.2822265625, -5.013427734375, -4.74462890625, -4.475830078125, -4.20703125, -3.938232421875, -3.66943359375, -3.400634765625, -3.1318359375, -2.863037109375, -2.59423828125, -2.325439453125, -2.056640625, -1.787841796875, -1.51904296875, -1.250244140625, -0.9814453125, -0.712646484375, -0.44384765625, -0.175048828125, 0.09375, 0.362548828125, 0.63134765625, 0.900146484375, 1.1689453125, 1.437744140625, 1.70654296875, 1.975341796875, 2.244140625, 2.512939453125, 2.78173828125, 3.050537109375, 3.3193359375, 3.588134765625, 3.85693359375, 4.125732421875, 4.39453125, 4.663330078125, 4.93212890625, 5.200927734375, 5.4697265625, 5.738525390625, 6.00732421875, 6.276123046875, 6.544921875, 6.813720703125, 7.08251953125, 7.351318359375, 7.6201171875, 7.888916015625, 8.15771484375, 8.426513671875, 8.6953125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 17.0, 16.0, 11.0, 25.0, 30.0, 40.0, 57.0, 59.0, 87.0, 116.0, 164.0, 230.0, 319.0, 504.0, 880.0, 1649.0, 3191.0, 6081.0, 12563.0, 25450.0, 52371.0, 108048.0, 221889.0, 289509.0, 167499.0, 79778.0, 38926.0, 19088.0, 9418.0, 4673.0, 2449.0, 1203.0, 766.0, 430.0, 294.0, 189.0, 134.0, 95.0, 73.0, 51.0, 35.0, 37.0, 27.0, 21.0, 14.0, 16.0, 9.0, 7.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0], "bins": [-10.03125, -9.72998046875, -9.4287109375, -9.12744140625, -8.826171875, -8.52490234375, -8.2236328125, -7.92236328125, -7.62109375, -7.31982421875, -7.0185546875, -6.71728515625, -6.416015625, -6.11474609375, -5.8134765625, -5.51220703125, -5.2109375, -4.90966796875, -4.6083984375, -4.30712890625, -4.005859375, -3.70458984375, -3.4033203125, -3.10205078125, -2.80078125, -2.49951171875, -2.1982421875, -1.89697265625, -1.595703125, -1.29443359375, -0.9931640625, -0.69189453125, -0.390625, -0.08935546875, 0.2119140625, 0.51318359375, 0.814453125, 1.11572265625, 1.4169921875, 1.71826171875, 2.01953125, 2.32080078125, 2.6220703125, 2.92333984375, 3.224609375, 3.52587890625, 3.8271484375, 4.12841796875, 4.4296875, 4.73095703125, 5.0322265625, 5.33349609375, 5.634765625, 5.93603515625, 6.2373046875, 6.53857421875, 6.83984375, 7.14111328125, 7.4423828125, 7.74365234375, 8.044921875, 8.34619140625, 8.6474609375, 8.94873046875, 9.25]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 3.0, 11.0, 8.0, 7.0, 19.0, 25.0, 18.0, 18.0, 23.0, 32.0, 34.0, 39.0, 43.0, 51.0, 87.0, 134.0, 241.0, 1371.0, 271.0, 140.0, 90.0, 52.0, 54.0, 34.0, 41.0, 39.0, 29.0, 26.0, 14.0, 15.0, 12.0, 10.0, 6.0, 10.0, 6.0, 11.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -20.95751953125, -20.2275390625, -19.49755859375, -18.767578125, -18.03759765625, -17.3076171875, -16.57763671875, -15.84765625, -15.11767578125, -14.3876953125, -13.65771484375, -12.927734375, -12.19775390625, -11.4677734375, -10.73779296875, -10.0078125, -9.27783203125, -8.5478515625, -7.81787109375, -7.087890625, -6.35791015625, -5.6279296875, -4.89794921875, -4.16796875, -3.43798828125, -2.7080078125, -1.97802734375, -1.248046875, -0.51806640625, 0.2119140625, 0.94189453125, 1.671875, 2.40185546875, 3.1318359375, 3.86181640625, 4.591796875, 5.32177734375, 6.0517578125, 6.78173828125, 7.51171875, 8.24169921875, 8.9716796875, 9.70166015625, 10.431640625, 11.16162109375, 11.8916015625, 12.62158203125, 13.3515625, 14.08154296875, 14.8115234375, 15.54150390625, 16.271484375, 17.00146484375, 17.7314453125, 18.46142578125, 19.19140625, 19.92138671875, 20.6513671875, 21.38134765625, 22.111328125, 22.84130859375, 23.5712890625, 24.30126953125, 25.03125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 13.0, 21.0, 19.0, 29.0, 37.0, 73.0, 100.0, 168.0, 241.0, 481.0, 1003.0, 4159.0, 3125672.0, 11138.0, 1151.0, 569.0, 296.0, 185.0, 103.0, 61.0, 39.0, 24.0, 23.0, 21.0, 19.0, 13.0, 10.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-110.8125, -107.513671875, -104.21484375, -100.916015625, -97.6171875, -94.318359375, -91.01953125, -87.720703125, -84.421875, -81.123046875, -77.82421875, -74.525390625, -71.2265625, -67.927734375, -64.62890625, -61.330078125, -58.03125, -54.732421875, -51.43359375, -48.134765625, -44.8359375, -41.537109375, -38.23828125, -34.939453125, -31.640625, -28.341796875, -25.04296875, -21.744140625, -18.4453125, -15.146484375, -11.84765625, -8.548828125, -5.25, -1.951171875, 1.34765625, 4.646484375, 7.9453125, 11.244140625, 14.54296875, 17.841796875, 21.140625, 24.439453125, 27.73828125, 31.037109375, 34.3359375, 37.634765625, 40.93359375, 44.232421875, 47.53125, 50.830078125, 54.12890625, 57.427734375, 60.7265625, 64.025390625, 67.32421875, 70.623046875, 73.921875, 77.220703125, 80.51953125, 83.818359375, 87.1171875, 90.416015625, 93.71484375, 97.013671875, 100.3125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 24.0, 52.0, 81.0, 171.0, 219.0, 200.0, 135.0, 67.0, 33.0, 17.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.076915740966797, -22.513221740722656, -19.949525833129883, -17.385831832885742, -14.822136878967285, -12.258441925048828, -9.694747924804688, -7.131052017211914, -4.567358016967773, -2.0036633014678955, 0.5600314140319824, 3.1237258911132812, 5.687420845031738, 8.251115798950195, 10.814809799194336, 13.37850570678711, 15.94219970703125, 18.50589370727539, 21.069589614868164, 23.633283615112305, 26.196979522705078, 28.76067352294922, 31.32436752319336, 33.8880615234375, 36.451759338378906, 39.01545333862305, 41.57914733886719, 44.142845153808594, 46.706539154052734, 49.270233154296875, 51.833927154541016, 54.397621154785156, 56.96131134033203, 59.52500534057617, 62.08869934082031, 64.65239715576172, 67.2160873413086, 69.77978515625, 72.34347534179688, 74.90717315673828, 77.47087097167969, 80.0345687866211, 82.59825897216797, 85.16195678710938, 87.72564697265625, 90.28934478759766, 92.85304260253906, 95.41673278808594, 97.98042297363281, 100.54412078857422, 103.1078109741211, 105.6715087890625, 108.23519897460938, 110.79889678955078, 113.36259460449219, 115.92628479003906, 118.48998260498047, 121.05368041992188, 123.61737060546875, 126.18106842041016, 128.74476623535156, 131.30845642089844, 133.8721466064453, 136.43585205078125, 138.99954223632812]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 8.0, 7.0, 9.0, 9.0, 12.0, 18.0, 17.0, 17.0, 18.0, 29.0, 33.0, 27.0, 33.0, 28.0, 46.0, 41.0, 38.0, 58.0, 44.0, 52.0, 50.0, 59.0, 40.0, 39.0, 35.0, 36.0, 37.0, 36.0, 22.0, 19.0, 13.0, 11.0, 11.0, 9.0, 9.0, 9.0, 4.0, 7.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.68386840820312, -73.52392578125, -71.36397552490234, -69.20403289794922, -67.04408264160156, -64.88414001464844, -62.72419738769531, -60.56425094604492, -58.40430450439453, -56.24435806274414, -54.08441162109375, -51.924468994140625, -49.764522552490234, -47.604576110839844, -45.44463348388672, -43.28468704223633, -41.12474060058594, -38.96479415893555, -36.804847717285156, -34.64490509033203, -32.48495864868164, -30.32501220703125, -28.165067672729492, -26.005123138427734, -23.845176696777344, -21.685230255126953, -19.525285720825195, -17.365341186523438, -15.205394744873047, -13.045449256896973, -10.885503768920898, -8.725558280944824, -6.56561279296875, -4.405667304992676, -2.2457218170166016, -0.08577632904052734, 2.074169158935547, 4.234114646911621, 6.394060134887695, 8.55400562286377, 10.713951110839844, 12.873896598815918, 15.033842086791992, 17.19378662109375, 19.35373306274414, 21.51367950439453, 23.67362403869629, 25.833568572998047, 27.993515014648438, 30.153461456298828, 32.31340789794922, 34.473350524902344, 36.633296966552734, 38.793243408203125, 40.95318603515625, 43.11313247680664, 45.27307891845703, 47.43302536010742, 49.59297180175781, 51.75291442871094, 53.91286087036133, 56.07280731201172, 58.232749938964844, 60.392696380615234, 62.552642822265625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 6.0, 9.0, 9.0, 19.0, 21.0, 10.0, 21.0, 28.0, 26.0, 29.0, 36.0, 40.0, 33.0, 56.0, 58.0, 39.0, 36.0, 62.0, 43.0, 41.0, 36.0, 37.0, 40.0, 37.0, 26.0, 38.0, 23.0, 21.0, 26.0, 15.0, 12.0, 12.0, 14.0, 10.0, 7.0, 12.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.55810546875, -8.2568359375, -7.95556640625, -7.654296875, -7.35302734375, -7.0517578125, -6.75048828125, -6.44921875, -6.14794921875, -5.8466796875, -5.54541015625, -5.244140625, -4.94287109375, -4.6416015625, -4.34033203125, -4.0390625, -3.73779296875, -3.4365234375, -3.13525390625, -2.833984375, -2.53271484375, -2.2314453125, -1.93017578125, -1.62890625, -1.32763671875, -1.0263671875, -0.72509765625, -0.423828125, -0.12255859375, 0.1787109375, 0.47998046875, 0.78125, 1.08251953125, 1.3837890625, 1.68505859375, 1.986328125, 2.28759765625, 2.5888671875, 2.89013671875, 3.19140625, 3.49267578125, 3.7939453125, 4.09521484375, 4.396484375, 4.69775390625, 4.9990234375, 5.30029296875, 5.6015625, 5.90283203125, 6.2041015625, 6.50537109375, 6.806640625, 7.10791015625, 7.4091796875, 7.71044921875, 8.01171875, 8.31298828125, 8.6142578125, 8.91552734375, 9.216796875, 9.51806640625, 9.8193359375, 10.12060546875, 10.421875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 9.0, 20.0, 36.0, 64.0, 81.0, 119.0, 218.0, 336.0, 592.0, 1018.0, 1998.0, 3930.0, 9093.0, 24569.0, 82986.0, 306754.0, 917224.0, 1581925.0, 864570.0, 283338.0, 76485.0, 22605.0, 8303.0, 3802.0, 1878.0, 926.0, 537.0, 339.0, 181.0, 115.0, 68.0, 49.0, 23.0, 19.0, 10.0, 12.0, 8.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-11.3515625, -11.0123291015625, -10.673095703125, -10.3338623046875, -9.99462890625, -9.6553955078125, -9.316162109375, -8.9769287109375, -8.6376953125, -8.2984619140625, -7.959228515625, -7.6199951171875, -7.28076171875, -6.9415283203125, -6.602294921875, -6.2630615234375, -5.923828125, -5.5845947265625, -5.245361328125, -4.9061279296875, -4.56689453125, -4.2276611328125, -3.888427734375, -3.5491943359375, -3.2099609375, -2.8707275390625, -2.531494140625, -2.1922607421875, -1.85302734375, -1.5137939453125, -1.174560546875, -0.8353271484375, -0.49609375, -0.1568603515625, 0.182373046875, 0.5216064453125, 0.86083984375, 1.2000732421875, 1.539306640625, 1.8785400390625, 2.2177734375, 2.5570068359375, 2.896240234375, 3.2354736328125, 3.57470703125, 3.9139404296875, 4.253173828125, 4.5924072265625, 4.931640625, 5.2708740234375, 5.610107421875, 5.9493408203125, 6.28857421875, 6.6278076171875, 6.967041015625, 7.3062744140625, 7.6455078125, 7.9847412109375, 8.323974609375, 8.6632080078125, 9.00244140625, 9.3416748046875, 9.680908203125, 10.0201416015625, 10.359375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 9.0, 12.0, 8.0, 15.0, 14.0, 20.0, 18.0, 33.0, 34.0, 43.0, 70.0, 85.0, 99.0, 104.0, 114.0, 190.0, 234.0, 230.0, 296.0, 325.0, 320.0, 295.0, 252.0, 205.0, 207.0, 157.0, 100.0, 114.0, 85.0, 76.0, 67.0, 50.0, 35.0, 30.0, 29.0, 27.0, 16.0, 9.0, 10.0, 12.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.890625, -9.57177734375, -9.2529296875, -8.93408203125, -8.615234375, -8.29638671875, -7.9775390625, -7.65869140625, -7.33984375, -7.02099609375, -6.7021484375, -6.38330078125, -6.064453125, -5.74560546875, -5.4267578125, -5.10791015625, -4.7890625, -4.47021484375, -4.1513671875, -3.83251953125, -3.513671875, -3.19482421875, -2.8759765625, -2.55712890625, -2.23828125, -1.91943359375, -1.6005859375, -1.28173828125, -0.962890625, -0.64404296875, -0.3251953125, -0.00634765625, 0.3125, 0.63134765625, 0.9501953125, 1.26904296875, 1.587890625, 1.90673828125, 2.2255859375, 2.54443359375, 2.86328125, 3.18212890625, 3.5009765625, 3.81982421875, 4.138671875, 4.45751953125, 4.7763671875, 5.09521484375, 5.4140625, 5.73291015625, 6.0517578125, 6.37060546875, 6.689453125, 7.00830078125, 7.3271484375, 7.64599609375, 7.96484375, 8.28369140625, 8.6025390625, 8.92138671875, 9.240234375, 9.55908203125, 9.8779296875, 10.19677734375, 10.515625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 13.0, 13.0, 18.0, 17.0, 26.0, 43.0, 46.0, 68.0, 106.0, 140.0, 219.0, 294.0, 513.0, 754.0, 1287.0, 2685.0, 6822.0, 29019.0, 174211.0, 1075466.0, 2311136.0, 489736.0, 78124.0, 14784.0, 4225.0, 1742.0, 946.0, 584.0, 363.0, 268.0, 167.0, 132.0, 67.0, 54.0, 47.0, 42.0, 27.0, 19.0, 15.0, 6.0, 11.0, 5.0, 6.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.108642578125, -15.57666015625, -15.044677734375, -14.5126953125, -13.980712890625, -13.44873046875, -12.916748046875, -12.384765625, -11.852783203125, -11.32080078125, -10.788818359375, -10.2568359375, -9.724853515625, -9.19287109375, -8.660888671875, -8.12890625, -7.596923828125, -7.06494140625, -6.532958984375, -6.0009765625, -5.468994140625, -4.93701171875, -4.405029296875, -3.873046875, -3.341064453125, -2.80908203125, -2.277099609375, -1.7451171875, -1.213134765625, -0.68115234375, -0.149169921875, 0.3828125, 0.914794921875, 1.44677734375, 1.978759765625, 2.5107421875, 3.042724609375, 3.57470703125, 4.106689453125, 4.638671875, 5.170654296875, 5.70263671875, 6.234619140625, 6.7666015625, 7.298583984375, 7.83056640625, 8.362548828125, 8.89453125, 9.426513671875, 9.95849609375, 10.490478515625, 11.0224609375, 11.554443359375, 12.08642578125, 12.618408203125, 13.150390625, 13.682373046875, 14.21435546875, 14.746337890625, 15.2783203125, 15.810302734375, 16.34228515625, 16.874267578125, 17.40625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 26.0, 973.0, 16.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1041.1632080078125, -1011.8036499023438, -982.4441528320312, -953.0845947265625, -923.7250366210938, -894.3655395507812, -865.0059814453125, -835.646484375, -806.2869262695312, -776.9273681640625, -747.56787109375, -718.2083129882812, -688.8487548828125, -659.4892578125, -630.1296997070312, -600.7701416015625, -571.41064453125, -542.0510864257812, -512.6915893554688, -483.33203125, -453.9725036621094, -424.61297607421875, -395.25341796875, -365.8938903808594, -336.5343017578125, -307.1747741699219, -277.8152160644531, -248.4556884765625, -219.09616088867188, -189.7366180419922, -160.3770751953125, -131.01754760742188, -101.65802001953125, -72.2984848022461, -42.93894577026367, -13.57940673828125, 15.780128479003906, 45.13966369628906, 74.49920654296875, 103.85873413085938, 133.21827697753906, 162.57781982421875, 191.93734741210938, 221.29689025878906, 250.65643310546875, 280.0159606933594, 309.37548828125, 338.73504638671875, 368.0945739746094, 397.4541015625, 426.81365966796875, 456.1731872558594, 485.53271484375, 514.8922729492188, 544.2518310546875, 573.611328125, 602.9708862304688, 632.3304443359375, 661.68994140625, 691.0494995117188, 720.4090576171875, 749.7685546875, 779.1281127929688, 808.4876708984375, 837.84716796875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 4.0, 10.0, 8.0, 9.0, 13.0, 15.0, 12.0, 15.0, 20.0, 20.0, 32.0, 20.0, 25.0, 37.0, 35.0, 43.0, 38.0, 41.0, 48.0, 40.0, 36.0, 45.0, 29.0, 40.0, 45.0, 35.0, 35.0, 33.0, 25.0, 24.0, 18.0, 27.0, 24.0, 22.0, 20.0, 9.0, 12.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.60017013549805, -42.937538146972656, -41.27490234375, -39.61227035522461, -37.94963836669922, -36.28700256347656, -34.62437057495117, -32.96173858642578, -31.299102783203125, -29.6364688873291, -27.973834991455078, -26.311203002929688, -24.648569107055664, -22.98593521118164, -21.32330322265625, -19.660669326782227, -17.998035430908203, -16.33540153503418, -14.672768592834473, -13.010135650634766, -11.347501754760742, -9.684867858886719, -8.022234916687012, -6.359601974487305, -4.696968078613281, -3.034334659576416, -1.3717012405395508, 0.29093217849731445, 1.9535655975341797, 3.616199493408203, 5.27883243560791, 6.941465377807617, 8.604095458984375, 10.266729354858398, 11.929362297058105, 13.591995239257812, 15.254629135131836, 16.91726303100586, 18.57989501953125, 20.242528915405273, 21.905162811279297, 23.56779670715332, 25.230430603027344, 26.893062591552734, 28.555696487426758, 30.21833038330078, 31.880962371826172, 33.54359436035156, 35.20623016357422, 36.86886215209961, 38.531497955322266, 40.194129943847656, 41.85676574707031, 43.5193977355957, 45.182029724121094, 46.84466552734375, 48.50729751586914, 50.16992950439453, 51.83256530761719, 53.49519729614258, 55.15782928466797, 56.820465087890625, 58.483097076416016, 60.145729064941406, 61.80836486816406]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 5.0, 6.0, 15.0, 16.0, 11.0, 13.0, 21.0, 21.0, 32.0, 37.0, 26.0, 33.0, 33.0, 47.0, 54.0, 38.0, 32.0, 52.0, 39.0, 41.0, 35.0, 43.0, 42.0, 35.0, 28.0, 35.0, 28.0, 27.0, 19.0, 28.0, 14.0, 18.0, 18.0, 6.0, 7.0, 7.0, 3.0, 6.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.63671875, -7.395263671875, -7.15380859375, -6.912353515625, -6.6708984375, -6.429443359375, -6.18798828125, -5.946533203125, -5.705078125, -5.463623046875, -5.22216796875, -4.980712890625, -4.7392578125, -4.497802734375, -4.25634765625, -4.014892578125, -3.7734375, -3.531982421875, -3.29052734375, -3.049072265625, -2.8076171875, -2.566162109375, -2.32470703125, -2.083251953125, -1.841796875, -1.600341796875, -1.35888671875, -1.117431640625, -0.8759765625, -0.634521484375, -0.39306640625, -0.151611328125, 0.08984375, 0.331298828125, 0.57275390625, 0.814208984375, 1.0556640625, 1.297119140625, 1.53857421875, 1.780029296875, 2.021484375, 2.262939453125, 2.50439453125, 2.745849609375, 2.9873046875, 3.228759765625, 3.47021484375, 3.711669921875, 3.953125, 4.194580078125, 4.43603515625, 4.677490234375, 4.9189453125, 5.160400390625, 5.40185546875, 5.643310546875, 5.884765625, 6.126220703125, 6.36767578125, 6.609130859375, 6.8505859375, 7.092041015625, 7.33349609375, 7.574951171875, 7.81640625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 8.0, 10.0, 7.0, 22.0, 31.0, 59.0, 69.0, 138.0, 205.0, 330.0, 538.0, 833.0, 1350.0, 2111.0, 3395.0, 5071.0, 8091.0, 12157.0, 18260.0, 26902.0, 38661.0, 54218.0, 73313.0, 93755.0, 111742.0, 120862.0, 114924.0, 98477.0, 77171.0, 58038.0, 41716.0, 29103.0, 19789.0, 13064.0, 8667.0, 5665.0, 3570.0, 2334.0, 1418.0, 882.0, 607.0, 376.0, 244.0, 150.0, 93.0, 51.0, 29.0, 19.0, 13.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.8291015625, -0.8044281005859375, -0.779754638671875, -0.7550811767578125, -0.73040771484375, -0.7057342529296875, -0.681060791015625, -0.6563873291015625, -0.6317138671875, -0.6070404052734375, -0.582366943359375, -0.5576934814453125, -0.53302001953125, -0.5083465576171875, -0.483673095703125, -0.4589996337890625, -0.434326171875, -0.4096527099609375, -0.384979248046875, -0.3603057861328125, -0.33563232421875, -0.3109588623046875, -0.286285400390625, -0.2616119384765625, -0.2369384765625, -0.2122650146484375, -0.187591552734375, -0.1629180908203125, -0.13824462890625, -0.1135711669921875, -0.088897705078125, -0.0642242431640625, -0.03955078125, -0.0148773193359375, 0.009796142578125, 0.0344696044921875, 0.05914306640625, 0.0838165283203125, 0.108489990234375, 0.1331634521484375, 0.1578369140625, 0.1825103759765625, 0.207183837890625, 0.2318572998046875, 0.25653076171875, 0.2812042236328125, 0.305877685546875, 0.3305511474609375, 0.355224609375, 0.3798980712890625, 0.404571533203125, 0.4292449951171875, 0.45391845703125, 0.4785919189453125, 0.503265380859375, 0.5279388427734375, 0.5526123046875, 0.5772857666015625, 0.601959228515625, 0.6266326904296875, 0.65130615234375, 0.6759796142578125, 0.700653076171875, 0.7253265380859375, 0.75]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 5.0, 5.0, 10.0, 12.0, 8.0, 10.0, 14.0, 25.0, 20.0, 25.0, 17.0, 30.0, 30.0, 38.0, 31.0, 42.0, 39.0, 50.0, 50.0, 38.0, 1071.0, 39.0, 36.0, 36.0, 37.0, 45.0, 34.0, 22.0, 27.0, 18.0, 32.0, 26.0, 21.0, 16.0, 16.0, 11.0, 10.0, 5.0, 7.0, 0.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.94140625, -5.76898193359375, -5.5965576171875, -5.42413330078125, -5.251708984375, -5.07928466796875, -4.9068603515625, -4.73443603515625, -4.56201171875, -4.38958740234375, -4.2171630859375, -4.04473876953125, -3.872314453125, -3.69989013671875, -3.5274658203125, -3.35504150390625, -3.1826171875, -3.01019287109375, -2.8377685546875, -2.66534423828125, -2.492919921875, -2.32049560546875, -2.1480712890625, -1.97564697265625, -1.80322265625, -1.63079833984375, -1.4583740234375, -1.28594970703125, -1.113525390625, -0.94110107421875, -0.7686767578125, -0.59625244140625, -0.423828125, -0.25140380859375, -0.0789794921875, 0.09344482421875, 0.265869140625, 0.43829345703125, 0.6107177734375, 0.78314208984375, 0.95556640625, 1.12799072265625, 1.3004150390625, 1.47283935546875, 1.645263671875, 1.81768798828125, 1.9901123046875, 2.16253662109375, 2.3349609375, 2.50738525390625, 2.6798095703125, 2.85223388671875, 3.024658203125, 3.19708251953125, 3.3695068359375, 3.54193115234375, 3.71435546875, 3.88677978515625, 4.0592041015625, 4.23162841796875, 4.404052734375, 4.57647705078125, 4.7489013671875, 4.92132568359375, 5.09375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 13.0, 20.0, 31.0, 40.0, 81.0, 94.0, 124.0, 246.0, 343.0, 463.0, 698.0, 1057.0, 1591.0, 2304.0, 3283.0, 4812.0, 7174.0, 10451.0, 15157.0, 22409.0, 33935.0, 1852723.0, 55815.0, 26643.0, 17984.0, 12733.0, 8598.0, 5840.0, 3994.0, 2688.0, 1854.0, 1271.0, 883.0, 596.0, 400.0, 264.0, 181.0, 112.0, 78.0, 51.0, 37.0, 24.0, 19.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6787109375, -1.6289520263671875, -1.579193115234375, -1.5294342041015625, -1.47967529296875, -1.4299163818359375, -1.380157470703125, -1.3303985595703125, -1.2806396484375, -1.2308807373046875, -1.181121826171875, -1.1313629150390625, -1.08160400390625, -1.0318450927734375, -0.982086181640625, -0.9323272705078125, -0.882568359375, -0.8328094482421875, -0.783050537109375, -0.7332916259765625, -0.68353271484375, -0.6337738037109375, -0.584014892578125, -0.5342559814453125, -0.4844970703125, -0.4347381591796875, -0.384979248046875, -0.3352203369140625, -0.28546142578125, -0.2357025146484375, -0.185943603515625, -0.1361846923828125, -0.08642578125, -0.0366668701171875, 0.013092041015625, 0.0628509521484375, 0.11260986328125, 0.1623687744140625, 0.212127685546875, 0.2618865966796875, 0.3116455078125, 0.3614044189453125, 0.411163330078125, 0.4609222412109375, 0.51068115234375, 0.5604400634765625, 0.610198974609375, 0.6599578857421875, 0.709716796875, 0.7594757080078125, 0.809234619140625, 0.8589935302734375, 0.90875244140625, 0.9585113525390625, 1.008270263671875, 1.0580291748046875, 1.1077880859375, 1.1575469970703125, 1.207305908203125, 1.2570648193359375, 1.30682373046875, 1.3565826416015625, 1.406341552734375, 1.4561004638671875, 1.505859375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 8.0, 8.0, 6.0, 4.0, 8.0, 12.0, 14.0, 20.0, 13.0, 18.0, 19.0, 39.0, 37.0, 60.0, 72.0, 109.0, 106.0, 86.0, 52.0, 36.0, 35.0, 40.0, 29.0, 23.0, 26.0, 14.0, 11.0, 12.0, 15.0, 10.0, 9.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.036529541015625, -0.03542327880859375, -0.0343170166015625, -0.03321075439453125, -0.0321044921875, -0.03099822998046875, -0.0298919677734375, -0.02878570556640625, -0.027679443359375, -0.02657318115234375, -0.0254669189453125, -0.02436065673828125, -0.02325439453125, -0.02214813232421875, -0.0210418701171875, -0.01993560791015625, -0.018829345703125, -0.01772308349609375, -0.0166168212890625, -0.01551055908203125, -0.014404296875, -0.01329803466796875, -0.0121917724609375, -0.01108551025390625, -0.009979248046875, -0.00887298583984375, -0.0077667236328125, -0.00666046142578125, -0.00555419921875, -0.00444793701171875, -0.0033416748046875, -0.00223541259765625, -0.001129150390625, -2.288818359375e-05, 0.0010833740234375, 0.00218963623046875, 0.0032958984375, 0.00440216064453125, 0.0055084228515625, 0.00661468505859375, 0.007720947265625, 0.00882720947265625, 0.0099334716796875, 0.01103973388671875, 0.01214599609375, 0.01325225830078125, 0.0143585205078125, 0.01546478271484375, 0.016571044921875, 0.01767730712890625, 0.0187835693359375, 0.01988983154296875, 0.02099609375, 0.02210235595703125, 0.0232086181640625, 0.02431488037109375, 0.025421142578125, 0.02652740478515625, 0.0276336669921875, 0.02873992919921875, 0.02984619140625, 0.03095245361328125, 0.0320587158203125, 0.03316497802734375, 0.034271240234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 0.0, 6.0, 5.0, 7.0, 8.0, 9.0, 9.0, 12.0, 19.0, 20.0, 29.0, 34.0, 36.0, 63.0, 71.0, 106.0, 141.0, 192.0, 284.0, 634.0, 1718.0, 977817.0, 65110.0, 916.0, 452.0, 266.0, 161.0, 102.0, 60.0, 48.0, 56.0, 38.0, 19.0, 21.0, 18.0, 9.0, 13.0, 7.0, 8.0, 8.0, 1.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.65869140625, -0.6373138427734375, -0.615936279296875, -0.5945587158203125, -0.57318115234375, -0.5518035888671875, -0.530426025390625, -0.5090484619140625, -0.4876708984375, -0.4662933349609375, -0.444915771484375, -0.4235382080078125, -0.40216064453125, -0.3807830810546875, -0.359405517578125, -0.3380279541015625, -0.316650390625, -0.2952728271484375, -0.273895263671875, -0.2525177001953125, -0.23114013671875, -0.2097625732421875, -0.188385009765625, -0.1670074462890625, -0.1456298828125, -0.1242523193359375, -0.102874755859375, -0.0814971923828125, -0.06011962890625, -0.0387420654296875, -0.017364501953125, 0.0040130615234375, 0.025390625, 0.0467681884765625, 0.068145751953125, 0.0895233154296875, 0.11090087890625, 0.1322784423828125, 0.153656005859375, 0.1750335693359375, 0.1964111328125, 0.2177886962890625, 0.239166259765625, 0.2605438232421875, 0.28192138671875, 0.3032989501953125, 0.324676513671875, 0.3460540771484375, 0.367431640625, 0.3888092041015625, 0.410186767578125, 0.4315643310546875, 0.45294189453125, 0.4743194580078125, 0.495697021484375, 0.5170745849609375, 0.5384521484375, 0.5598297119140625, 0.581207275390625, 0.6025848388671875, 0.62396240234375, 0.6453399658203125, 0.666717529296875, 0.6880950927734375, 0.70947265625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 360.0, 653.0], "bins": [-1.1560038328170776, -1.1376762390136719, -1.1193487644195557, -1.10102117061615, -1.0826935768127441, -1.0643659830093384, -1.0460383892059326, -1.0277109146118164, -1.0093833208084106, -0.9910557270050049, -0.9727281928062439, -0.9544006586074829, -0.9360730648040771, -0.9177454710006714, -0.8994179368019104, -0.8810904026031494, -0.8627628087997437, -0.8444352149963379, -0.8261076807975769, -0.8077801465988159, -0.7894525527954102, -0.7711249589920044, -0.7527974247932434, -0.7344698905944824, -0.7161422967910767, -0.6978147029876709, -0.6794871687889099, -0.6611596345901489, -0.6428320407867432, -0.6245044469833374, -0.6061769127845764, -0.5878493785858154, -0.5695217847824097, -0.5511941909790039, -0.5328666567802429, -0.5145391225814819, -0.49621152877807617, -0.4778839647769928, -0.4595564007759094, -0.44122883677482605, -0.42290130257606506, -0.4045737385749817, -0.3862461745738983, -0.36791861057281494, -0.34959104657173157, -0.3312634825706482, -0.3129359185695648, -0.29460835456848145, -0.27628079056739807, -0.2579532265663147, -0.23962566256523132, -0.22129809856414795, -0.20297053456306458, -0.1846429705619812, -0.16631540656089783, -0.14798784255981445, -0.12966027855873108, -0.1113327145576477, -0.09300515055656433, -0.07467758655548096, -0.05635002255439758, -0.03802245855331421, -0.019694894552230835, -0.001367330551147461, 0.01696023903787136]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 3.0, 9.0, 11.0, 19.0, 19.0, 25.0, 25.0, 32.0, 41.0, 37.0, 44.0, 33.0, 52.0, 47.0, 76.0, 52.0, 45.0, 56.0, 45.0, 44.0, 41.0, 37.0, 40.0, 38.0, 27.0, 14.0, 19.0, 11.0, 10.0, 13.0, 13.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08116167783737183, -0.07875660806894302, -0.07635153830051422, -0.07394647598266602, -0.07154140621423721, -0.06913633644580841, -0.0667312741279602, -0.0643262043595314, -0.0619211345911026, -0.0595160648226738, -0.057110998779535294, -0.05470593273639679, -0.05230086296796799, -0.049895793199539185, -0.04749072715640068, -0.045085661113262177, -0.042680591344833374, -0.04027552157640457, -0.03787045553326607, -0.035465389490127563, -0.03306031972169876, -0.030655251815915108, -0.028250183910131454, -0.0258451160043478, -0.023440048098564148, -0.021034980192780495, -0.01862991228699684, -0.016224844381213188, -0.013819776475429535, -0.011414708569645882, -0.009009640663862228, -0.006604572758078575, -0.004199504852294922, -0.0017944369465112686, 0.0006106309592723846, 0.003015698865056038, 0.005420766770839691, 0.007825834676623344, 0.010230902582406998, 0.012635970488190651, 0.015041038393974304, 0.017446106299757957, 0.01985117420554161, 0.022256242111325264, 0.024661310017108917, 0.02706637792289257, 0.029471445828676224, 0.03187651187181473, 0.03428158164024353, 0.03668665140867233, 0.03909171745181084, 0.04149678349494934, 0.04390185326337814, 0.046306923031806946, 0.04871198907494545, 0.051117055118083954, 0.053522124886512756, 0.05592719465494156, 0.05833226069808006, 0.06073732674121857, 0.06314239650964737, 0.06554746627807617, 0.06795252859592438, 0.07035759836435318, 0.07276266813278198]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 9.0, 8.0, 9.0, 15.0, 16.0, 17.0, 14.0, 23.0, 27.0, 25.0, 28.0, 23.0, 31.0, 40.0, 36.0, 41.0, 37.0, 45.0, 47.0, 40.0, 47.0, 35.0, 45.0, 24.0, 48.0, 26.0, 32.0, 31.0, 24.0, 29.0, 17.0, 23.0, 14.0, 14.0, 7.0, 14.0, 10.0, 7.0, 2.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.950439453125, -6.71728515625, -6.484130859375, -6.2509765625, -6.017822265625, -5.78466796875, -5.551513671875, -5.318359375, -5.085205078125, -4.85205078125, -4.618896484375, -4.3857421875, -4.152587890625, -3.91943359375, -3.686279296875, -3.453125, -3.219970703125, -2.98681640625, -2.753662109375, -2.5205078125, -2.287353515625, -2.05419921875, -1.821044921875, -1.587890625, -1.354736328125, -1.12158203125, -0.888427734375, -0.6552734375, -0.422119140625, -0.18896484375, 0.044189453125, 0.27734375, 0.510498046875, 0.74365234375, 0.976806640625, 1.2099609375, 1.443115234375, 1.67626953125, 1.909423828125, 2.142578125, 2.375732421875, 2.60888671875, 2.842041015625, 3.0751953125, 3.308349609375, 3.54150390625, 3.774658203125, 4.0078125, 4.240966796875, 4.47412109375, 4.707275390625, 4.9404296875, 5.173583984375, 5.40673828125, 5.639892578125, 5.873046875, 6.106201171875, 6.33935546875, 6.572509765625, 6.8056640625, 7.038818359375, 7.27197265625, 7.505126953125, 7.73828125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 9.0, 9.0, 12.0, 12.0, 29.0, 28.0, 62.0, 62.0, 91.0, 108.0, 189.0, 267.0, 422.0, 574.0, 994.0, 1644.0, 3222.0, 7161.0, 18860.0, 59093.0, 205406.0, 497068.0, 172256.0, 50609.0, 16819.0, 6459.0, 2854.0, 1569.0, 873.0, 573.0, 344.0, 250.0, 169.0, 151.0, 86.0, 68.0, 33.0, 39.0, 22.0, 12.0, 15.0, 7.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6171875, -12.2158203125, -11.814453125, -11.4130859375, -11.01171875, -10.6103515625, -10.208984375, -9.8076171875, -9.40625, -9.0048828125, -8.603515625, -8.2021484375, -7.80078125, -7.3994140625, -6.998046875, -6.5966796875, -6.1953125, -5.7939453125, -5.392578125, -4.9912109375, -4.58984375, -4.1884765625, -3.787109375, -3.3857421875, -2.984375, -2.5830078125, -2.181640625, -1.7802734375, -1.37890625, -0.9775390625, -0.576171875, -0.1748046875, 0.2265625, 0.6279296875, 1.029296875, 1.4306640625, 1.83203125, 2.2333984375, 2.634765625, 3.0361328125, 3.4375, 3.8388671875, 4.240234375, 4.6416015625, 5.04296875, 5.4443359375, 5.845703125, 6.2470703125, 6.6484375, 7.0498046875, 7.451171875, 7.8525390625, 8.25390625, 8.6552734375, 9.056640625, 9.4580078125, 9.859375, 10.2607421875, 10.662109375, 11.0634765625, 11.46484375, 11.8662109375, 12.267578125, 12.6689453125, 13.0703125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 12.0, 8.0, 12.0, 12.0, 12.0, 26.0, 20.0, 32.0, 38.0, 34.0, 24.0, 56.0, 77.0, 129.0, 234.0, 1473.0, 266.0, 138.0, 70.0, 60.0, 51.0, 36.0, 25.0, 20.0, 26.0, 26.0, 25.0, 15.0, 16.0, 11.0, 6.0, 12.0, 5.0, 4.0, 4.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.32861328125, -17.6884765625, -17.04833984375, -16.408203125, -15.76806640625, -15.1279296875, -14.48779296875, -13.84765625, -13.20751953125, -12.5673828125, -11.92724609375, -11.287109375, -10.64697265625, -10.0068359375, -9.36669921875, -8.7265625, -8.08642578125, -7.4462890625, -6.80615234375, -6.166015625, -5.52587890625, -4.8857421875, -4.24560546875, -3.60546875, -2.96533203125, -2.3251953125, -1.68505859375, -1.044921875, -0.40478515625, 0.2353515625, 0.87548828125, 1.515625, 2.15576171875, 2.7958984375, 3.43603515625, 4.076171875, 4.71630859375, 5.3564453125, 5.99658203125, 6.63671875, 7.27685546875, 7.9169921875, 8.55712890625, 9.197265625, 9.83740234375, 10.4775390625, 11.11767578125, 11.7578125, 12.39794921875, 13.0380859375, 13.67822265625, 14.318359375, 14.95849609375, 15.5986328125, 16.23876953125, 16.87890625, 17.51904296875, 18.1591796875, 18.79931640625, 19.439453125, 20.07958984375, 20.7197265625, 21.35986328125, 22.0]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 9.0, 6.0, 7.0, 14.0, 17.0, 17.0, 30.0, 32.0, 43.0, 66.0, 103.0, 166.0, 227.0, 360.0, 500.0, 1115.0, 5859.0, 3101946.0, 31799.0, 1576.0, 640.0, 360.0, 244.0, 179.0, 97.0, 66.0, 73.0, 48.0, 22.0, 24.0, 15.0, 15.0, 10.0, 4.0, 4.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.625, -65.4892578125, -63.353515625, -61.2177734375, -59.08203125, -56.9462890625, -54.810546875, -52.6748046875, -50.5390625, -48.4033203125, -46.267578125, -44.1318359375, -41.99609375, -39.8603515625, -37.724609375, -35.5888671875, -33.453125, -31.3173828125, -29.181640625, -27.0458984375, -24.91015625, -22.7744140625, -20.638671875, -18.5029296875, -16.3671875, -14.2314453125, -12.095703125, -9.9599609375, -7.82421875, -5.6884765625, -3.552734375, -1.4169921875, 0.71875, 2.8544921875, 4.990234375, 7.1259765625, 9.26171875, 11.3974609375, 13.533203125, 15.6689453125, 17.8046875, 19.9404296875, 22.076171875, 24.2119140625, 26.34765625, 28.4833984375, 30.619140625, 32.7548828125, 34.890625, 37.0263671875, 39.162109375, 41.2978515625, 43.43359375, 45.5693359375, 47.705078125, 49.8408203125, 51.9765625, 54.1123046875, 56.248046875, 58.3837890625, 60.51953125, 62.6552734375, 64.791015625, 66.9267578125, 69.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 78.0, 432.0, 415.0, 79.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.582401275634766, -47.781394958496094, -40.98039245605469, -34.179386138916016, -27.378381729125977, -20.577377319335938, -13.776371002197266, -6.975368499755859, -0.1743621826171875, 6.62664270401001, 13.427647590637207, 20.228652954101562, 27.0296573638916, 33.83066177368164, 40.63166809082031, 47.43267059326172, 54.23367691040039, 61.03468322753906, 67.83568572998047, 74.63668823242188, 81.43769836425781, 88.23870086669922, 95.03970336914062, 101.84071350097656, 108.64171600341797, 115.44271850585938, 122.24372863769531, 129.04473876953125, 135.84573364257812, 142.64674377441406, 149.44775390625, 156.24874877929688, 163.0497589111328, 169.85076904296875, 176.65176391601562, 183.45277404785156, 190.2537841796875, 197.05477905273438, 203.8557891845703, 210.65679931640625, 217.45779418945312, 224.25880432128906, 231.05979919433594, 237.86080932617188, 244.6618194580078, 251.4628143310547, 258.2638244628906, 265.0648193359375, 271.8658447265625, 278.6668395996094, 285.4678649902344, 292.26885986328125, 299.0698547363281, 305.8708801269531, 312.671875, 319.4728698730469, 326.27386474609375, 333.0748596191406, 339.8758850097656, 346.6768798828125, 353.4778747558594, 360.2789001464844, 367.07989501953125, 373.8808898925781, 380.6819152832031]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 6.0, 5.0, 10.0, 12.0, 16.0, 12.0, 20.0, 23.0, 21.0, 24.0, 25.0, 31.0, 33.0, 37.0, 44.0, 41.0, 34.0, 33.0, 50.0, 40.0, 42.0, 39.0, 46.0, 40.0, 27.0, 29.0, 40.0, 35.0, 29.0, 22.0, 12.0, 19.0, 20.0, 15.0, 8.0, 11.0, 13.0, 5.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-59.57758331298828, -57.76750183105469, -55.95741653442383, -54.147335052490234, -52.337249755859375, -50.52716827392578, -48.71708679199219, -46.90700149536133, -45.096920013427734, -43.28683853149414, -41.47675323486328, -39.66667175292969, -37.85658645629883, -36.046504974365234, -34.236419677734375, -32.42633819580078, -30.616254806518555, -28.806171417236328, -26.9960880279541, -25.186004638671875, -23.37592315673828, -21.565839767456055, -19.755756378173828, -17.945674896240234, -16.135589599609375, -14.325506210327148, -12.515423774719238, -10.705340385437012, -8.895257949829102, -7.085174560546875, -5.275091171264648, -3.4650087356567383, -1.6549263000488281, 0.15515673160552979, 1.9652397632598877, 3.775322914123535, 5.5854058265686035, 7.395488739013672, 9.205572128295898, 11.015654563903809, 12.825737953186035, 14.635821342468262, 16.445903778076172, 18.2559871673584, 20.066070556640625, 21.87615203857422, 23.686237335205078, 25.496318817138672, 27.3064022064209, 29.116485595703125, 30.92656898498535, 32.73665237426758, 34.54673385620117, 36.35681915283203, 38.166900634765625, 39.97698211669922, 41.78706741333008, 43.59714889526367, 45.40723419189453, 47.217315673828125, 49.027400970458984, 50.83748245239258, 52.64756774902344, 54.45764923095703, 56.267730712890625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 14.0, 6.0, 10.0, 18.0, 9.0, 14.0, 13.0, 21.0, 30.0, 32.0, 27.0, 22.0, 44.0, 40.0, 49.0, 39.0, 43.0, 57.0, 43.0, 42.0, 43.0, 49.0, 48.0, 45.0, 39.0, 29.0, 26.0, 24.0, 20.0, 18.0, 11.0, 13.0, 9.0, 12.0, 6.0, 9.0, 8.0, 6.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.9140625, -8.643310546875, -8.37255859375, -8.101806640625, -7.8310546875, -7.560302734375, -7.28955078125, -7.018798828125, -6.748046875, -6.477294921875, -6.20654296875, -5.935791015625, -5.6650390625, -5.394287109375, -5.12353515625, -4.852783203125, -4.58203125, -4.311279296875, -4.04052734375, -3.769775390625, -3.4990234375, -3.228271484375, -2.95751953125, -2.686767578125, -2.416015625, -2.145263671875, -1.87451171875, -1.603759765625, -1.3330078125, -1.062255859375, -0.79150390625, -0.520751953125, -0.25, 0.020751953125, 0.29150390625, 0.562255859375, 0.8330078125, 1.103759765625, 1.37451171875, 1.645263671875, 1.916015625, 2.186767578125, 2.45751953125, 2.728271484375, 2.9990234375, 3.269775390625, 3.54052734375, 3.811279296875, 4.08203125, 4.352783203125, 4.62353515625, 4.894287109375, 5.1650390625, 5.435791015625, 5.70654296875, 5.977294921875, 6.248046875, 6.518798828125, 6.78955078125, 7.060302734375, 7.3310546875, 7.601806640625, 7.87255859375, 8.143310546875, 8.4140625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 11.0, 16.0, 24.0, 47.0, 50.0, 104.0, 183.0, 306.0, 564.0, 943.0, 1793.0, 3571.0, 7818.0, 20576.0, 72855.0, 330905.0, 1163110.0, 1715234.0, 660140.0, 155833.0, 36914.0, 12448.0, 5238.0, 2630.0, 1243.0, 700.0, 444.0, 238.0, 146.0, 76.0, 45.0, 26.0, 16.0, 16.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5625, -9.1982421875, -8.833984375, -8.4697265625, -8.10546875, -7.7412109375, -7.376953125, -7.0126953125, -6.6484375, -6.2841796875, -5.919921875, -5.5556640625, -5.19140625, -4.8271484375, -4.462890625, -4.0986328125, -3.734375, -3.3701171875, -3.005859375, -2.6416015625, -2.27734375, -1.9130859375, -1.548828125, -1.1845703125, -0.8203125, -0.4560546875, -0.091796875, 0.2724609375, 0.63671875, 1.0009765625, 1.365234375, 1.7294921875, 2.09375, 2.4580078125, 2.822265625, 3.1865234375, 3.55078125, 3.9150390625, 4.279296875, 4.6435546875, 5.0078125, 5.3720703125, 5.736328125, 6.1005859375, 6.46484375, 6.8291015625, 7.193359375, 7.5576171875, 7.921875, 8.2861328125, 8.650390625, 9.0146484375, 9.37890625, 9.7431640625, 10.107421875, 10.4716796875, 10.8359375, 11.2001953125, 11.564453125, 11.9287109375, 12.29296875, 12.6572265625, 13.021484375, 13.3857421875, 13.75]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 12.0, 18.0, 19.0, 13.0, 24.0, 44.0, 53.0, 81.0, 99.0, 170.0, 211.0, 263.0, 363.0, 409.0, 469.0, 450.0, 328.0, 258.0, 221.0, 155.0, 109.0, 80.0, 73.0, 38.0, 35.0, 21.0, 15.0, 11.0, 11.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7265625, -13.3165283203125, -12.906494140625, -12.4964599609375, -12.08642578125, -11.6763916015625, -11.266357421875, -10.8563232421875, -10.4462890625, -10.0362548828125, -9.626220703125, -9.2161865234375, -8.80615234375, -8.3961181640625, -7.986083984375, -7.5760498046875, -7.166015625, -6.7559814453125, -6.345947265625, -5.9359130859375, -5.52587890625, -5.1158447265625, -4.705810546875, -4.2957763671875, -3.8857421875, -3.4757080078125, -3.065673828125, -2.6556396484375, -2.24560546875, -1.8355712890625, -1.425537109375, -1.0155029296875, -0.60546875, -0.1954345703125, 0.214599609375, 0.6246337890625, 1.03466796875, 1.4447021484375, 1.854736328125, 2.2647705078125, 2.6748046875, 3.0848388671875, 3.494873046875, 3.9049072265625, 4.31494140625, 4.7249755859375, 5.135009765625, 5.5450439453125, 5.955078125, 6.3651123046875, 6.775146484375, 7.1851806640625, 7.59521484375, 8.0052490234375, 8.415283203125, 8.8253173828125, 9.2353515625, 9.6453857421875, 10.055419921875, 10.4654541015625, 10.87548828125, 11.2855224609375, 11.695556640625, 12.1055908203125, 12.515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 2.0, 9.0, 9.0, 14.0, 20.0, 24.0, 51.0, 59.0, 94.0, 154.0, 260.0, 493.0, 1060.0, 2601.0, 10287.0, 186183.0, 3331619.0, 633701.0, 21065.0, 3818.0, 1348.0, 595.0, 323.0, 165.0, 100.0, 66.0, 37.0, 41.0, 26.0, 18.0, 14.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.73095703125, -23.8681640625, -23.00537109375, -22.142578125, -21.27978515625, -20.4169921875, -19.55419921875, -18.69140625, -17.82861328125, -16.9658203125, -16.10302734375, -15.240234375, -14.37744140625, -13.5146484375, -12.65185546875, -11.7890625, -10.92626953125, -10.0634765625, -9.20068359375, -8.337890625, -7.47509765625, -6.6123046875, -5.74951171875, -4.88671875, -4.02392578125, -3.1611328125, -2.29833984375, -1.435546875, -0.57275390625, 0.2900390625, 1.15283203125, 2.015625, 2.87841796875, 3.7412109375, 4.60400390625, 5.466796875, 6.32958984375, 7.1923828125, 8.05517578125, 8.91796875, 9.78076171875, 10.6435546875, 11.50634765625, 12.369140625, 13.23193359375, 14.0947265625, 14.95751953125, 15.8203125, 16.68310546875, 17.5458984375, 18.40869140625, 19.271484375, 20.13427734375, 20.9970703125, 21.85986328125, 22.72265625, 23.58544921875, 24.4482421875, 25.31103515625, 26.173828125, 27.03662109375, 27.8994140625, 28.76220703125, 29.625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 181.0, 690.0, 138.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.8671417236328, -217.4376220703125, -205.00808715820312, -192.5785675048828, -180.14903259277344, -167.71951293945312, -155.28997802734375, -142.86045837402344, -130.43093872070312, -118.00141143798828, -105.57188415527344, -93.14236450195312, -80.71282958984375, -68.28330993652344, -55.853782653808594, -43.42425537109375, -30.994720458984375, -18.56519317626953, -6.13566780090332, 6.293857574462891, 18.723384857177734, 31.152912139892578, 43.582435607910156, 56.011962890625, 68.44149017333984, 80.87101745605469, 93.30054473876953, 105.73007202148438, 118.15959167480469, 130.58912658691406, 143.01864624023438, 155.44818115234375, 167.87771606445312, 180.30723571777344, 192.7367706298828, 205.16629028320312, 217.5958251953125, 230.0253448486328, 242.45486450195312, 254.8843994140625, 267.3139343261719, 279.74346923828125, 292.1729736328125, 304.6025085449219, 317.03204345703125, 329.4615783691406, 341.8910827636719, 354.32061767578125, 366.7501220703125, 379.1796569824219, 391.6091613769531, 404.0386962890625, 416.4682312011719, 428.89776611328125, 441.3272705078125, 453.7568054199219, 466.18634033203125, 478.6158752441406, 491.0453796386719, 503.47491455078125, 515.9044189453125, 528.333984375, 540.7634887695312, 553.1929931640625, 565.62255859375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 8.0, 19.0, 12.0, 22.0, 23.0, 25.0, 25.0, 29.0, 54.0, 51.0, 49.0, 51.0, 67.0, 70.0, 52.0, 68.0, 47.0, 54.0, 41.0, 30.0, 34.0, 28.0, 33.0, 30.0, 21.0, 17.0, 10.0, 8.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.29891967773438, -62.327781677246094, -60.35664749145508, -58.38551330566406, -56.41437530517578, -54.4432373046875, -52.472103118896484, -50.50096893310547, -48.52983093261719, -46.558692932128906, -44.58755874633789, -42.616424560546875, -40.645286560058594, -38.67414855957031, -36.7030143737793, -34.73188018798828, -32.7607421875, -30.78960609436035, -28.818470001220703, -26.847333908081055, -24.876197814941406, -22.905061721801758, -20.93392562866211, -18.96278953552246, -16.991653442382812, -15.020517349243164, -13.049381256103516, -11.078245162963867, -9.107109069824219, -7.13597297668457, -5.164836883544922, -3.1937007904052734, -1.222564697265625, 0.7485713958740234, 2.719707489013672, 4.69084358215332, 6.661979675292969, 8.633115768432617, 10.604251861572266, 12.575387954711914, 14.546524047851562, 16.51766014099121, 18.48879623413086, 20.459932327270508, 22.431068420410156, 24.402204513549805, 26.373340606689453, 28.3444766998291, 30.31561279296875, 32.28675079345703, 34.25788497924805, 36.22901916503906, 38.200157165527344, 40.171295166015625, 42.14242935180664, 44.113563537597656, 46.08470153808594, 48.05583953857422, 50.026973724365234, 51.99810791015625, 53.96924591064453, 55.94038391113281, 57.91151809692383, 59.882652282714844, 61.853790283203125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 13.0, 7.0, 11.0, 16.0, 22.0, 23.0, 24.0, 22.0, 20.0, 39.0, 32.0, 34.0, 36.0, 45.0, 35.0, 51.0, 45.0, 43.0, 39.0, 48.0, 48.0, 40.0, 40.0, 35.0, 32.0, 35.0, 27.0, 21.0, 26.0, 19.0, 12.0, 13.0, 8.0, 8.0, 1.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.23046875, -7.01666259765625, -6.8028564453125, -6.58905029296875, -6.375244140625, -6.16143798828125, -5.9476318359375, -5.73382568359375, -5.52001953125, -5.30621337890625, -5.0924072265625, -4.87860107421875, -4.664794921875, -4.45098876953125, -4.2371826171875, -4.02337646484375, -3.8095703125, -3.59576416015625, -3.3819580078125, -3.16815185546875, -2.954345703125, -2.74053955078125, -2.5267333984375, -2.31292724609375, -2.09912109375, -1.88531494140625, -1.6715087890625, -1.45770263671875, -1.243896484375, -1.03009033203125, -0.8162841796875, -0.60247802734375, -0.388671875, -0.17486572265625, 0.0389404296875, 0.25274658203125, 0.466552734375, 0.68035888671875, 0.8941650390625, 1.10797119140625, 1.32177734375, 1.53558349609375, 1.7493896484375, 1.96319580078125, 2.177001953125, 2.39080810546875, 2.6046142578125, 2.81842041015625, 3.0322265625, 3.24603271484375, 3.4598388671875, 3.67364501953125, 3.887451171875, 4.10125732421875, 4.3150634765625, 4.52886962890625, 4.74267578125, 4.95648193359375, 5.1702880859375, 5.38409423828125, 5.597900390625, 5.81170654296875, 6.0255126953125, 6.23931884765625, 6.453125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 9.0, 23.0, 26.0, 28.0, 41.0, 88.0, 130.0, 216.0, 330.0, 536.0, 865.0, 1376.0, 2070.0, 3381.0, 5402.0, 8477.0, 13414.0, 20479.0, 31316.0, 46330.0, 66445.0, 89551.0, 113484.0, 128533.0, 127974.0, 110616.0, 86266.0, 63367.0, 44615.0, 29569.0, 19165.0, 12648.0, 7932.0, 5196.0, 3128.0, 1980.0, 1316.0, 817.0, 550.0, 302.0, 214.0, 126.0, 70.0, 62.0, 30.0, 23.0, 8.0, 12.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.7177734375, -0.6952972412109375, -0.672821044921875, -0.6503448486328125, -0.62786865234375, -0.6053924560546875, -0.582916259765625, -0.5604400634765625, -0.5379638671875, -0.5154876708984375, -0.493011474609375, -0.4705352783203125, -0.44805908203125, -0.4255828857421875, -0.403106689453125, -0.3806304931640625, -0.358154296875, -0.3356781005859375, -0.313201904296875, -0.2907257080078125, -0.26824951171875, -0.2457733154296875, -0.223297119140625, -0.2008209228515625, -0.1783447265625, -0.1558685302734375, -0.133392333984375, -0.1109161376953125, -0.08843994140625, -0.0659637451171875, -0.043487548828125, -0.0210113525390625, 0.00146484375, 0.0239410400390625, 0.046417236328125, 0.0688934326171875, 0.09136962890625, 0.1138458251953125, 0.136322021484375, 0.1587982177734375, 0.1812744140625, 0.2037506103515625, 0.226226806640625, 0.2487030029296875, 0.27117919921875, 0.2936553955078125, 0.316131591796875, 0.3386077880859375, 0.361083984375, 0.3835601806640625, 0.406036376953125, 0.4285125732421875, 0.45098876953125, 0.4734649658203125, 0.495941162109375, 0.5184173583984375, 0.5408935546875, 0.5633697509765625, 0.585845947265625, 0.6083221435546875, 0.63079833984375, 0.6532745361328125, 0.675750732421875, 0.6982269287109375, 0.720703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 7.0, 13.0, 13.0, 15.0, 13.0, 17.0, 14.0, 15.0, 26.0, 26.0, 41.0, 36.0, 41.0, 31.0, 44.0, 53.0, 38.0, 1069.0, 36.0, 45.0, 43.0, 51.0, 36.0, 34.0, 38.0, 40.0, 31.0, 23.0, 19.0, 18.0, 16.0, 15.0, 12.0, 8.0, 13.0, 4.0, 6.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.44921875, -5.2969970703125, -5.144775390625, -4.9925537109375, -4.84033203125, -4.6881103515625, -4.535888671875, -4.3836669921875, -4.2314453125, -4.0792236328125, -3.927001953125, -3.7747802734375, -3.62255859375, -3.4703369140625, -3.318115234375, -3.1658935546875, -3.013671875, -2.8614501953125, -2.709228515625, -2.5570068359375, -2.40478515625, -2.2525634765625, -2.100341796875, -1.9481201171875, -1.7958984375, -1.6436767578125, -1.491455078125, -1.3392333984375, -1.18701171875, -1.0347900390625, -0.882568359375, -0.7303466796875, -0.578125, -0.4259033203125, -0.273681640625, -0.1214599609375, 0.03076171875, 0.1829833984375, 0.335205078125, 0.4874267578125, 0.6396484375, 0.7918701171875, 0.944091796875, 1.0963134765625, 1.24853515625, 1.4007568359375, 1.552978515625, 1.7052001953125, 1.857421875, 2.0096435546875, 2.161865234375, 2.3140869140625, 2.46630859375, 2.6185302734375, 2.770751953125, 2.9229736328125, 3.0751953125, 3.2274169921875, 3.379638671875, 3.5318603515625, 3.68408203125, 3.8363037109375, 3.988525390625, 4.1407470703125, 4.29296875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 5.0, 6.0, 24.0, 24.0, 32.0, 50.0, 66.0, 120.0, 159.0, 260.0, 354.0, 515.0, 803.0, 1281.0, 1850.0, 2860.0, 4133.0, 6499.0, 9662.0, 14308.0, 21788.0, 33101.0, 1835774.0, 78503.0, 28407.0, 18748.0, 12631.0, 8179.0, 5619.0, 3779.0, 2488.0, 1717.0, 1090.0, 800.0, 485.0, 320.0, 218.0, 162.0, 97.0, 64.0, 54.0, 28.0, 24.0, 8.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.615234375, -1.5674896240234375, -1.519744873046875, -1.4720001220703125, -1.42425537109375, -1.3765106201171875, -1.328765869140625, -1.2810211181640625, -1.2332763671875, -1.1855316162109375, -1.137786865234375, -1.0900421142578125, -1.04229736328125, -0.9945526123046875, -0.946807861328125, -0.8990631103515625, -0.851318359375, -0.8035736083984375, -0.755828857421875, -0.7080841064453125, -0.66033935546875, -0.6125946044921875, -0.564849853515625, -0.5171051025390625, -0.4693603515625, -0.4216156005859375, -0.373870849609375, -0.3261260986328125, -0.27838134765625, -0.2306365966796875, -0.182891845703125, -0.1351470947265625, -0.08740234375, -0.0396575927734375, 0.008087158203125, 0.0558319091796875, 0.10357666015625, 0.1513214111328125, 0.199066162109375, 0.2468109130859375, 0.2945556640625, 0.3423004150390625, 0.390045166015625, 0.4377899169921875, 0.48553466796875, 0.5332794189453125, 0.581024169921875, 0.6287689208984375, 0.676513671875, 0.7242584228515625, 0.772003173828125, 0.8197479248046875, 0.86749267578125, 0.9152374267578125, 0.962982177734375, 1.0107269287109375, 1.0584716796875, 1.1062164306640625, 1.153961181640625, 1.2017059326171875, 1.24945068359375, 1.2971954345703125, 1.344940185546875, 1.3926849365234375, 1.4404296875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 10.0, 9.0, 24.0, 40.0, 52.0, 83.0, 99.0, 112.0, 123.0, 131.0, 99.0, 79.0, 52.0, 32.0, 18.0, 14.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0406494140625, -0.03931236267089844, -0.037975311279296875, -0.03663825988769531, -0.03530120849609375, -0.03396415710449219, -0.032627105712890625, -0.03129005432128906, -0.0299530029296875, -0.028615951538085938, -0.027278900146484375, -0.025941848754882812, -0.02460479736328125, -0.023267745971679688, -0.021930694580078125, -0.020593643188476562, -0.019256591796875, -0.017919540405273438, -0.016582489013671875, -0.015245437622070312, -0.01390838623046875, -0.012571334838867188, -0.011234283447265625, -0.009897232055664062, -0.0085601806640625, -0.0072231292724609375, -0.005886077880859375, -0.0045490264892578125, -0.00321197509765625, -0.0018749237060546875, -0.000537872314453125, 0.0007991790771484375, 0.00213623046875, 0.0034732818603515625, 0.004810333251953125, 0.0061473846435546875, 0.00748443603515625, 0.008821487426757812, 0.010158538818359375, 0.011495590209960938, 0.0128326416015625, 0.014169692993164062, 0.015506744384765625, 0.016843795776367188, 0.01818084716796875, 0.019517898559570312, 0.020854949951171875, 0.022192001342773438, 0.023529052734375, 0.024866104125976562, 0.026203155517578125, 0.027540206909179688, 0.02887725830078125, 0.030214309692382812, 0.031551361083984375, 0.03288841247558594, 0.0342254638671875, 0.03556251525878906, 0.036899566650390625, 0.03823661804199219, 0.03957366943359375, 0.04091072082519531, 0.042247772216796875, 0.04358482360839844, 0.044921875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 15.0, 20.0, 28.0, 55.0, 82.0, 202.0, 435.0, 1274.0, 912446.0, 132192.0, 1035.0, 368.0, 176.0, 85.0, 53.0, 28.0, 19.0, 11.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.87109375, -0.8454132080078125, -0.819732666015625, -0.7940521240234375, -0.76837158203125, -0.7426910400390625, -0.717010498046875, -0.6913299560546875, -0.6656494140625, -0.6399688720703125, -0.614288330078125, -0.5886077880859375, -0.56292724609375, -0.5372467041015625, -0.511566162109375, -0.4858856201171875, -0.460205078125, -0.4345245361328125, -0.408843994140625, -0.3831634521484375, -0.35748291015625, -0.3318023681640625, -0.306121826171875, -0.2804412841796875, -0.2547607421875, -0.2290802001953125, -0.203399658203125, -0.1777191162109375, -0.15203857421875, -0.1263580322265625, -0.100677490234375, -0.0749969482421875, -0.04931640625, -0.0236358642578125, 0.002044677734375, 0.0277252197265625, 0.05340576171875, 0.0790863037109375, 0.104766845703125, 0.1304473876953125, 0.1561279296875, 0.1818084716796875, 0.207489013671875, 0.2331695556640625, 0.25885009765625, 0.2845306396484375, 0.310211181640625, 0.3358917236328125, 0.361572265625, 0.3872528076171875, 0.412933349609375, 0.4386138916015625, 0.46429443359375, 0.4899749755859375, 0.515655517578125, 0.5413360595703125, 0.5670166015625, 0.5926971435546875, 0.618377685546875, 0.6440582275390625, 0.66973876953125, 0.6954193115234375, 0.721099853515625, 0.7467803955078125, 0.7724609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 17.0, 993.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6852552890777588, -0.6687242388725281, -0.6521931886672974, -0.6356621980667114, -0.6191311478614807, -0.60260009765625, -0.5860691070556641, -0.5695380568504333, -0.5530070066452026, -0.5364759564399719, -0.5199449062347412, -0.5034139156341553, -0.48688286542892456, -0.47035181522369385, -0.4538207948207855, -0.4372897744178772, -0.4207587242126465, -0.40422767400741577, -0.38769665360450745, -0.3711656332015991, -0.3546345829963684, -0.3381035327911377, -0.32157251238822937, -0.30504149198532104, -0.28851044178009033, -0.2719793915748596, -0.2554483711719513, -0.23891733586788177, -0.22238630056381226, -0.20585526525974274, -0.18932422995567322, -0.1727931946516037, -0.15626218914985657, -0.13973115384578705, -0.12320011854171753, -0.10666908323764801, -0.09013804793357849, -0.07360701262950897, -0.05707597732543945, -0.040544942021369934, -0.024013906717300415, -0.007482871413230896, 0.009048163890838623, 0.025579199194908142, 0.04211023449897766, 0.05864126980304718, 0.0751723051071167, 0.09170334041118622, 0.10823437571525574, 0.12476541101932526, 0.14129644632339478, 0.1578274816274643, 0.1743585169315338, 0.19088955223560333, 0.20742058753967285, 0.22395162284374237, 0.2404826581478119, 0.2570136785507202, 0.2735447287559509, 0.29007577896118164, 0.30660679936408997, 0.3231378197669983, 0.339668869972229, 0.3561999201774597, 0.37273094058036804]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 7.0, 13.0, 13.0, 10.0, 17.0, 24.0, 26.0, 36.0, 54.0, 36.0, 55.0, 66.0, 59.0, 67.0, 75.0, 66.0, 69.0, 62.0, 44.0, 40.0, 31.0, 26.0, 24.0, 24.0, 15.0, 12.0, 9.0, 9.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040503501892089844, -0.03906629979610443, -0.03762909770011902, -0.036191895604133606, -0.03475469350814819, -0.03331749141216278, -0.03188028931617737, -0.030443087220191956, -0.029005885124206543, -0.02756868302822113, -0.026131480932235718, -0.024694278836250305, -0.023257076740264893, -0.02181987464427948, -0.020382672548294067, -0.018945470452308655, -0.017508268356323242, -0.01607106626033783, -0.014633864164352417, -0.013196662068367004, -0.011759459972381592, -0.01032225787639618, -0.008885055780410767, -0.007447853684425354, -0.006010651588439941, -0.004573449492454529, -0.003136247396469116, -0.0016990453004837036, -0.000261843204498291, 0.0011753588914871216, 0.002612560987472534, 0.004049763083457947, 0.005486965179443359, 0.006924167275428772, 0.008361369371414185, 0.009798571467399597, 0.01123577356338501, 0.012672975659370422, 0.014110177755355835, 0.015547379851341248, 0.01698458194732666, 0.018421784043312073, 0.019858986139297485, 0.021296188235282898, 0.02273339033126831, 0.024170592427253723, 0.025607794523239136, 0.02704499661922455, 0.02848219871520996, 0.029919400811195374, 0.031356602907180786, 0.0327938050031662, 0.03423100709915161, 0.035668209195137024, 0.037105411291122437, 0.03854261338710785, 0.03997981548309326, 0.041417017579078674, 0.04285421967506409, 0.0442914217710495, 0.04572862386703491, 0.047165825963020325, 0.04860302805900574, 0.05004023015499115, 0.05147743225097656]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 3.0, 12.0, 9.0, 16.0, 8.0, 17.0, 14.0, 17.0, 18.0, 21.0, 25.0, 36.0, 28.0, 25.0, 47.0, 42.0, 47.0, 41.0, 52.0, 49.0, 36.0, 45.0, 35.0, 44.0, 37.0, 38.0, 43.0, 41.0, 22.0, 16.0, 13.0, 22.0, 19.0, 10.0, 12.0, 6.0, 10.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.4747314453125, -6.265869140625, -6.0570068359375, -5.84814453125, -5.6392822265625, -5.430419921875, -5.2215576171875, -5.0126953125, -4.8038330078125, -4.594970703125, -4.3861083984375, -4.17724609375, -3.9683837890625, -3.759521484375, -3.5506591796875, -3.341796875, -3.1329345703125, -2.924072265625, -2.7152099609375, -2.50634765625, -2.2974853515625, -2.088623046875, -1.8797607421875, -1.6708984375, -1.4620361328125, -1.253173828125, -1.0443115234375, -0.83544921875, -0.6265869140625, -0.417724609375, -0.2088623046875, 0.0, 0.2088623046875, 0.417724609375, 0.6265869140625, 0.83544921875, 1.0443115234375, 1.253173828125, 1.4620361328125, 1.6708984375, 1.8797607421875, 2.088623046875, 2.2974853515625, 2.50634765625, 2.7152099609375, 2.924072265625, 3.1329345703125, 3.341796875, 3.5506591796875, 3.759521484375, 3.9683837890625, 4.17724609375, 4.3861083984375, 4.594970703125, 4.8038330078125, 5.0126953125, 5.2215576171875, 5.430419921875, 5.6392822265625, 5.84814453125, 6.0570068359375, 6.265869140625, 6.4747314453125, 6.68359375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 5.0, 5.0, 1.0, 10.0, 15.0, 20.0, 18.0, 33.0, 60.0, 55.0, 79.0, 103.0, 122.0, 171.0, 248.0, 321.0, 510.0, 897.0, 1574.0, 3024.0, 6505.0, 15752.0, 47371.0, 168436.0, 409993.0, 270901.0, 79602.0, 24151.0, 9251.0, 4064.0, 2063.0, 1099.0, 676.0, 358.0, 274.0, 214.0, 145.0, 93.0, 80.0, 72.0, 54.0, 37.0, 32.0, 14.0, 10.0, 13.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.71875, -8.4600830078125, -8.201416015625, -7.9427490234375, -7.68408203125, -7.4254150390625, -7.166748046875, -6.9080810546875, -6.6494140625, -6.3907470703125, -6.132080078125, -5.8734130859375, -5.61474609375, -5.3560791015625, -5.097412109375, -4.8387451171875, -4.580078125, -4.3214111328125, -4.062744140625, -3.8040771484375, -3.54541015625, -3.2867431640625, -3.028076171875, -2.7694091796875, -2.5107421875, -2.2520751953125, -1.993408203125, -1.7347412109375, -1.47607421875, -1.2174072265625, -0.958740234375, -0.7000732421875, -0.44140625, -0.1827392578125, 0.075927734375, 0.3345947265625, 0.59326171875, 0.8519287109375, 1.110595703125, 1.3692626953125, 1.6279296875, 1.8865966796875, 2.145263671875, 2.4039306640625, 2.66259765625, 2.9212646484375, 3.179931640625, 3.4385986328125, 3.697265625, 3.9559326171875, 4.214599609375, 4.4732666015625, 4.73193359375, 4.9906005859375, 5.249267578125, 5.5079345703125, 5.7666015625, 6.0252685546875, 6.283935546875, 6.5426025390625, 6.80126953125, 7.0599365234375, 7.318603515625, 7.5772705078125, 7.8359375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 7.0, 9.0, 14.0, 15.0, 15.0, 27.0, 29.0, 26.0, 34.0, 36.0, 53.0, 60.0, 93.0, 168.0, 400.0, 1439.0, 198.0, 73.0, 57.0, 50.0, 37.0, 28.0, 22.0, 32.0, 22.0, 11.0, 16.0, 10.0, 10.0, 9.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-23.140625, -22.515625, -21.890625, -21.265625, -20.640625, -20.015625, -19.390625, -18.765625, -18.140625, -17.515625, -16.890625, -16.265625, -15.640625, -15.015625, -14.390625, -13.765625, -13.140625, -12.515625, -11.890625, -11.265625, -10.640625, -10.015625, -9.390625, -8.765625, -8.140625, -7.515625, -6.890625, -6.265625, -5.640625, -5.015625, -4.390625, -3.765625, -3.140625, -2.515625, -1.890625, -1.265625, -0.640625, -0.015625, 0.609375, 1.234375, 1.859375, 2.484375, 3.109375, 3.734375, 4.359375, 4.984375, 5.609375, 6.234375, 6.859375, 7.484375, 8.109375, 8.734375, 9.359375, 9.984375, 10.609375, 11.234375, 11.859375, 12.484375, 13.109375, 13.734375, 14.359375, 14.984375, 15.609375, 16.234375, 16.859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 6.0, 10.0, 23.0, 13.0, 14.0, 23.0, 30.0, 54.0, 60.0, 77.0, 117.0, 135.0, 213.0, 380.0, 746.0, 2919.0, 421209.0, 2711186.0, 6075.0, 968.0, 475.0, 284.0, 184.0, 133.0, 94.0, 65.0, 42.0, 39.0, 26.0, 25.0, 12.0, 10.0, 15.0, 8.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.125, -31.05908203125, -29.9931640625, -28.92724609375, -27.861328125, -26.79541015625, -25.7294921875, -24.66357421875, -23.59765625, -22.53173828125, -21.4658203125, -20.39990234375, -19.333984375, -18.26806640625, -17.2021484375, -16.13623046875, -15.0703125, -14.00439453125, -12.9384765625, -11.87255859375, -10.806640625, -9.74072265625, -8.6748046875, -7.60888671875, -6.54296875, -5.47705078125, -4.4111328125, -3.34521484375, -2.279296875, -1.21337890625, -0.1474609375, 0.91845703125, 1.984375, 3.05029296875, 4.1162109375, 5.18212890625, 6.248046875, 7.31396484375, 8.3798828125, 9.44580078125, 10.51171875, 11.57763671875, 12.6435546875, 13.70947265625, 14.775390625, 15.84130859375, 16.9072265625, 17.97314453125, 19.0390625, 20.10498046875, 21.1708984375, 22.23681640625, 23.302734375, 24.36865234375, 25.4345703125, 26.50048828125, 27.56640625, 28.63232421875, 29.6982421875, 30.76416015625, 31.830078125, 32.89599609375, 33.9619140625, 35.02783203125, 36.09375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 48.0, 146.0, 288.0, 271.0, 173.0, 64.0, 8.0, 4.0, 1.0, 1.0], "bins": [-152.00912475585938, -149.3544158935547, -146.69969177246094, -144.04498291015625, -141.39027404785156, -138.7355499267578, -136.08084106445312, -133.42613220214844, -130.77142333984375, -128.11671447753906, -125.46199798583984, -122.80728149414062, -120.15257263183594, -117.49785614013672, -114.8431396484375, -112.18843078613281, -109.53370666503906, -106.87899017333984, -104.22428131103516, -101.56956481933594, -98.91485595703125, -96.26013946533203, -93.60542297363281, -90.95071411132812, -88.2959976196289, -85.64128112792969, -82.986572265625, -80.33185577392578, -77.67713928222656, -75.02243041992188, -72.36771392822266, -69.71299743652344, -67.05828094482422, -64.403564453125, -61.74885559082031, -59.094139099121094, -56.43942642211914, -53.78471374511719, -51.12999725341797, -48.475284576416016, -45.82057189941406, -43.16585922241211, -40.511146545410156, -37.85643005371094, -35.201717376708984, -32.54700469970703, -29.892290115356445, -27.23757553100586, -24.582862854003906, -21.928150177001953, -19.273435592651367, -16.61872100830078, -13.964008331298828, -11.309294700622559, -8.654581069946289, -5.999866485595703, -3.34515380859375, -0.6904401779174805, 1.964273452758789, 4.618987083435059, 7.273700714111328, 9.928414344787598, 12.583127975463867, 15.237842559814453, 17.892555236816406]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 4.0, 13.0, 10.0, 3.0, 14.0, 16.0, 16.0, 24.0, 30.0, 25.0, 33.0, 29.0, 29.0, 27.0, 33.0, 39.0, 46.0, 40.0, 36.0, 39.0, 39.0, 34.0, 34.0, 36.0, 43.0, 31.0, 41.0, 26.0, 38.0, 26.0, 18.0, 27.0, 15.0, 11.0, 9.0, 15.0, 8.0, 10.0, 7.0, 7.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0], "bins": [-47.750030517578125, -46.51039505004883, -45.27075958251953, -44.0311279296875, -42.7914924621582, -41.551856994628906, -40.312225341796875, -39.07258987426758, -37.83295440673828, -36.593318939208984, -35.35368347167969, -34.114051818847656, -32.87441635131836, -31.634780883789062, -30.3951473236084, -29.155513763427734, -27.915878295898438, -26.67624282836914, -25.436609268188477, -24.196975708007812, -22.957340240478516, -21.71770477294922, -20.478071212768555, -19.23843765258789, -17.998802185058594, -16.759166717529297, -15.519533157348633, -14.279898643493652, -13.040264129638672, -11.800629615783691, -10.560995101928711, -9.32136058807373, -8.081729888916016, -6.842095375061035, -5.602460861206055, -4.362826347351074, -3.1231918334960938, -1.8835573196411133, -0.6439228057861328, 0.5957117080688477, 1.8353462219238281, 3.0749807357788086, 4.314615249633789, 5.5542497634887695, 6.79388427734375, 8.03351879119873, 9.273153305053711, 10.512787818908691, 11.752422332763672, 12.992056846618652, 14.231691360473633, 15.471325874328613, 16.710960388183594, 17.95059585571289, 19.190229415893555, 20.42986297607422, 21.669498443603516, 22.909133911132812, 24.148767471313477, 25.38840103149414, 26.628036499023438, 27.867671966552734, 29.1073055267334, 30.346939086914062, 31.58657455444336]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 9.0, 5.0, 11.0, 16.0, 12.0, 23.0, 14.0, 21.0, 19.0, 37.0, 42.0, 31.0, 39.0, 30.0, 51.0, 45.0, 47.0, 38.0, 34.0, 48.0, 37.0, 50.0, 34.0, 40.0, 20.0, 37.0, 33.0, 20.0, 27.0, 26.0, 20.0, 14.0, 12.0, 10.0, 11.0, 8.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.80859375, -7.57208251953125, -7.3355712890625, -7.09906005859375, -6.862548828125, -6.62603759765625, -6.3895263671875, -6.15301513671875, -5.91650390625, -5.67999267578125, -5.4434814453125, -5.20697021484375, -4.970458984375, -4.73394775390625, -4.4974365234375, -4.26092529296875, -4.0244140625, -3.78790283203125, -3.5513916015625, -3.31488037109375, -3.078369140625, -2.84185791015625, -2.6053466796875, -2.36883544921875, -2.13232421875, -1.89581298828125, -1.6593017578125, -1.42279052734375, -1.186279296875, -0.94976806640625, -0.7132568359375, -0.47674560546875, -0.240234375, -0.00372314453125, 0.2327880859375, 0.46929931640625, 0.705810546875, 0.94232177734375, 1.1788330078125, 1.41534423828125, 1.65185546875, 1.88836669921875, 2.1248779296875, 2.36138916015625, 2.597900390625, 2.83441162109375, 3.0709228515625, 3.30743408203125, 3.5439453125, 3.78045654296875, 4.0169677734375, 4.25347900390625, 4.489990234375, 4.72650146484375, 4.9630126953125, 5.19952392578125, 5.43603515625, 5.67254638671875, 5.9090576171875, 6.14556884765625, 6.382080078125, 6.61859130859375, 6.8551025390625, 7.09161376953125, 7.328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 3.0, 11.0, 10.0, 7.0, 14.0, 18.0, 36.0, 40.0, 38.0, 86.0, 113.0, 142.0, 184.0, 260.0, 330.0, 491.0, 729.0, 1212.0, 2949.0, 19917.0, 399252.0, 2972163.0, 752505.0, 35698.0, 3876.0, 1381.0, 895.0, 532.0, 402.0, 257.0, 183.0, 140.0, 96.0, 78.0, 52.0, 37.0, 39.0, 24.0, 26.0, 12.0, 12.0, 3.0, 6.0, 8.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-31.5625, -30.623291015625, -29.68408203125, -28.744873046875, -27.8056640625, -26.866455078125, -25.92724609375, -24.988037109375, -24.048828125, -23.109619140625, -22.17041015625, -21.231201171875, -20.2919921875, -19.352783203125, -18.41357421875, -17.474365234375, -16.53515625, -15.595947265625, -14.65673828125, -13.717529296875, -12.7783203125, -11.839111328125, -10.89990234375, -9.960693359375, -9.021484375, -8.082275390625, -7.14306640625, -6.203857421875, -5.2646484375, -4.325439453125, -3.38623046875, -2.447021484375, -1.5078125, -0.568603515625, 0.37060546875, 1.309814453125, 2.2490234375, 3.188232421875, 4.12744140625, 5.066650390625, 6.005859375, 6.945068359375, 7.88427734375, 8.823486328125, 9.7626953125, 10.701904296875, 11.64111328125, 12.580322265625, 13.51953125, 14.458740234375, 15.39794921875, 16.337158203125, 17.2763671875, 18.215576171875, 19.15478515625, 20.093994140625, 21.033203125, 21.972412109375, 22.91162109375, 23.850830078125, 24.7900390625, 25.729248046875, 26.66845703125, 27.607666015625, 28.546875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 11.0, 14.0, 17.0, 23.0, 41.0, 45.0, 72.0, 94.0, 106.0, 139.0, 166.0, 230.0, 258.0, 283.0, 341.0, 351.0, 315.0, 296.0, 287.0, 208.0, 172.0, 146.0, 124.0, 82.0, 78.0, 45.0, 32.0, 20.0, 15.0, 14.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5250244140625, -9.151611328125, -8.7781982421875, -8.40478515625, -8.0313720703125, -7.657958984375, -7.2845458984375, -6.9111328125, -6.5377197265625, -6.164306640625, -5.7908935546875, -5.41748046875, -5.0440673828125, -4.670654296875, -4.2972412109375, -3.923828125, -3.5504150390625, -3.177001953125, -2.8035888671875, -2.43017578125, -2.0567626953125, -1.683349609375, -1.3099365234375, -0.9365234375, -0.5631103515625, -0.189697265625, 0.1837158203125, 0.55712890625, 0.9305419921875, 1.303955078125, 1.6773681640625, 2.05078125, 2.4241943359375, 2.797607421875, 3.1710205078125, 3.54443359375, 3.9178466796875, 4.291259765625, 4.6646728515625, 5.0380859375, 5.4114990234375, 5.784912109375, 6.1583251953125, 6.53173828125, 6.9051513671875, 7.278564453125, 7.6519775390625, 8.025390625, 8.3988037109375, 8.772216796875, 9.1456298828125, 9.51904296875, 9.8924560546875, 10.265869140625, 10.6392822265625, 11.0126953125, 11.3861083984375, 11.759521484375, 12.1329345703125, 12.50634765625, 12.8797607421875, 13.253173828125, 13.6265869140625, 14.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 11.0, 20.0, 31.0, 60.0, 90.0, 211.0, 443.0, 1187.0, 3555.0, 15001.0, 78916.0, 426866.0, 1619351.0, 1557467.0, 398535.0, 72861.0, 14154.0, 3509.0, 1154.0, 466.0, 181.0, 97.0, 46.0, 32.0, 14.0, 9.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.317138671875, -11.89208984375, -11.467041015625, -11.0419921875, -10.616943359375, -10.19189453125, -9.766845703125, -9.341796875, -8.916748046875, -8.49169921875, -8.066650390625, -7.6416015625, -7.216552734375, -6.79150390625, -6.366455078125, -5.94140625, -5.516357421875, -5.09130859375, -4.666259765625, -4.2412109375, -3.816162109375, -3.39111328125, -2.966064453125, -2.541015625, -2.115966796875, -1.69091796875, -1.265869140625, -0.8408203125, -0.415771484375, 0.00927734375, 0.434326171875, 0.859375, 1.284423828125, 1.70947265625, 2.134521484375, 2.5595703125, 2.984619140625, 3.40966796875, 3.834716796875, 4.259765625, 4.684814453125, 5.10986328125, 5.534912109375, 5.9599609375, 6.385009765625, 6.81005859375, 7.235107421875, 7.66015625, 8.085205078125, 8.51025390625, 8.935302734375, 9.3603515625, 9.785400390625, 10.21044921875, 10.635498046875, 11.060546875, 11.485595703125, 11.91064453125, 12.335693359375, 12.7607421875, 13.185791015625, 13.61083984375, 14.035888671875, 14.4609375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 9.0, 15.0, 20.0, 31.0, 38.0, 68.0, 68.0, 86.0, 91.0, 89.0, 84.0, 100.0, 72.0, 60.0, 48.0, 39.0, 25.0, 24.0, 8.0, 9.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.99237060546875, -62.500450134277344, -59.00852584838867, -55.516605377197266, -52.024681091308594, -48.53276062011719, -45.04084014892578, -41.548919677734375, -38.0569953918457, -34.5650749206543, -31.073150634765625, -27.58123016357422, -24.08930778503418, -20.59738540649414, -17.105464935302734, -13.613542556762695, -10.121620178222656, -6.629698276519775, -3.1377763748168945, 0.3541450500488281, 3.846067428588867, 7.337989807128906, 10.829910278320312, 14.321832656860352, 17.81375503540039, 21.30567741394043, 24.79759979248047, 28.289520263671875, 31.781442642211914, 35.27336502075195, 38.76528549194336, 42.25720977783203, 45.74913024902344, 49.241050720214844, 52.732975006103516, 56.22489547729492, 59.716819763183594, 63.208740234375, 66.7006607055664, 70.19258117675781, 73.68450927734375, 77.17642974853516, 80.66835021972656, 84.1602783203125, 87.6521987915039, 91.14411926269531, 94.63603973388672, 98.12796020507812, 101.61988067626953, 105.11180114746094, 108.60372161865234, 112.09564208984375, 115.58757019042969, 119.0794906616211, 122.5714111328125, 126.0633316040039, 129.5552520751953, 133.04718017578125, 136.53909301757812, 140.03102111816406, 143.52293395996094, 147.01486206054688, 150.50677490234375, 153.9987030029297, 157.49063110351562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 9.0, 11.0, 12.0, 11.0, 15.0, 21.0, 11.0, 15.0, 21.0, 27.0, 28.0, 30.0, 32.0, 24.0, 25.0, 41.0, 34.0, 34.0, 31.0, 37.0, 24.0, 43.0, 48.0, 28.0, 30.0, 33.0, 31.0, 34.0, 28.0, 22.0, 21.0, 28.0, 24.0, 20.0, 8.0, 17.0, 13.0, 5.0, 12.0, 10.0, 4.0, 7.0, 4.0, 11.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-48.0953369140625, -46.55536651611328, -45.01539611816406, -43.475425720214844, -41.935455322265625, -40.395484924316406, -38.85551452636719, -37.315547943115234, -35.775577545166016, -34.2356071472168, -32.69563674926758, -31.15566635131836, -29.615697860717773, -28.075727462768555, -26.535757064819336, -24.99578857421875, -23.4558162689209, -21.91584587097168, -20.37587547302246, -18.835906982421875, -17.295936584472656, -15.755966186523438, -14.215995788574219, -12.676026344299316, -11.136055946350098, -9.596085548400879, -8.056116104125977, -6.516145706176758, -4.976175785064697, -3.4362058639526367, -1.896235466003418, -0.3562660217285156, 1.1837043762207031, 2.7236742973327637, 4.263644218444824, 5.803614616394043, 7.3435845375061035, 8.883554458618164, 10.423524856567383, 11.963494300842285, 13.503464698791504, 15.043435096740723, 16.583404541015625, 18.123374938964844, 19.663345336914062, 21.20331573486328, 22.7432861328125, 24.283254623413086, 25.823225021362305, 27.363195419311523, 28.903165817260742, 30.443134307861328, 31.983104705810547, 33.523075103759766, 35.063045501708984, 36.6030158996582, 38.14298629760742, 39.68295669555664, 41.22292709350586, 42.76289749145508, 44.3028678894043, 45.84283447265625, 47.38280487060547, 48.92277526855469, 50.462745666503906]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 8.0, 11.0, 12.0, 15.0, 18.0, 21.0, 23.0, 20.0, 29.0, 35.0, 27.0, 31.0, 20.0, 48.0, 44.0, 34.0, 44.0, 39.0, 38.0, 34.0, 42.0, 33.0, 32.0, 34.0, 23.0, 36.0, 37.0, 32.0, 23.0, 17.0, 15.0, 19.0, 12.0, 11.0, 6.0, 11.0, 11.0, 8.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-100.75, -97.5947265625, -94.439453125, -91.2841796875, -88.12890625, -84.9736328125, -81.818359375, -78.6630859375, -75.5078125, -72.3525390625, -69.197265625, -66.0419921875, -62.88671875, -59.7314453125, -56.576171875, -53.4208984375, -50.265625, -47.1103515625, -43.955078125, -40.7998046875, -37.64453125, -34.4892578125, -31.333984375, -28.1787109375, -25.0234375, -21.8681640625, -18.712890625, -15.5576171875, -12.40234375, -9.2470703125, -6.091796875, -2.9365234375, 0.21875, 3.3740234375, 6.529296875, 9.6845703125, 12.83984375, 15.9951171875, 19.150390625, 22.3056640625, 25.4609375, 28.6162109375, 31.771484375, 34.9267578125, 38.08203125, 41.2373046875, 44.392578125, 47.5478515625, 50.703125, 53.8583984375, 57.013671875, 60.1689453125, 63.32421875, 66.4794921875, 69.634765625, 72.7900390625, 75.9453125, 79.1005859375, 82.255859375, 85.4111328125, 88.56640625, 91.7216796875, 94.876953125, 98.0322265625, 101.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 15.0, 14.0, 24.0, 32.0, 67.0, 100.0, 178.0, 264.0, 413.0, 680.0, 969.0, 1530.0, 2381.0, 3730.0, 5676.0, 8706.0, 13345.0, 20203.0, 29733.0, 43387.0, 61243.0, 82149.0, 105230.0, 122300.0, 125041.0, 111260.0, 91388.0, 68688.0, 48982.0, 33642.0, 22991.0, 15393.0, 10046.0, 6598.0, 4351.0, 2760.0, 1806.0, 1170.0, 739.0, 477.0, 305.0, 198.0, 140.0, 86.0, 51.0, 32.0, 22.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-7.15625, -6.94683837890625, -6.7374267578125, -6.52801513671875, -6.318603515625, -6.10919189453125, -5.8997802734375, -5.69036865234375, -5.48095703125, -5.27154541015625, -5.0621337890625, -4.85272216796875, -4.643310546875, -4.43389892578125, -4.2244873046875, -4.01507568359375, -3.8056640625, -3.59625244140625, -3.3868408203125, -3.17742919921875, -2.968017578125, -2.75860595703125, -2.5491943359375, -2.33978271484375, -2.13037109375, -1.92095947265625, -1.7115478515625, -1.50213623046875, -1.292724609375, -1.08331298828125, -0.8739013671875, -0.66448974609375, -0.455078125, -0.24566650390625, -0.0362548828125, 0.17315673828125, 0.382568359375, 0.59197998046875, 0.8013916015625, 1.01080322265625, 1.22021484375, 1.42962646484375, 1.6390380859375, 1.84844970703125, 2.057861328125, 2.26727294921875, 2.4766845703125, 2.68609619140625, 2.8955078125, 3.10491943359375, 3.3143310546875, 3.52374267578125, 3.733154296875, 3.94256591796875, 4.1519775390625, 4.36138916015625, 4.57080078125, 4.78021240234375, 4.9896240234375, 5.19903564453125, 5.408447265625, 5.61785888671875, 5.8272705078125, 6.03668212890625, 6.24609375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 0.0, 4.0, 3.0, 6.0, 4.0, 3.0, 10.0, 12.0, 6.0, 8.0, 24.0, 19.0, 20.0, 17.0, 24.0, 21.0, 20.0, 32.0, 29.0, 29.0, 45.0, 34.0, 43.0, 45.0, 30.0, 1063.0, 40.0, 42.0, 40.0, 32.0, 27.0, 36.0, 37.0, 29.0, 31.0, 20.0, 19.0, 20.0, 12.0, 19.0, 11.0, 13.0, 7.0, 10.0, 4.0, 5.0, 6.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0], "bins": [-67.3125, -65.3154296875, -63.318359375, -61.3212890625, -59.32421875, -57.3271484375, -55.330078125, -53.3330078125, -51.3359375, -49.3388671875, -47.341796875, -45.3447265625, -43.34765625, -41.3505859375, -39.353515625, -37.3564453125, -35.359375, -33.3623046875, -31.365234375, -29.3681640625, -27.37109375, -25.3740234375, -23.376953125, -21.3798828125, -19.3828125, -17.3857421875, -15.388671875, -13.3916015625, -11.39453125, -9.3974609375, -7.400390625, -5.4033203125, -3.40625, -1.4091796875, 0.587890625, 2.5849609375, 4.58203125, 6.5791015625, 8.576171875, 10.5732421875, 12.5703125, 14.5673828125, 16.564453125, 18.5615234375, 20.55859375, 22.5556640625, 24.552734375, 26.5498046875, 28.546875, 30.5439453125, 32.541015625, 34.5380859375, 36.53515625, 38.5322265625, 40.529296875, 42.5263671875, 44.5234375, 46.5205078125, 48.517578125, 50.5146484375, 52.51171875, 54.5087890625, 56.505859375, 58.5029296875, 60.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 10.0, 10.0, 11.0, 20.0, 21.0, 29.0, 57.0, 62.0, 72.0, 126.0, 175.0, 225.0, 332.0, 441.0, 695.0, 879.0, 1344.0, 1909.0, 2742.0, 3868.0, 5723.0, 8219.0, 11775.0, 16928.0, 24199.0, 38887.0, 1854097.0, 42145.0, 24564.0, 17284.0, 12300.0, 8386.0, 5982.0, 4124.0, 2825.0, 1910.0, 1362.0, 988.0, 695.0, 514.0, 334.0, 274.0, 160.0, 121.0, 88.0, 64.0, 49.0, 27.0, 26.0, 16.0, 11.0, 10.0, 5.0, 8.0, 6.0, 1.0, 2.0, 3.0], "bins": [-17.5625, -17.022705078125, -16.48291015625, -15.943115234375, -15.4033203125, -14.863525390625, -14.32373046875, -13.783935546875, -13.244140625, -12.704345703125, -12.16455078125, -11.624755859375, -11.0849609375, -10.545166015625, -10.00537109375, -9.465576171875, -8.92578125, -8.385986328125, -7.84619140625, -7.306396484375, -6.7666015625, -6.226806640625, -5.68701171875, -5.147216796875, -4.607421875, -4.067626953125, -3.52783203125, -2.988037109375, -2.4482421875, -1.908447265625, -1.36865234375, -0.828857421875, -0.2890625, 0.250732421875, 0.79052734375, 1.330322265625, 1.8701171875, 2.409912109375, 2.94970703125, 3.489501953125, 4.029296875, 4.569091796875, 5.10888671875, 5.648681640625, 6.1884765625, 6.728271484375, 7.26806640625, 7.807861328125, 8.34765625, 8.887451171875, 9.42724609375, 9.967041015625, 10.5068359375, 11.046630859375, 11.58642578125, 12.126220703125, 12.666015625, 13.205810546875, 13.74560546875, 14.285400390625, 14.8251953125, 15.364990234375, 15.90478515625, 16.444580078125, 16.984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 8.0, 1.0, 4.0, 10.0, 22.0, 22.0, 47.0, 48.0, 72.0, 49.0, 90.0, 100.0, 92.0, 92.0, 75.0, 83.0, 36.0, 52.0, 29.0, 15.0, 14.0, 9.0, 5.0, 8.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2685546875, -0.2604026794433594, -0.25225067138671875, -0.24409866333007812, -0.2359466552734375, -0.22779464721679688, -0.21964263916015625, -0.21149063110351562, -0.203338623046875, -0.19518661499023438, -0.18703460693359375, -0.17888259887695312, -0.1707305908203125, -0.16257858276367188, -0.15442657470703125, -0.14627456665039062, -0.13812255859375, -0.12997055053710938, -0.12181854248046875, -0.11366653442382812, -0.1055145263671875, -0.09736251831054688, -0.08921051025390625, -0.08105850219726562, -0.072906494140625, -0.06475448608398438, -0.05660247802734375, -0.048450469970703125, -0.0402984619140625, -0.032146453857421875, -0.02399444580078125, -0.015842437744140625, -0.0076904296875, 0.000461578369140625, 0.00861358642578125, 0.016765594482421875, 0.0249176025390625, 0.033069610595703125, 0.04122161865234375, 0.049373626708984375, 0.057525634765625, 0.06567764282226562, 0.07382965087890625, 0.08198165893554688, 0.0901336669921875, 0.09828567504882812, 0.10643768310546875, 0.11458969116210938, 0.12274169921875, 0.13089370727539062, 0.13904571533203125, 0.14719772338867188, 0.1553497314453125, 0.16350173950195312, 0.17165374755859375, 0.17980575561523438, 0.187957763671875, 0.19610977172851562, 0.20426177978515625, 0.21241378784179688, 0.2205657958984375, 0.22871780395507812, 0.23686981201171875, 0.24502182006835938, 0.253173828125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 17.0, 8.0, 12.0, 19.0, 22.0, 25.0, 29.0, 40.0, 50.0, 71.0, 108.0, 158.0, 252.0, 430.0, 757.0, 1318.0, 3009.0, 7685.0, 22239.0, 70170.0, 212456.0, 373636.0, 234945.0, 79898.0, 25569.0, 8575.0, 3470.0, 1463.0, 816.0, 416.0, 282.0, 168.0, 111.0, 82.0, 63.0, 38.0, 36.0, 18.0, 17.0, 18.0, 7.0, 6.0, 7.0, 9.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.85577392578125, -0.8258056640625, -0.79583740234375, -0.765869140625, -0.73590087890625, -0.7059326171875, -0.67596435546875, -0.64599609375, -0.61602783203125, -0.5860595703125, -0.55609130859375, -0.526123046875, -0.49615478515625, -0.4661865234375, -0.43621826171875, -0.40625, -0.37628173828125, -0.3463134765625, -0.31634521484375, -0.286376953125, -0.25640869140625, -0.2264404296875, -0.19647216796875, -0.16650390625, -0.13653564453125, -0.1065673828125, -0.07659912109375, -0.046630859375, -0.01666259765625, 0.0133056640625, 0.04327392578125, 0.0732421875, 0.10321044921875, 0.1331787109375, 0.16314697265625, 0.193115234375, 0.22308349609375, 0.2530517578125, 0.28302001953125, 0.31298828125, 0.34295654296875, 0.3729248046875, 0.40289306640625, 0.432861328125, 0.46282958984375, 0.4927978515625, 0.52276611328125, 0.552734375, 0.58270263671875, 0.6126708984375, 0.64263916015625, 0.672607421875, 0.70257568359375, 0.7325439453125, 0.76251220703125, 0.79248046875, 0.82244873046875, 0.8524169921875, 0.88238525390625, 0.912353515625, 0.94232177734375, 0.9722900390625, 1.00225830078125, 1.0322265625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 7.0, 5.0, 24.0, 26.0, 50.0, 77.0, 101.0, 110.0, 112.0, 100.0, 102.0, 72.0, 55.0, 44.0, 30.0, 22.0, 19.0, 15.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13494135439395905, -0.1236642524600029, -0.11238715052604675, -0.1011100560426712, -0.08983295410871506, -0.07855585217475891, -0.06727875769138336, -0.056001655757427216, -0.04472455382347107, -0.03344745188951492, -0.022170353680849075, -0.010893255472183228, 0.0003838464617729187, 0.011660948395729065, 0.022938042879104614, 0.03421514481306076, 0.04549224674701691, 0.05676934868097305, 0.0680464506149292, 0.07932354509830475, 0.0906006470322609, 0.10187774896621704, 0.11315484344959259, 0.12443194538354874, 0.13570904731750488, 0.14698614180088043, 0.15826325118541718, 0.16954034566879272, 0.18081745505332947, 0.19209454953670502, 0.20337164402008057, 0.2146487534046173, 0.22592586278915405, 0.2372029572725296, 0.24848006665706635, 0.2597571611404419, 0.27103427052497864, 0.2823113799095154, 0.29358845949172974, 0.3048655688762665, 0.3161426782608032, 0.32741978764533997, 0.3386968672275543, 0.34997397661209106, 0.3612510859966278, 0.37252819538116455, 0.3838052749633789, 0.39508238434791565, 0.40635946393013, 0.41763657331466675, 0.4289136528968811, 0.44019076228141785, 0.4514678716659546, 0.46274495124816895, 0.4740220606327057, 0.48529917001724243, 0.4965762495994568, 0.5078533291816711, 0.5191304683685303, 0.5304075479507446, 0.541684627532959, 0.5529617667198181, 0.5642388463020325, 0.5755159258842468, 0.586793065071106]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 12.0, 13.0, 15.0, 13.0, 8.0, 13.0, 30.0, 27.0, 33.0, 24.0, 28.0, 33.0, 35.0, 33.0, 26.0, 37.0, 34.0, 37.0, 41.0, 40.0, 34.0, 38.0, 31.0, 38.0, 35.0, 31.0, 27.0, 32.0, 27.0, 21.0, 22.0, 17.0, 14.0, 21.0, 11.0, 9.0, 9.0, 8.0, 6.0, 5.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20501720905303955, -0.19857144355773926, -0.19212566316127777, -0.18567988276481628, -0.179234117269516, -0.1727883517742157, -0.1663425713777542, -0.15989679098129272, -0.15345102548599243, -0.14700525999069214, -0.14055947959423065, -0.13411369919776917, -0.12766793370246887, -0.12122216075658798, -0.11477638781070709, -0.1083306148648262, -0.10188484191894531, -0.09543906897306442, -0.08899329602718353, -0.08254752308130264, -0.07610175013542175, -0.06965597718954086, -0.06321020424365997, -0.05676443129777908, -0.05031865835189819, -0.0438728854060173, -0.037427112460136414, -0.030981339514255524, -0.024535566568374634, -0.018089793622493744, -0.011644020676612854, -0.005198247730731964, 0.0012475252151489258, 0.007693298161029816, 0.014139071106910706, 0.020584844052791595, 0.027030616998672485, 0.033476389944553375, 0.039922162890434265, 0.046367935836315155, 0.052813708782196045, 0.059259481728076935, 0.06570525467395782, 0.07215102761983871, 0.0785968005657196, 0.0850425735116005, 0.09148834645748138, 0.09793411940336227, 0.10437989234924316, 0.11082566529512405, 0.11727143824100494, 0.12371721118688583, 0.13016298413276672, 0.13660874962806702, 0.1430545300245285, 0.14950031042099, 0.15594607591629028, 0.16239184141159058, 0.16883762180805206, 0.17528340220451355, 0.18172916769981384, 0.18817493319511414, 0.19462071359157562, 0.2010664939880371, 0.2075122594833374]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 2.0, 7.0, 2.0, 8.0, 9.0, 6.0, 13.0, 19.0, 20.0, 19.0, 24.0, 22.0, 35.0, 25.0, 31.0, 30.0, 45.0, 30.0, 47.0, 52.0, 32.0, 31.0, 47.0, 38.0, 36.0, 33.0, 35.0, 35.0, 29.0, 31.0, 40.0, 21.0, 23.0, 26.0, 18.0, 12.0, 10.0, 6.0, 13.0, 7.0, 7.0, 3.0, 1.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-112.4375, -109.18359375, -105.9296875, -102.67578125, -99.421875, -96.16796875, -92.9140625, -89.66015625, -86.40625, -83.15234375, -79.8984375, -76.64453125, -73.390625, -70.13671875, -66.8828125, -63.62890625, -60.375, -57.12109375, -53.8671875, -50.61328125, -47.359375, -44.10546875, -40.8515625, -37.59765625, -34.34375, -31.08984375, -27.8359375, -24.58203125, -21.328125, -18.07421875, -14.8203125, -11.56640625, -8.3125, -5.05859375, -1.8046875, 1.44921875, 4.703125, 7.95703125, 11.2109375, 14.46484375, 17.71875, 20.97265625, 24.2265625, 27.48046875, 30.734375, 33.98828125, 37.2421875, 40.49609375, 43.75, 47.00390625, 50.2578125, 53.51171875, 56.765625, 60.01953125, 63.2734375, 66.52734375, 69.78125, 73.03515625, 76.2890625, 79.54296875, 82.796875, 86.05078125, 89.3046875, 92.55859375, 95.8125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 5.0, 7.0, 7.0, 11.0, 15.0, 21.0, 18.0, 27.0, 27.0, 57.0, 45.0, 97.0, 143.0, 213.0, 458.0, 1180.0, 4658.0, 34007.0, 292867.0, 575828.0, 121611.0, 13318.0, 2253.0, 704.0, 348.0, 203.0, 109.0, 68.0, 53.0, 40.0, 29.0, 19.0, 18.0, 12.0, 12.0, 11.0, 12.0, 4.0, 5.0, 3.0, 5.0, 7.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-24.1875, -23.501953125, -22.81640625, -22.130859375, -21.4453125, -20.759765625, -20.07421875, -19.388671875, -18.703125, -18.017578125, -17.33203125, -16.646484375, -15.9609375, -15.275390625, -14.58984375, -13.904296875, -13.21875, -12.533203125, -11.84765625, -11.162109375, -10.4765625, -9.791015625, -9.10546875, -8.419921875, -7.734375, -7.048828125, -6.36328125, -5.677734375, -4.9921875, -4.306640625, -3.62109375, -2.935546875, -2.25, -1.564453125, -0.87890625, -0.193359375, 0.4921875, 1.177734375, 1.86328125, 2.548828125, 3.234375, 3.919921875, 4.60546875, 5.291015625, 5.9765625, 6.662109375, 7.34765625, 8.033203125, 8.71875, 9.404296875, 10.08984375, 10.775390625, 11.4609375, 12.146484375, 12.83203125, 13.517578125, 14.203125, 14.888671875, 15.57421875, 16.259765625, 16.9453125, 17.630859375, 18.31640625, 19.001953125, 19.6875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 5.0, 8.0, 11.0, 15.0, 16.0, 23.0, 31.0, 48.0, 42.0, 53.0, 50.0, 57.0, 72.0, 2092.0, 85.0, 73.0, 64.0, 67.0, 53.0, 42.0, 31.0, 27.0, 25.0, 16.0, 11.0, 7.0, 3.0, 8.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.25, -214.046875, -206.84375, -199.640625, -192.4375, -185.234375, -178.03125, -170.828125, -163.625, -156.421875, -149.21875, -142.015625, -134.8125, -127.609375, -120.40625, -113.203125, -106.0, -98.796875, -91.59375, -84.390625, -77.1875, -69.984375, -62.78125, -55.578125, -48.375, -41.171875, -33.96875, -26.765625, -19.5625, -12.359375, -5.15625, 2.046875, 9.25, 16.453125, 23.65625, 30.859375, 38.0625, 45.265625, 52.46875, 59.671875, 66.875, 74.078125, 81.28125, 88.484375, 95.6875, 102.890625, 110.09375, 117.296875, 124.5, 131.703125, 138.90625, 146.109375, 153.3125, 160.515625, 167.71875, 174.921875, 182.125, 189.328125, 196.53125, 203.734375, 210.9375, 218.140625, 225.34375, 232.546875, 239.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 7.0, 8.0, 6.0, 5.0, 14.0, 17.0, 18.0, 25.0, 45.0, 50.0, 96.0, 139.0, 189.0, 396.0, 688.0, 1403.0, 3432.0, 14208.0, 154233.0, 2761099.0, 186139.0, 16455.0, 3677.0, 1546.0, 760.0, 382.0, 229.0, 147.0, 92.0, 50.0, 40.0, 27.0, 19.0, 14.0, 12.0, 8.0, 11.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.421875, -17.7763671875, -17.130859375, -16.4853515625, -15.83984375, -15.1943359375, -14.548828125, -13.9033203125, -13.2578125, -12.6123046875, -11.966796875, -11.3212890625, -10.67578125, -10.0302734375, -9.384765625, -8.7392578125, -8.09375, -7.4482421875, -6.802734375, -6.1572265625, -5.51171875, -4.8662109375, -4.220703125, -3.5751953125, -2.9296875, -2.2841796875, -1.638671875, -0.9931640625, -0.34765625, 0.2978515625, 0.943359375, 1.5888671875, 2.234375, 2.8798828125, 3.525390625, 4.1708984375, 4.81640625, 5.4619140625, 6.107421875, 6.7529296875, 7.3984375, 8.0439453125, 8.689453125, 9.3349609375, 9.98046875, 10.6259765625, 11.271484375, 11.9169921875, 12.5625, 13.2080078125, 13.853515625, 14.4990234375, 15.14453125, 15.7900390625, 16.435546875, 17.0810546875, 17.7265625, 18.3720703125, 19.017578125, 19.6630859375, 20.30859375, 20.9541015625, 21.599609375, 22.2451171875, 22.890625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 10.0, 35.0, 64.0, 132.0, 236.0, 246.0, 136.0, 61.0, 27.0, 14.0, 7.0, 9.0, 4.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-470.8799743652344, -459.4237365722656, -447.967529296875, -436.51129150390625, -425.0550842285156, -413.5988464355469, -402.14263916015625, -390.6864013671875, -379.23016357421875, -367.77392578125, -356.3177185058594, -344.8614807128906, -333.4052734375, -321.94903564453125, -310.4927978515625, -299.0365905761719, -287.58038330078125, -276.1241455078125, -264.6679382324219, -253.21170043945312, -241.7554931640625, -230.29925537109375, -218.84303283691406, -207.38681030273438, -195.9305877685547, -184.474365234375, -173.0181427001953, -161.56192016601562, -150.10568237304688, -138.64947509765625, -127.1932373046875, -115.73701477050781, -104.28082275390625, -92.82460021972656, -81.36837768554688, -69.91214752197266, -58.45592498779297, -46.99970245361328, -35.54347229003906, -24.087249755859375, -12.631027221679688, -1.1748027801513672, 10.281421661376953, 21.737648010253906, 33.193870544433594, 44.65009307861328, 56.1063232421875, 67.56254577636719, 79.01876831054688, 90.47499084472656, 101.93121337890625, 113.38744354248047, 124.84366607666016, 136.29989624023438, 147.75611877441406, 159.21234130859375, 170.66856384277344, 182.12478637695312, 193.5810089111328, 205.0372314453125, 216.49346923828125, 227.94967651367188, 239.40591430664062, 250.8621368408203, 262.318359375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 4.0, 5.0, 8.0, 8.0, 7.0, 18.0, 17.0, 15.0, 18.0, 26.0, 25.0, 40.0, 39.0, 37.0, 30.0, 33.0, 46.0, 36.0, 53.0, 34.0, 38.0, 43.0, 53.0, 35.0, 31.0, 39.0, 31.0, 31.0, 29.0, 29.0, 17.0, 13.0, 13.0, 19.0, 15.0, 11.0, 11.0, 10.0, 7.0, 6.0, 4.0, 1.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-229.23513793945312, -222.5076904296875, -215.78024291992188, -209.05279541015625, -202.32534790039062, -195.597900390625, -188.87045288085938, -182.1430206298828, -175.4155731201172, -168.68812561035156, -161.96067810058594, -155.2332305908203, -148.5057830810547, -141.77835083007812, -135.0509033203125, -128.32345581054688, -121.59600067138672, -114.8685531616211, -108.14110565185547, -101.41366577148438, -94.68621826171875, -87.95877075195312, -81.2313232421875, -74.50387573242188, -67.77642822265625, -61.048980712890625, -54.321537017822266, -47.59408950805664, -40.86664581298828, -34.139198303222656, -27.41175079345703, -20.684307098388672, -13.956863403320312, -7.229417324066162, -0.5019712448120117, 6.225475311279297, 12.952920913696289, 19.68036651611328, 26.407814025878906, 33.135257720947266, 39.86270523071289, 46.590152740478516, 53.317596435546875, 60.0450439453125, 66.77249145507812, 73.49993896484375, 80.22738647460938, 86.95482635498047, 93.6822738647461, 100.40972137451172, 107.13716888427734, 113.86460876464844, 120.59205627441406, 127.31950378417969, 134.0469512939453, 140.77439880371094, 147.50184631347656, 154.2292938232422, 160.9567413330078, 167.68418884277344, 174.41163635253906, 181.13906860351562, 187.86651611328125, 194.59396362304688, 201.3214111328125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 8.0, 19.0, 23.0, 29.0, 39.0, 63.0, 108.0, 142.0, 202.0, 284.0, 410.0, 565.0, 873.0, 1272.0, 1827.0, 2594.0, 3461.0, 4344.0, 1010938.0, 5695.0, 4242.0, 3334.0, 2438.0, 1716.0, 1230.0, 913.0, 599.0, 388.0, 249.0, 174.0, 112.0, 90.0, 54.0, 34.0, 24.0, 20.0, 12.0, 5.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-45.61445617675781, -44.378963470458984, -43.14346694946289, -41.90797424316406, -40.672481536865234, -39.436988830566406, -38.20149230957031, -36.965999603271484, -35.730506896972656, -34.49501419067383, -33.259517669677734, -32.024024963378906, -30.788532257080078, -29.553037643432617, -28.317543029785156, -27.082050323486328, -25.846553802490234, -24.611059188842773, -23.375566482543945, -22.140071868896484, -20.904579162597656, -19.669084548950195, -18.433589935302734, -17.198097229003906, -15.962602615356445, -14.7271089553833, -13.491615295410156, -12.256120681762695, -11.02062702178955, -9.785133361816406, -8.549638748168945, -7.314145088195801, -6.078651428222656, -4.843157768249512, -3.607663631439209, -2.3721697330474854, -1.1366758346557617, 0.09881782531738281, 1.3343119621276855, 2.5698060989379883, 3.805299758911133, 5.040793418884277, 6.27628755569458, 7.511781692504883, 8.747275352478027, 9.982769012451172, 11.218263626098633, 12.453757286071777, 13.689250946044922, 14.924744606018066, 16.16023826599121, 17.395732879638672, 18.6312255859375, 19.86672019958496, 21.102214813232422, 22.33770751953125, 23.57320213317871, 24.808696746826172, 26.044189453125, 27.27968406677246, 28.515178680419922, 29.75067138671875, 30.98616600036621, 32.22166061401367, 33.4571533203125]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 4.0, 17.0, 24.0, 35.0, 42.0, 72.0, 137.0, 578.0, 51460228.0, 1717.0, 126.0, 52.0, 35.0, 20.0, 10.0, 7.0, 6.0, 6.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1655.0, -1578.5308837890625, -1502.061767578125, -1425.5926513671875, -1349.12353515625, -1272.654296875, -1196.1851806640625, -1119.716064453125, -1043.2469482421875, -966.77783203125, -890.3087158203125, -813.8395385742188, -737.3704223632812, -660.9013061523438, -584.43212890625, -507.9630126953125, -431.493896484375, -355.0247802734375, -278.5556335449219, -202.0865020751953, -125.61737060546875, -49.14825439453125, 27.320892333984375, 103.7900390625, 180.2591552734375, 256.728271484375, 333.1974182128906, 409.66656494140625, 486.13568115234375, 562.6047973632812, 639.073974609375, 715.5430908203125, 792.011962890625, 868.4810791015625, 944.9501953125, 1021.4193725585938, 1097.888427734375, 1174.357666015625, 1250.8267822265625, 1327.2958984375, 1403.7650146484375, 1480.234130859375, 1556.7032470703125, 1633.17236328125, 1709.6416015625, 1786.110595703125, 1862.579833984375, 1939.0489501953125, 2015.51806640625, 2091.9873046875, 2168.456298828125, 2244.925537109375, 2321.39453125, 2397.86376953125, 2474.332763671875, 2550.802001953125, 2627.27099609375, 2703.740234375, 2780.209228515625, 2856.678466796875, 2933.1474609375, 3009.61669921875, 3086.085693359375, 3162.554931640625, 3239.024169921875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 12.0, 25.0, 17.0, 35.0, 56.0, 104.0, 232.0, 267.0, 135.0, 50.0, 25.0, 9.0, 7.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.85078430175781, -112.39032745361328, -107.92986297607422, -103.46940612792969, -99.00894165039062, -94.5484848022461, -90.08802795410156, -85.6275634765625, -81.16710662841797, -76.70664978027344, -72.24618530273438, -67.78572845458984, -63.32526779174805, -58.86480712890625, -54.40435028076172, -49.94388961791992, -45.483428955078125, -41.02296829223633, -36.56250762939453, -32.10205078125, -27.641590118408203, -23.181129455566406, -18.720670700073242, -14.260211944580078, -9.799751281738281, -5.339291572570801, -0.8788318634033203, 3.58162784576416, 8.04208755493164, 12.502548217773438, 16.9630069732666, 21.423465728759766, 25.883941650390625, 30.344402313232422, 34.80486297607422, 39.26531982421875, 43.72578048706055, 48.186241149902344, 52.646697998046875, 57.10715866088867, 61.56761932373047, 66.028076171875, 70.48854064941406, 74.9489974975586, 79.40945434570312, 83.86991882324219, 88.33037567138672, 92.79083251953125, 97.25129699707031, 101.71175384521484, 106.1722183227539, 110.63267517089844, 115.0931396484375, 119.55359649658203, 124.01405334472656, 128.47451782226562, 132.93496704101562, 137.3954315185547, 141.8558807373047, 146.31634521484375, 150.7768096923828, 155.23727416992188, 159.69772338867188, 164.15818786621094, 168.61865234375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 5.0, 9.0, 14.0, 15.0, 19.0, 31.0, 29.0, 43.0, 52.0, 63.0, 63.0, 69.0, 80.0, 76.0, 83.0, 75.0, 59.0, 53.0, 47.0, 23.0, 18.0, 23.0, 10.0, 11.0, 5.0, 6.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-145.66624450683594, -141.7189483642578, -137.7716522216797, -133.82435607910156, -129.87704467773438, -125.92974853515625, -121.98245239257812, -118.03515625, -114.08786010742188, -110.14056396484375, -106.1932601928711, -102.24596405029297, -98.29866790771484, -94.35136413574219, -90.40406799316406, -86.45677185058594, -82.50947570800781, -78.56217956542969, -74.61487579345703, -70.6675796508789, -66.72028350830078, -62.77298355102539, -58.82568359375, -54.878387451171875, -50.93108367919922, -46.98378372192383, -43.0364875793457, -39.08918762207031, -35.14189147949219, -31.194591522216797, -27.24729347229004, -23.29999542236328, -19.352699279785156, -15.405401229858398, -11.45810317993164, -7.510804176330566, -3.5635061264038086, 0.3837928771972656, 4.331090927124023, 8.278388977050781, 12.225687026977539, 16.172985076904297, 20.120283126831055, 24.067581176757812, 28.014881134033203, 31.96217918395996, 35.90947723388672, 39.856773376464844, 43.804073333740234, 47.751373291015625, 51.69866943359375, 55.64596939086914, 59.593265533447266, 63.540565490722656, 67.48786163330078, 71.43516540527344, 75.38246154785156, 79.32975769042969, 83.27706146240234, 87.22435760498047, 91.1716537475586, 95.11895751953125, 99.06625366210938, 103.0135498046875, 106.96084594726562]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 13.0, 31.0, 27.0, 39.0, 56.0, 80.0, 118.0, 159.0, 276.0, 336.0, 516.0, 863.0, 1243.0, 1981.0, 3328.0, 6000.0, 11770.0, 28077.0, 120029.0, 3923392.0, 58922.0, 18326.0, 8156.0, 4117.0, 2427.0, 1445.0, 842.0, 616.0, 361.0, 232.0, 167.0, 102.0, 72.0, 48.0, 38.0, 15.0, 20.0, 12.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.79266357421875, -2.7005615234375, -2.60845947265625, -2.516357421875, -2.42425537109375, -2.3321533203125, -2.24005126953125, -2.14794921875, -2.05584716796875, -1.9637451171875, -1.87164306640625, -1.779541015625, -1.68743896484375, -1.5953369140625, -1.50323486328125, -1.4111328125, -1.31903076171875, -1.2269287109375, -1.13482666015625, -1.042724609375, -0.95062255859375, -0.8585205078125, -0.76641845703125, -0.67431640625, -0.58221435546875, -0.4901123046875, -0.39801025390625, -0.305908203125, -0.21380615234375, -0.1217041015625, -0.02960205078125, 0.0625, 0.15460205078125, 0.2467041015625, 0.33880615234375, 0.430908203125, 0.52301025390625, 0.6151123046875, 0.70721435546875, 0.79931640625, 0.89141845703125, 0.9835205078125, 1.07562255859375, 1.167724609375, 1.25982666015625, 1.3519287109375, 1.44403076171875, 1.5361328125, 1.62823486328125, 1.7203369140625, 1.81243896484375, 1.904541015625, 1.99664306640625, 2.0887451171875, 2.18084716796875, 2.27294921875, 2.36505126953125, 2.4571533203125, 2.54925537109375, 2.641357421875, 2.73345947265625, 2.8255615234375, 2.91766357421875, 3.009765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 7.0, 0.0, 2.0, 5.0, 5.0, 9.0, 10.0, 9.0, 9.0, 13.0, 16.0, 15.0, 195.0, 578.0, 24.0, 16.0, 9.0, 10.0, 14.0, 4.0, 4.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.592193603515625, -0.57305908203125, -0.553924560546875, -0.5347900390625, -0.515655517578125, -0.49652099609375, -0.477386474609375, -0.458251953125, -0.439117431640625, -0.41998291015625, -0.400848388671875, -0.3817138671875, -0.362579345703125, -0.34344482421875, -0.324310302734375, -0.30517578125, -0.286041259765625, -0.26690673828125, -0.247772216796875, -0.2286376953125, -0.209503173828125, -0.19036865234375, -0.171234130859375, -0.152099609375, -0.132965087890625, -0.11383056640625, -0.094696044921875, -0.0755615234375, -0.056427001953125, -0.03729248046875, -0.018157958984375, 0.0009765625, 0.020111083984375, 0.03924560546875, 0.058380126953125, 0.0775146484375, 0.096649169921875, 0.11578369140625, 0.134918212890625, 0.154052734375, 0.173187255859375, 0.19232177734375, 0.211456298828125, 0.2305908203125, 0.249725341796875, 0.26885986328125, 0.287994384765625, 0.30712890625, 0.326263427734375, 0.34539794921875, 0.364532470703125, 0.3836669921875, 0.402801513671875, 0.42193603515625, 0.441070556640625, 0.460205078125, 0.479339599609375, 0.49847412109375, 0.517608642578125, 0.5367431640625, 0.555877685546875, 0.57501220703125, 0.594146728515625, 0.61328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 11.0, 14.0, 15.0, 32.0, 52.0, 71.0, 104.0, 209.0, 333.0, 561.0, 979.0, 1955.0, 4143.0, 10115.0, 28744.0, 108512.0, 936698.0, 2867820.0, 169654.0, 39939.0, 13397.0, 5398.0, 2526.0, 1260.0, 723.0, 386.0, 234.0, 140.0, 85.0, 53.0, 32.0, 26.0, 17.0, 10.0, 8.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6064453125, -1.554840087890625, -1.50323486328125, -1.451629638671875, -1.4000244140625, -1.348419189453125, -1.29681396484375, -1.245208740234375, -1.193603515625, -1.141998291015625, -1.09039306640625, -1.038787841796875, -0.9871826171875, -0.935577392578125, -0.88397216796875, -0.832366943359375, -0.78076171875, -0.729156494140625, -0.67755126953125, -0.625946044921875, -0.5743408203125, -0.522735595703125, -0.47113037109375, -0.419525146484375, -0.367919921875, -0.316314697265625, -0.26470947265625, -0.213104248046875, -0.1614990234375, -0.109893798828125, -0.05828857421875, -0.006683349609375, 0.044921875, 0.096527099609375, 0.14813232421875, 0.199737548828125, 0.2513427734375, 0.302947998046875, 0.35455322265625, 0.406158447265625, 0.457763671875, 0.509368896484375, 0.56097412109375, 0.612579345703125, 0.6641845703125, 0.715789794921875, 0.76739501953125, 0.819000244140625, 0.87060546875, 0.922210693359375, 0.97381591796875, 1.025421142578125, 1.0770263671875, 1.128631591796875, 1.18023681640625, 1.231842041015625, 1.283447265625, 1.335052490234375, 1.38665771484375, 1.438262939453125, 1.4898681640625, 1.541473388671875, 1.59307861328125, 1.644683837890625, 1.6962890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 14.0, 11.0, 8.0, 15.0, 24.0, 25.0, 29.0, 30.0, 53.0, 63.0, 88.0, 139.0, 210.0, 363.0, 1076.0, 849.0, 359.0, 176.0, 143.0, 98.0, 69.0, 53.0, 41.0, 30.0, 26.0, 19.0, 10.0, 16.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5062713623046875, -0.488128662109375, -0.4699859619140625, -0.45184326171875, -0.4337005615234375, -0.415557861328125, -0.3974151611328125, -0.3792724609375, -0.3611297607421875, -0.342987060546875, -0.3248443603515625, -0.30670166015625, -0.2885589599609375, -0.270416259765625, -0.2522735595703125, -0.234130859375, -0.2159881591796875, -0.197845458984375, -0.1797027587890625, -0.16156005859375, -0.1434173583984375, -0.125274658203125, -0.1071319580078125, -0.0889892578125, -0.0708465576171875, -0.052703857421875, -0.0345611572265625, -0.01641845703125, 0.0017242431640625, 0.019866943359375, 0.0380096435546875, 0.05615234375, 0.0742950439453125, 0.092437744140625, 0.1105804443359375, 0.12872314453125, 0.1468658447265625, 0.165008544921875, 0.1831512451171875, 0.2012939453125, 0.2194366455078125, 0.237579345703125, 0.2557220458984375, 0.27386474609375, 0.2920074462890625, 0.310150146484375, 0.3282928466796875, 0.346435546875, 0.3645782470703125, 0.382720947265625, 0.4008636474609375, 0.41900634765625, 0.4371490478515625, 0.455291748046875, 0.4734344482421875, 0.4915771484375, 0.5097198486328125, 0.527862548828125, 0.5460052490234375, 0.56414794921875, 0.5822906494140625, 0.600433349609375, 0.6185760498046875, 0.63671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 19.0, 32.0, 57.0, 124.0, 206.0, 215.0, 166.0, 75.0, 40.0, 20.0, 8.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.288210391998291, -5.137660980224609, -4.9871110916137695, -4.836561679840088, -4.686011791229248, -4.535462379455566, -4.384912490844727, -4.234363079071045, -4.083813190460205, -3.9332635402679443, -3.7827138900756836, -3.632164239883423, -3.481614589691162, -3.3310649394989014, -3.1805152893066406, -3.029965877532959, -2.8794162273406982, -2.7288665771484375, -2.5783169269561768, -2.427767276763916, -2.2772176265716553, -2.1266679763793945, -1.9761184453964233, -1.8255687952041626, -1.6750191450119019, -1.5244694948196411, -1.3739198446273804, -1.2233703136444092, -1.0728206634521484, -0.9222709536552429, -0.771721363067627, -0.6211717128753662, -0.47062206268310547, -0.3200724124908447, -0.16952279210090637, -0.018973171710968018, 0.13157647848129272, 0.28212612867355347, 0.43267571926116943, 0.5832253694534302, 0.7337750196456909, 0.8843246698379517, 1.0348743200302124, 1.1854238510131836, 1.3359735012054443, 1.486523151397705, 1.6370728015899658, 1.7876224517822266, 1.9381721019744873, 2.088721752166748, 2.239271402359009, 2.3898210525512695, 2.5403707027435303, 2.690920352935791, 2.8414697647094727, 2.9920196533203125, 3.142569065093994, 3.293118715286255, 3.4436683654785156, 3.5942180156707764, 3.744767665863037, 3.895317316055298, 4.045866966247559, 4.19641637802124, 4.34696626663208]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 8.0, 9.0, 11.0, 9.0, 16.0, 20.0, 28.0, 19.0, 29.0, 39.0, 36.0, 43.0, 51.0, 49.0, 49.0, 50.0, 68.0, 51.0, 42.0, 45.0, 45.0, 51.0, 44.0, 35.0, 31.0, 23.0, 19.0, 17.0, 15.0, 7.0, 7.0, 5.0, 4.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5471043586730957, -2.4660542011260986, -2.3850040435791016, -2.3039536476135254, -2.2229034900665283, -2.1418533325195312, -2.060803174972534, -1.979753017425537, -1.8987027406692505, -1.8176525831222534, -1.7366023063659668, -1.6555521488189697, -1.5745019912719727, -1.493451714515686, -1.412401556968689, -1.3313512802124023, -1.2503011226654053, -1.1692509651184082, -1.0882006883621216, -1.0071505308151245, -0.9261003136634827, -0.8450500965118408, -0.7639999389648438, -0.6829497218132019, -0.6018995046615601, -0.5208492875099182, -0.43979910016059875, -0.3587489128112793, -0.27769869565963745, -0.1966484785079956, -0.11559829115867615, -0.03454810380935669, 0.046502113342285156, 0.1275523155927658, 0.20860251784324646, 0.2896527051925659, 0.37070292234420776, 0.4517531394958496, 0.5328032970428467, 0.6138535141944885, 0.6949037313461304, 0.7759539484977722, 0.8570041656494141, 0.9380543231964111, 1.0191044807434082, 1.1001547574996948, 1.181204915046692, 1.2622551918029785, 1.3433053493499756, 1.4243555068969727, 1.5054057836532593, 1.5864559412002563, 1.667506217956543, 1.74855637550354, 1.829606533050537, 1.9106566905975342, 1.9917069673538208, 2.0727572441101074, 2.1538074016571045, 2.2348575592041016, 2.3159077167510986, 2.3969578742980957, 2.478008270263672, 2.559058427810669, 2.640108585357666]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 16.0, 22.0, 28.0, 41.0, 60.0, 84.0, 128.0, 198.0, 258.0, 404.0, 634.0, 903.0, 1419.0, 2294.0, 3893.0, 6477.0, 10664.0, 19077.0, 36598.0, 627056.0, 264215.0, 31676.0, 17148.0, 9835.0, 5777.0, 3534.0, 2173.0, 1352.0, 868.0, 583.0, 332.0, 253.0, 176.0, 126.0, 86.0, 55.0, 38.0, 30.0, 20.0, 7.0, 4.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.798828125, -2.72088623046875, -2.6429443359375, -2.56500244140625, -2.487060546875, -2.40911865234375, -2.3311767578125, -2.25323486328125, -2.17529296875, -2.09735107421875, -2.0194091796875, -1.94146728515625, -1.863525390625, -1.78558349609375, -1.7076416015625, -1.62969970703125, -1.5517578125, -1.47381591796875, -1.3958740234375, -1.31793212890625, -1.239990234375, -1.16204833984375, -1.0841064453125, -1.00616455078125, -0.92822265625, -0.85028076171875, -0.7723388671875, -0.69439697265625, -0.616455078125, -0.53851318359375, -0.4605712890625, -0.38262939453125, -0.3046875, -0.22674560546875, -0.1488037109375, -0.07086181640625, 0.007080078125, 0.08502197265625, 0.1629638671875, 0.24090576171875, 0.31884765625, 0.39678955078125, 0.4747314453125, 0.55267333984375, 0.630615234375, 0.70855712890625, 0.7864990234375, 0.86444091796875, 0.9423828125, 1.02032470703125, 1.0982666015625, 1.17620849609375, 1.254150390625, 1.33209228515625, 1.4100341796875, 1.48797607421875, 1.56591796875, 1.64385986328125, 1.7218017578125, 1.79974365234375, 1.877685546875, 1.95562744140625, 2.0335693359375, 2.11151123046875, 2.189453125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 4.0, 3.0, 8.0, 6.0, 7.0, 7.0, 9.0, 12.0, 14.0, 21.0, 144.0, 477.0, 163.0, 25.0, 11.0, 10.0, 8.0, 11.0, 6.0, 5.0, 7.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61328125, -0.5943450927734375, -0.575408935546875, -0.5564727783203125, -0.53753662109375, -0.5186004638671875, -0.499664306640625, -0.4807281494140625, -0.4617919921875, -0.4428558349609375, -0.423919677734375, -0.4049835205078125, -0.38604736328125, -0.3671112060546875, -0.348175048828125, -0.3292388916015625, -0.310302734375, -0.2913665771484375, -0.272430419921875, -0.2534942626953125, -0.23455810546875, -0.2156219482421875, -0.196685791015625, -0.1777496337890625, -0.1588134765625, -0.1398773193359375, -0.120941162109375, -0.1020050048828125, -0.08306884765625, -0.0641326904296875, -0.045196533203125, -0.0262603759765625, -0.00732421875, 0.0116119384765625, 0.030548095703125, 0.0494842529296875, 0.06842041015625, 0.0873565673828125, 0.106292724609375, 0.1252288818359375, 0.1441650390625, 0.1631011962890625, 0.182037353515625, 0.2009735107421875, 0.21990966796875, 0.2388458251953125, 0.257781982421875, 0.2767181396484375, 0.295654296875, 0.3145904541015625, 0.333526611328125, 0.3524627685546875, 0.37139892578125, 0.3903350830078125, 0.409271240234375, 0.4282073974609375, 0.4471435546875, 0.4660797119140625, 0.485015869140625, 0.5039520263671875, 0.52288818359375, 0.5418243408203125, 0.560760498046875, 0.5796966552734375, 0.5986328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 15.0, 9.0, 11.0, 12.0, 23.0, 37.0, 47.0, 57.0, 87.0, 154.0, 176.0, 262.0, 457.0, 688.0, 1123.0, 1832.0, 3041.0, 5379.0, 9863.0, 19787.0, 46883.0, 125714.0, 308031.0, 308786.0, 125832.0, 46933.0, 20100.0, 9902.0, 5389.0, 3053.0, 1789.0, 1103.0, 637.0, 451.0, 248.0, 195.0, 129.0, 86.0, 66.0, 53.0, 35.0, 21.0, 18.0, 11.0, 4.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.513671875, -1.46636962890625, -1.4190673828125, -1.37176513671875, -1.324462890625, -1.27716064453125, -1.2298583984375, -1.18255615234375, -1.13525390625, -1.08795166015625, -1.0406494140625, -0.99334716796875, -0.946044921875, -0.89874267578125, -0.8514404296875, -0.80413818359375, -0.7568359375, -0.70953369140625, -0.6622314453125, -0.61492919921875, -0.567626953125, -0.52032470703125, -0.4730224609375, -0.42572021484375, -0.37841796875, -0.33111572265625, -0.2838134765625, -0.23651123046875, -0.189208984375, -0.14190673828125, -0.0946044921875, -0.04730224609375, 0.0, 0.04730224609375, 0.0946044921875, 0.14190673828125, 0.189208984375, 0.23651123046875, 0.2838134765625, 0.33111572265625, 0.37841796875, 0.42572021484375, 0.4730224609375, 0.52032470703125, 0.567626953125, 0.61492919921875, 0.6622314453125, 0.70953369140625, 0.7568359375, 0.80413818359375, 0.8514404296875, 0.89874267578125, 0.946044921875, 0.99334716796875, 1.0406494140625, 1.08795166015625, 1.13525390625, 1.18255615234375, 1.2298583984375, 1.27716064453125, 1.324462890625, 1.37176513671875, 1.4190673828125, 1.46636962890625, 1.513671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 5.0, 4.0, 6.0, 8.0, 9.0, 8.0, 15.0, 17.0, 19.0, 13.0, 15.0, 18.0, 24.0, 20.0, 36.0, 34.0, 36.0, 49.0, 45.0, 32.0, 49.0, 37.0, 39.0, 39.0, 40.0, 23.0, 32.0, 32.0, 32.0, 23.0, 34.0, 29.0, 17.0, 25.0, 24.0, 28.0, 15.0, 9.0, 10.0, 7.0, 10.0, 7.0, 9.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.2109375, -2.147430419921875, -2.08392333984375, -2.020416259765625, -1.9569091796875, -1.893402099609375, -1.82989501953125, -1.766387939453125, -1.702880859375, -1.639373779296875, -1.57586669921875, -1.512359619140625, -1.4488525390625, -1.385345458984375, -1.32183837890625, -1.258331298828125, -1.19482421875, -1.131317138671875, -1.06781005859375, -1.004302978515625, -0.9407958984375, -0.877288818359375, -0.81378173828125, -0.750274658203125, -0.686767578125, -0.623260498046875, -0.55975341796875, -0.496246337890625, -0.4327392578125, -0.369232177734375, -0.30572509765625, -0.242218017578125, -0.1787109375, -0.115203857421875, -0.05169677734375, 0.011810302734375, 0.0753173828125, 0.138824462890625, 0.20233154296875, 0.265838623046875, 0.329345703125, 0.392852783203125, 0.45635986328125, 0.519866943359375, 0.5833740234375, 0.646881103515625, 0.71038818359375, 0.773895263671875, 0.83740234375, 0.900909423828125, 0.96441650390625, 1.027923583984375, 1.0914306640625, 1.154937744140625, 1.21844482421875, 1.281951904296875, 1.345458984375, 1.408966064453125, 1.47247314453125, 1.535980224609375, 1.5994873046875, 1.662994384765625, 1.72650146484375, 1.790008544921875, 1.853515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 7.0, 11.0, 25.0, 43.0, 73.0, 181.0, 539.0, 1801.0, 11525.0, 968443.0, 60528.0, 3962.0, 875.0, 306.0, 114.0, 50.0, 29.0, 18.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.0, -21.4171142578125, -20.834228515625, -20.2513427734375, -19.66845703125, -19.0855712890625, -18.502685546875, -17.9197998046875, -17.3369140625, -16.7540283203125, -16.171142578125, -15.5882568359375, -15.00537109375, -14.4224853515625, -13.839599609375, -13.2567138671875, -12.673828125, -12.0909423828125, -11.508056640625, -10.9251708984375, -10.34228515625, -9.7593994140625, -9.176513671875, -8.5936279296875, -8.0107421875, -7.4278564453125, -6.844970703125, -6.2620849609375, -5.67919921875, -5.0963134765625, -4.513427734375, -3.9305419921875, -3.34765625, -2.7647705078125, -2.181884765625, -1.5989990234375, -1.01611328125, -0.4332275390625, 0.149658203125, 0.7325439453125, 1.3154296875, 1.8983154296875, 2.481201171875, 3.0640869140625, 3.64697265625, 4.2298583984375, 4.812744140625, 5.3956298828125, 5.978515625, 6.5614013671875, 7.144287109375, 7.7271728515625, 8.31005859375, 8.8929443359375, 9.475830078125, 10.0587158203125, 10.6416015625, 11.2244873046875, 11.807373046875, 12.3902587890625, 12.97314453125, 13.5560302734375, 14.138916015625, 14.7218017578125, 15.3046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 8.0, 13.0, 14.0, 27.0, 44.0, 68.0, 84.0, 207.0, 200.0, 119.0, 56.0, 40.0, 33.0, 22.0, 17.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033593177795410156, -0.00032438337802886963, -0.0003128349781036377, -0.00030128657817840576, -0.00028973817825317383, -0.0002781897783279419, -0.00026664137840270996, -0.00025509297847747803, -0.0002435445785522461, -0.00023199617862701416, -0.00022044777870178223, -0.0002088993787765503, -0.00019735097885131836, -0.00018580257892608643, -0.0001742541790008545, -0.00016270577907562256, -0.00015115737915039062, -0.0001396089792251587, -0.00012806057929992676, -0.00011651217937469482, -0.00010496377944946289, -9.341537952423096e-05, -8.186697959899902e-05, -7.031857967376709e-05, -5.8770179748535156e-05, -4.722177982330322e-05, -3.567337989807129e-05, -2.4124979972839355e-05, -1.2576580047607422e-05, -1.0281801223754883e-06, 1.0520219802856445e-05, 2.206861972808838e-05, 3.361701965332031e-05, 4.5165419578552246e-05, 5.671381950378418e-05, 6.826221942901611e-05, 7.981061935424805e-05, 9.135901927947998e-05, 0.00010290741920471191, 0.00011445581912994385, 0.00012600421905517578, 0.00013755261898040771, 0.00014910101890563965, 0.00016064941883087158, 0.00017219781875610352, 0.00018374621868133545, 0.00019529461860656738, 0.00020684301853179932, 0.00021839141845703125, 0.00022993981838226318, 0.00024148821830749512, 0.00025303661823272705, 0.000264585018157959, 0.0002761334180831909, 0.00028768181800842285, 0.0002992302179336548, 0.0003107786178588867, 0.00032232701778411865, 0.0003338754177093506, 0.0003454238176345825, 0.00035697221755981445, 0.0003685206174850464, 0.0003800690174102783, 0.00039161741733551025, 0.0004031658172607422]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 12.0, 15.0, 39.0, 51.0, 85.0, 210.0, 555.0, 1664.0, 9241.0, 257805.0, 761426.0, 14059.0, 2275.0, 617.0, 250.0, 109.0, 47.0, 26.0, 21.0, 13.0, 8.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5582275390625, -9.218017578125, -8.8778076171875, -8.53759765625, -8.1973876953125, -7.857177734375, -7.5169677734375, -7.1767578125, -6.8365478515625, -6.496337890625, -6.1561279296875, -5.81591796875, -5.4757080078125, -5.135498046875, -4.7952880859375, -4.455078125, -4.1148681640625, -3.774658203125, -3.4344482421875, -3.09423828125, -2.7540283203125, -2.413818359375, -2.0736083984375, -1.7333984375, -1.3931884765625, -1.052978515625, -0.7127685546875, -0.37255859375, -0.0323486328125, 0.307861328125, 0.6480712890625, 0.98828125, 1.3284912109375, 1.668701171875, 2.0089111328125, 2.34912109375, 2.6893310546875, 3.029541015625, 3.3697509765625, 3.7099609375, 4.0501708984375, 4.390380859375, 4.7305908203125, 5.07080078125, 5.4110107421875, 5.751220703125, 6.0914306640625, 6.431640625, 6.7718505859375, 7.112060546875, 7.4522705078125, 7.79248046875, 8.1326904296875, 8.472900390625, 8.8131103515625, 9.1533203125, 9.4935302734375, 9.833740234375, 10.1739501953125, 10.51416015625, 10.8543701171875, 11.194580078125, 11.5347900390625, 11.875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 17.0, 13.0, 10.0, 24.0, 29.0, 47.0, 44.0, 78.0, 98.0, 105.0, 110.0, 98.0, 89.0, 48.0, 37.0, 25.0, 19.0, 22.0, 18.0, 14.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.80859375, -2.697021484375, -2.58544921875, -2.473876953125, -2.3623046875, -2.250732421875, -2.13916015625, -2.027587890625, -1.916015625, -1.804443359375, -1.69287109375, -1.581298828125, -1.4697265625, -1.358154296875, -1.24658203125, -1.135009765625, -1.0234375, -0.911865234375, -0.80029296875, -0.688720703125, -0.5771484375, -0.465576171875, -0.35400390625, -0.242431640625, -0.130859375, -0.019287109375, 0.09228515625, 0.203857421875, 0.3154296875, 0.427001953125, 0.53857421875, 0.650146484375, 0.76171875, 0.873291015625, 0.98486328125, 1.096435546875, 1.2080078125, 1.319580078125, 1.43115234375, 1.542724609375, 1.654296875, 1.765869140625, 1.87744140625, 1.989013671875, 2.1005859375, 2.212158203125, 2.32373046875, 2.435302734375, 2.546875, 2.658447265625, 2.77001953125, 2.881591796875, 2.9931640625, 3.104736328125, 3.21630859375, 3.327880859375, 3.439453125, 3.551025390625, 3.66259765625, 3.774169921875, 3.8857421875, 3.997314453125, 4.10888671875, 4.220458984375, 4.33203125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 12.0, 33.0, 128.0, 370.0, 332.0, 72.0, 27.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.97212219238281, -72.76140594482422, -70.55068969726562, -68.33997344970703, -66.12925720214844, -63.918540954589844, -61.707828521728516, -59.49711227416992, -57.28639602661133, -55.075679779052734, -52.86496353149414, -50.65424728393555, -48.44353485107422, -46.232818603515625, -44.02210235595703, -41.81138610839844, -39.600669860839844, -37.38995361328125, -35.179237365722656, -32.96852111816406, -30.7578067779541, -28.547090530395508, -26.336376190185547, -24.125659942626953, -21.91494369506836, -19.704227447509766, -17.493511199951172, -15.282796859741211, -13.072080612182617, -10.861364364624023, -8.650649070739746, -6.439933776855469, -4.229225158691406, -2.0185093879699707, 0.19220638275146484, 2.4029221534729004, 4.613637924194336, 6.82435417175293, 9.035069465637207, 11.245784759521484, 13.456501007080078, 15.667217254638672, 17.877933502197266, 20.088647842407227, 22.29936408996582, 24.510080337524414, 26.720794677734375, 28.93151092529297, 31.142227172851562, 33.352943420410156, 35.56365966796875, 37.774375915527344, 39.98509216308594, 42.19580841064453, 44.40652084350586, 46.61723709106445, 48.82795333862305, 51.03866958618164, 53.249385833740234, 55.46010208129883, 57.670814514160156, 59.88153076171875, 62.092247009277344, 64.30296325683594, 66.51367950439453]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 8.0, 8.0, 2.0, 3.0, 6.0, 24.0, 21.0, 45.0, 67.0, 95.0, 114.0, 145.0, 135.0, 94.0, 69.0, 55.0, 21.0, 26.0, 7.0, 9.0, 6.0, 4.0, 2.0, 8.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.02294158935547, -38.572608947753906, -37.12227249145508, -35.671939849853516, -34.22160339355469, -32.771270751953125, -31.320938110351562, -29.870603561401367, -28.420269012451172, -26.969934463500977, -25.51959991455078, -24.06926727294922, -22.618932723999023, -21.168598175048828, -19.718265533447266, -18.26793098449707, -16.817596435546875, -15.36726188659668, -13.9169282913208, -12.466594696044922, -11.016260147094727, -9.565925598144531, -8.115592002868652, -6.665258407592773, -5.214923858642578, -3.764589786529541, -2.314255714416504, -0.8639216423034668, 0.5864124298095703, 2.0367465019226074, 3.4870805740356445, 4.937414169311523, 6.387748718261719, 7.838082790374756, 9.288416862487793, 10.738750457763672, 12.189085006713867, 13.639419555664062, 15.089753150939941, 16.54008674621582, 17.990421295166016, 19.44075584411621, 20.891090393066406, 22.34142303466797, 23.791757583618164, 25.24209213256836, 26.692424774169922, 28.142759323120117, 29.593093872070312, 31.043428421020508, 32.4937629699707, 33.944095611572266, 35.394432067871094, 36.844764709472656, 38.29509735107422, 39.74542999267578, 41.19576644897461, 42.64609909057617, 44.096435546875, 45.54676818847656, 46.997100830078125, 48.44743728637695, 49.897769927978516, 51.348106384277344, 52.798439025878906]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 5.0, 7.0, 16.0, 13.0, 18.0, 24.0, 36.0, 50.0, 75.0, 105.0, 169.0, 232.0, 393.0, 637.0, 1090.0, 2139.0, 4827.0, 12734.0, 53049.0, 3561180.0, 505315.0, 34157.0, 9814.0, 3898.0, 1848.0, 993.0, 508.0, 324.0, 185.0, 118.0, 101.0, 64.0, 39.0, 24.0, 20.0, 20.0, 9.0, 11.0, 10.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80078125, -5.6295166015625, -5.458251953125, -5.2869873046875, -5.11572265625, -4.9444580078125, -4.773193359375, -4.6019287109375, -4.4306640625, -4.2593994140625, -4.088134765625, -3.9168701171875, -3.74560546875, -3.5743408203125, -3.403076171875, -3.2318115234375, -3.060546875, -2.8892822265625, -2.718017578125, -2.5467529296875, -2.37548828125, -2.2042236328125, -2.032958984375, -1.8616943359375, -1.6904296875, -1.5191650390625, -1.347900390625, -1.1766357421875, -1.00537109375, -0.8341064453125, -0.662841796875, -0.4915771484375, -0.3203125, -0.1490478515625, 0.022216796875, 0.1934814453125, 0.36474609375, 0.5360107421875, 0.707275390625, 0.8785400390625, 1.0498046875, 1.2210693359375, 1.392333984375, 1.5635986328125, 1.73486328125, 1.9061279296875, 2.077392578125, 2.2486572265625, 2.419921875, 2.5911865234375, 2.762451171875, 2.9337158203125, 3.10498046875, 3.2762451171875, 3.447509765625, 3.6187744140625, 3.7900390625, 3.9613037109375, 4.132568359375, 4.3038330078125, 4.47509765625, 4.6463623046875, 4.817626953125, 4.9888916015625, 5.16015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 10.0, 1.0, 5.0, 14.0, 16.0, 17.0, 25.0, 64.0, 150.0, 279.0, 219.0, 87.0, 32.0, 23.0, 3.0, 7.0, 10.0, 6.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72119140625, -0.7009735107421875, -0.680755615234375, -0.6605377197265625, -0.64031982421875, -0.6201019287109375, -0.599884033203125, -0.5796661376953125, -0.5594482421875, -0.5392303466796875, -0.519012451171875, -0.4987945556640625, -0.47857666015625, -0.4583587646484375, -0.438140869140625, -0.4179229736328125, -0.397705078125, -0.3774871826171875, -0.357269287109375, -0.3370513916015625, -0.31683349609375, -0.2966156005859375, -0.276397705078125, -0.2561798095703125, -0.2359619140625, -0.2157440185546875, -0.195526123046875, -0.1753082275390625, -0.15509033203125, -0.1348724365234375, -0.114654541015625, -0.0944366455078125, -0.07421875, -0.0540008544921875, -0.033782958984375, -0.0135650634765625, 0.00665283203125, 0.0268707275390625, 0.047088623046875, 0.0673065185546875, 0.0875244140625, 0.1077423095703125, 0.127960205078125, 0.1481781005859375, 0.16839599609375, 0.1886138916015625, 0.208831787109375, 0.2290496826171875, 0.249267578125, 0.2694854736328125, 0.289703369140625, 0.3099212646484375, 0.33013916015625, 0.3503570556640625, 0.370574951171875, 0.3907928466796875, 0.4110107421875, 0.4312286376953125, 0.451446533203125, 0.4716644287109375, 0.49188232421875, 0.5121002197265625, 0.532318115234375, 0.5525360107421875, 0.57275390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 10.0, 8.0, 8.0, 15.0, 17.0, 31.0, 37.0, 61.0, 95.0, 155.0, 242.0, 452.0, 850.0, 1734.0, 3938.0, 9936.0, 32895.0, 172651.0, 3240892.0, 632269.0, 69376.0, 17371.0, 6147.0, 2517.0, 1188.0, 559.0, 335.0, 158.0, 107.0, 56.0, 46.0, 32.0, 20.0, 18.0, 12.0, 10.0, 8.0, 5.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.48828125, -3.390716552734375, -3.29315185546875, -3.195587158203125, -3.0980224609375, -3.000457763671875, -2.90289306640625, -2.805328369140625, -2.707763671875, -2.610198974609375, -2.51263427734375, -2.415069580078125, -2.3175048828125, -2.219940185546875, -2.12237548828125, -2.024810791015625, -1.92724609375, -1.829681396484375, -1.73211669921875, -1.634552001953125, -1.5369873046875, -1.439422607421875, -1.34185791015625, -1.244293212890625, -1.146728515625, -1.049163818359375, -0.95159912109375, -0.854034423828125, -0.7564697265625, -0.658905029296875, -0.56134033203125, -0.463775634765625, -0.3662109375, -0.268646240234375, -0.17108154296875, -0.073516845703125, 0.0240478515625, 0.121612548828125, 0.21917724609375, 0.316741943359375, 0.414306640625, 0.511871337890625, 0.60943603515625, 0.707000732421875, 0.8045654296875, 0.902130126953125, 0.99969482421875, 1.097259521484375, 1.19482421875, 1.292388916015625, 1.38995361328125, 1.487518310546875, 1.5850830078125, 1.682647705078125, 1.78021240234375, 1.877777099609375, 1.975341796875, 2.072906494140625, 2.17047119140625, 2.268035888671875, 2.3656005859375, 2.463165283203125, 2.56072998046875, 2.658294677734375, 2.755859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 8.0, 19.0, 18.0, 22.0, 39.0, 48.0, 68.0, 107.0, 198.0, 393.0, 929.0, 1178.0, 434.0, 222.0, 120.0, 88.0, 48.0, 35.0, 25.0, 15.0, 5.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5362319946289062, -0.5177764892578125, -0.49932098388671875, -0.480865478515625, -0.46240997314453125, -0.4439544677734375, -0.42549896240234375, -0.40704345703125, -0.38858795166015625, -0.3701324462890625, -0.35167694091796875, -0.333221435546875, -0.31476593017578125, -0.2963104248046875, -0.27785491943359375, -0.2593994140625, -0.24094390869140625, -0.2224884033203125, -0.20403289794921875, -0.185577392578125, -0.16712188720703125, -0.1486663818359375, -0.13021087646484375, -0.11175537109375, -0.09329986572265625, -0.0748443603515625, -0.05638885498046875, -0.037933349609375, -0.01947784423828125, -0.0010223388671875, 0.01743316650390625, 0.035888671875, 0.05434417724609375, 0.0727996826171875, 0.09125518798828125, 0.109710693359375, 0.12816619873046875, 0.1466217041015625, 0.16507720947265625, 0.18353271484375, 0.20198822021484375, 0.2204437255859375, 0.23889923095703125, 0.257354736328125, 0.27581024169921875, 0.2942657470703125, 0.31272125244140625, 0.3311767578125, 0.34963226318359375, 0.3680877685546875, 0.38654327392578125, 0.404998779296875, 0.42345428466796875, 0.4419097900390625, 0.46036529541015625, 0.47882080078125, 0.49727630615234375, 0.5157318115234375, 0.5341873168945312, 0.552642822265625, 0.5710983276367188, 0.5895538330078125, 0.6080093383789062, 0.62646484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 39.0, 345.0, 500.0, 81.0, 21.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640778541564941, -6.228817939758301, -5.81685733795166, -5.4048967361450195, -4.992936134338379, -4.580975532531738, -4.1690144538879395, -3.757053852081299, -3.345093250274658, -2.9331326484680176, -2.521172046661377, -2.1092112064361572, -1.6972506046295166, -1.285290002822876, -0.8733291625976562, -0.4613685607910156, -0.049407958984375, 0.3625527024269104, 0.7745133638381958, 1.186474084854126, 1.5984346866607666, 2.0103952884674072, 2.422356128692627, 2.8343167304992676, 3.246277332305908, 3.658237934112549, 4.0701985359191895, 4.482159614562988, 4.894120216369629, 5.3060808181762695, 5.71804141998291, 6.130002021789551, 6.541963577270508, 6.953924179077148, 7.365884780883789, 7.77784538269043, 8.18980598449707, 8.601766586303711, 9.013727188110352, 9.425687789916992, 9.837648391723633, 10.249608993530273, 10.661569595336914, 11.073530197143555, 11.485490798950195, 11.897451400756836, 12.309412002563477, 12.721372604370117, 13.133334159851074, 13.545294761657715, 13.957255363464355, 14.369215965270996, 14.781176567077637, 15.193137168884277, 15.605098724365234, 16.017059326171875, 16.429019927978516, 16.840980529785156, 17.252941131591797, 17.664901733398438, 18.076862335205078, 18.48882293701172, 18.90078353881836, 19.312744140625, 19.72470474243164]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 7.0, 5.0, 13.0, 6.0, 19.0, 23.0, 32.0, 33.0, 45.0, 50.0, 74.0, 61.0, 88.0, 74.0, 58.0, 81.0, 57.0, 49.0, 47.0, 41.0, 33.0, 24.0, 20.0, 13.0, 14.0, 7.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380535364151001, -3.2862942218780518, -3.1920533180236816, -3.0978121757507324, -3.003571033477783, -2.909330129623413, -2.815088987350464, -2.7208480834960938, -2.6266069412231445, -2.5323657989501953, -2.438124895095825, -2.343883752822876, -2.249642848968506, -2.1554017066955566, -2.0611605644226074, -1.9669195413589478, -1.872678518295288, -1.7784374952316284, -1.6841964721679688, -1.5899553298950195, -1.4957143068313599, -1.4014732837677002, -1.307232141494751, -1.2129911184310913, -1.1187500953674316, -1.024509072303772, -0.9302679896354675, -0.8360269069671631, -0.7417858839035034, -0.6475448608398438, -0.5533037781715393, -0.45906269550323486, -0.3648219108581543, -0.27058085799217224, -0.17633980512619019, -0.08209875226020813, 0.012142300605773926, 0.10638335347175598, 0.20062440633773804, 0.2948654890060425, 0.38910651206970215, 0.4833475649356842, 0.5775886178016663, 0.6718297004699707, 0.7660707235336304, 0.86031174659729, 0.9545528292655945, 1.048793911933899, 1.1430349349975586, 1.2372759580612183, 1.331516981124878, 1.4257581233978271, 1.5199991464614868, 1.6142401695251465, 1.7084813117980957, 1.8027223348617554, 1.896963357925415, 1.9912043809890747, 2.0854454040527344, 2.1796865463256836, 2.273927688598633, 2.368168592453003, 2.462409734725952, 2.5566506385803223, 2.6508917808532715]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 7.0, 17.0, 36.0, 41.0, 42.0, 84.0, 168.0, 219.0, 423.0, 650.0, 1113.0, 2131.0, 3995.0, 7600.0, 15881.0, 36059.0, 221606.0, 638947.0, 72812.0, 23387.0, 11036.0, 5532.0, 2911.0, 1610.0, 904.0, 520.0, 289.0, 190.0, 105.0, 80.0, 56.0, 29.0, 14.0, 20.0, 8.0, 9.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8125, -3.704376220703125, -3.59625244140625, -3.488128662109375, -3.3800048828125, -3.271881103515625, -3.16375732421875, -3.055633544921875, -2.947509765625, -2.839385986328125, -2.73126220703125, -2.623138427734375, -2.5150146484375, -2.406890869140625, -2.29876708984375, -2.190643310546875, -2.08251953125, -1.974395751953125, -1.86627197265625, -1.758148193359375, -1.6500244140625, -1.541900634765625, -1.43377685546875, -1.325653076171875, -1.217529296875, -1.109405517578125, -1.00128173828125, -0.893157958984375, -0.7850341796875, -0.676910400390625, -0.56878662109375, -0.460662841796875, -0.3525390625, -0.244415283203125, -0.13629150390625, -0.028167724609375, 0.0799560546875, 0.188079833984375, 0.29620361328125, 0.404327392578125, 0.512451171875, 0.620574951171875, 0.72869873046875, 0.836822509765625, 0.9449462890625, 1.053070068359375, 1.16119384765625, 1.269317626953125, 1.37744140625, 1.485565185546875, 1.59368896484375, 1.701812744140625, 1.8099365234375, 1.918060302734375, 2.02618408203125, 2.134307861328125, 2.242431640625, 2.350555419921875, 2.45867919921875, 2.566802978515625, 2.6749267578125, 2.783050537109375, 2.89117431640625, 2.999298095703125, 3.107421875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 5.0, 7.0, 11.0, 13.0, 32.0, 60.0, 145.0, 239.0, 230.0, 128.0, 35.0, 18.0, 13.0, 9.0, 11.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74267578125, -0.7224960327148438, -0.7023162841796875, -0.6821365356445312, -0.661956787109375, -0.6417770385742188, -0.6215972900390625, -0.6014175415039062, -0.58123779296875, -0.5610580444335938, -0.5408782958984375, -0.5206985473632812, -0.500518798828125, -0.48033905029296875, -0.4601593017578125, -0.43997955322265625, -0.4197998046875, -0.39962005615234375, -0.3794403076171875, -0.35926055908203125, -0.339080810546875, -0.31890106201171875, -0.2987213134765625, -0.27854156494140625, -0.25836181640625, -0.23818206787109375, -0.2180023193359375, -0.19782257080078125, -0.177642822265625, -0.15746307373046875, -0.1372833251953125, -0.11710357666015625, -0.096923828125, -0.07674407958984375, -0.0565643310546875, -0.03638458251953125, -0.016204833984375, 0.00397491455078125, 0.0241546630859375, 0.04433441162109375, 0.06451416015625, 0.08469390869140625, 0.1048736572265625, 0.12505340576171875, 0.145233154296875, 0.16541290283203125, 0.1855926513671875, 0.20577239990234375, 0.2259521484375, 0.24613189697265625, 0.2663116455078125, 0.28649139404296875, 0.306671142578125, 0.32685089111328125, 0.3470306396484375, 0.36721038818359375, 0.38739013671875, 0.40756988525390625, 0.4277496337890625, 0.44792938232421875, 0.468109130859375, 0.48828887939453125, 0.5084686279296875, 0.5286483764648438, 0.548828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 3.0, 2.0, 9.0, 9.0, 8.0, 11.0, 25.0, 37.0, 30.0, 67.0, 91.0, 116.0, 172.0, 267.0, 470.0, 696.0, 1261.0, 2351.0, 5066.0, 12309.0, 33931.0, 105065.0, 281339.0, 354773.0, 162405.0, 54271.0, 18925.0, 7287.0, 3292.0, 1736.0, 879.0, 580.0, 362.0, 218.0, 144.0, 110.0, 61.0, 55.0, 34.0, 27.0, 18.0, 10.0, 6.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40625, -1.352569580078125, -1.29888916015625, -1.245208740234375, -1.1915283203125, -1.137847900390625, -1.08416748046875, -1.030487060546875, -0.976806640625, -0.923126220703125, -0.86944580078125, -0.815765380859375, -0.7620849609375, -0.708404541015625, -0.65472412109375, -0.601043701171875, -0.54736328125, -0.493682861328125, -0.44000244140625, -0.386322021484375, -0.3326416015625, -0.278961181640625, -0.22528076171875, -0.171600341796875, -0.117919921875, -0.064239501953125, -0.01055908203125, 0.043121337890625, 0.0968017578125, 0.150482177734375, 0.20416259765625, 0.257843017578125, 0.3115234375, 0.365203857421875, 0.41888427734375, 0.472564697265625, 0.5262451171875, 0.579925537109375, 0.63360595703125, 0.687286376953125, 0.740966796875, 0.794647216796875, 0.84832763671875, 0.902008056640625, 0.9556884765625, 1.009368896484375, 1.06304931640625, 1.116729736328125, 1.17041015625, 1.224090576171875, 1.27777099609375, 1.331451416015625, 1.3851318359375, 1.438812255859375, 1.49249267578125, 1.546173095703125, 1.599853515625, 1.653533935546875, 1.70721435546875, 1.760894775390625, 1.8145751953125, 1.868255615234375, 1.92193603515625, 1.975616455078125, 2.029296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 7.0, 8.0, 5.0, 11.0, 6.0, 12.0, 13.0, 18.0, 28.0, 19.0, 27.0, 29.0, 32.0, 36.0, 30.0, 37.0, 36.0, 40.0, 36.0, 38.0, 37.0, 45.0, 40.0, 41.0, 32.0, 42.0, 27.0, 30.0, 29.0, 27.0, 33.0, 23.0, 19.0, 18.0, 12.0, 8.0, 12.0, 14.0, 7.0, 6.0, 7.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.160614013671875, -1.11907958984375, -1.077545166015625, -1.0360107421875, -0.994476318359375, -0.95294189453125, -0.911407470703125, -0.869873046875, -0.828338623046875, -0.78680419921875, -0.745269775390625, -0.7037353515625, -0.662200927734375, -0.62066650390625, -0.579132080078125, -0.53759765625, -0.496063232421875, -0.45452880859375, -0.412994384765625, -0.3714599609375, -0.329925537109375, -0.28839111328125, -0.246856689453125, -0.205322265625, -0.163787841796875, -0.12225341796875, -0.080718994140625, -0.0391845703125, 0.002349853515625, 0.04388427734375, 0.085418701171875, 0.126953125, 0.168487548828125, 0.21002197265625, 0.251556396484375, 0.2930908203125, 0.334625244140625, 0.37615966796875, 0.417694091796875, 0.459228515625, 0.500762939453125, 0.54229736328125, 0.583831787109375, 0.6253662109375, 0.666900634765625, 0.70843505859375, 0.749969482421875, 0.79150390625, 0.833038330078125, 0.87457275390625, 0.916107177734375, 0.9576416015625, 0.999176025390625, 1.04071044921875, 1.082244873046875, 1.123779296875, 1.165313720703125, 1.20684814453125, 1.248382568359375, 1.2899169921875, 1.331451416015625, 1.37298583984375, 1.414520263671875, 1.4560546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 13.0, 9.0, 29.0, 37.0, 50.0, 101.0, 153.0, 308.0, 800.0, 3106.0, 31772.0, 981275.0, 26517.0, 2899.0, 768.0, 328.0, 148.0, 88.0, 51.0, 31.0, 15.0, 11.0, 10.0, 6.0, 9.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.5546875, -15.150390625, -14.74609375, -14.341796875, -13.9375, -13.533203125, -13.12890625, -12.724609375, -12.3203125, -11.916015625, -11.51171875, -11.107421875, -10.703125, -10.298828125, -9.89453125, -9.490234375, -9.0859375, -8.681640625, -8.27734375, -7.873046875, -7.46875, -7.064453125, -6.66015625, -6.255859375, -5.8515625, -5.447265625, -5.04296875, -4.638671875, -4.234375, -3.830078125, -3.42578125, -3.021484375, -2.6171875, -2.212890625, -1.80859375, -1.404296875, -1.0, -0.595703125, -0.19140625, 0.212890625, 0.6171875, 1.021484375, 1.42578125, 1.830078125, 2.234375, 2.638671875, 3.04296875, 3.447265625, 3.8515625, 4.255859375, 4.66015625, 5.064453125, 5.46875, 5.873046875, 6.27734375, 6.681640625, 7.0859375, 7.490234375, 7.89453125, 8.298828125, 8.703125, 9.107421875, 9.51171875, 9.916015625, 10.3203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 4.0, 0.0, 6.0, 10.0, 10.0, 18.0, 14.0, 24.0, 31.0, 49.0, 102.0, 157.0, 201.0, 143.0, 84.0, 41.0, 22.0, 21.0, 18.0, 16.0, 9.0, 2.0, 3.0, 6.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020503997802734375, -0.00019545480608940125, -0.00018586963415145874, -0.00017628446221351624, -0.00016669929027557373, -0.00015711411833763123, -0.00014752894639968872, -0.00013794377446174622, -0.0001283586025238037, -0.0001187734305858612, -0.0001091882586479187, -9.96030867099762e-05, -9.001791477203369e-05, -8.043274283409119e-05, -7.084757089614868e-05, -6.126239895820618e-05, -5.167722702026367e-05, -4.209205508232117e-05, -3.250688314437866e-05, -2.2921711206436157e-05, -1.3336539268493652e-05, -3.7513673305511475e-06, 5.833804607391357e-06, 1.5418976545333862e-05, 2.5004148483276367e-05, 3.458932042121887e-05, 4.417449235916138e-05, 5.375966429710388e-05, 6.334483623504639e-05, 7.293000817298889e-05, 8.25151801109314e-05, 9.21003520488739e-05, 0.0001016855239868164, 0.00011127069592475891, 0.00012085586786270142, 0.00013044103980064392, 0.00014002621173858643, 0.00014961138367652893, 0.00015919655561447144, 0.00016878172755241394, 0.00017836689949035645, 0.00018795207142829895, 0.00019753724336624146, 0.00020712241530418396, 0.00021670758724212646, 0.00022629275918006897, 0.00023587793111801147, 0.000245463103055954, 0.0002550482749938965, 0.000264633446931839, 0.0002742186188697815, 0.000283803790807724, 0.0002933889627456665, 0.000302974134683609, 0.0003125593066215515, 0.000322144478559494, 0.0003317296504974365, 0.00034131482243537903, 0.00035089999437332153, 0.00036048516631126404, 0.00037007033824920654, 0.00037965551018714905, 0.00038924068212509155, 0.00039882585406303406, 0.00040841102600097656]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 5.0, 1.0, 14.0, 18.0, 33.0, 33.0, 62.0, 130.0, 182.0, 392.0, 902.0, 2449.0, 10140.0, 105376.0, 856142.0, 61207.0, 7623.0, 2127.0, 857.0, 342.0, 219.0, 103.0, 67.0, 38.0, 23.0, 18.0, 15.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.25390625, -5.062255859375, -4.87060546875, -4.678955078125, -4.4873046875, -4.295654296875, -4.10400390625, -3.912353515625, -3.720703125, -3.529052734375, -3.33740234375, -3.145751953125, -2.9541015625, -2.762451171875, -2.57080078125, -2.379150390625, -2.1875, -1.995849609375, -1.80419921875, -1.612548828125, -1.4208984375, -1.229248046875, -1.03759765625, -0.845947265625, -0.654296875, -0.462646484375, -0.27099609375, -0.079345703125, 0.1123046875, 0.303955078125, 0.49560546875, 0.687255859375, 0.87890625, 1.070556640625, 1.26220703125, 1.453857421875, 1.6455078125, 1.837158203125, 2.02880859375, 2.220458984375, 2.412109375, 2.603759765625, 2.79541015625, 2.987060546875, 3.1787109375, 3.370361328125, 3.56201171875, 3.753662109375, 3.9453125, 4.136962890625, 4.32861328125, 4.520263671875, 4.7119140625, 4.903564453125, 5.09521484375, 5.286865234375, 5.478515625, 5.670166015625, 5.86181640625, 6.053466796875, 6.2451171875, 6.436767578125, 6.62841796875, 6.820068359375, 7.01171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 11.0, 18.0, 24.0, 45.0, 72.0, 109.0, 196.0, 222.0, 135.0, 56.0, 37.0, 26.0, 12.0, 12.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93359375, -3.76251220703125, -3.5914306640625, -3.42034912109375, -3.249267578125, -3.07818603515625, -2.9071044921875, -2.73602294921875, -2.56494140625, -2.39385986328125, -2.2227783203125, -2.05169677734375, -1.880615234375, -1.70953369140625, -1.5384521484375, -1.36737060546875, -1.1962890625, -1.02520751953125, -0.8541259765625, -0.68304443359375, -0.511962890625, -0.34088134765625, -0.1697998046875, 0.00128173828125, 0.17236328125, 0.34344482421875, 0.5145263671875, 0.68560791015625, 0.856689453125, 1.02777099609375, 1.1988525390625, 1.36993408203125, 1.541015625, 1.71209716796875, 1.8831787109375, 2.05426025390625, 2.225341796875, 2.39642333984375, 2.5675048828125, 2.73858642578125, 2.90966796875, 3.08074951171875, 3.2518310546875, 3.42291259765625, 3.593994140625, 3.76507568359375, 3.9361572265625, 4.10723876953125, 4.2783203125, 4.44940185546875, 4.6204833984375, 4.79156494140625, 4.962646484375, 5.13372802734375, 5.3048095703125, 5.47589111328125, 5.64697265625, 5.81805419921875, 5.9891357421875, 6.16021728515625, 6.331298828125, 6.50238037109375, 6.6734619140625, 6.84454345703125, 7.015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 11.0, 32.0, 122.0, 350.0, 362.0, 88.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.21833801269531, -62.761375427246094, -61.30441665649414, -59.84745407104492, -58.3904914855957, -56.933528900146484, -55.47657012939453, -54.01960754394531, -52.562644958496094, -51.105682373046875, -49.64872360229492, -48.1917610168457, -46.734798431396484, -45.277835845947266, -43.82087707519531, -42.363914489746094, -40.906951904296875, -39.449989318847656, -37.9930305480957, -36.536067962646484, -35.079105377197266, -33.62214279174805, -32.165184020996094, -30.708221435546875, -29.251262664794922, -27.794301986694336, -26.337339401245117, -24.88037872314453, -23.423416137695312, -21.966455459594727, -20.50949478149414, -19.052532196044922, -17.595569610595703, -16.138608932495117, -14.681646347045898, -13.224685668945312, -11.767723083496094, -10.310762405395508, -8.853800773620605, -7.396839141845703, -5.939877510070801, -4.482915878295898, -3.025954484939575, -1.568993091583252, -0.11203145980834961, 1.3449301719665527, 2.801891326904297, 4.258852958679199, 5.715814590454102, 7.172776222229004, 8.629737854003906, 10.086698532104492, 11.543661117553711, 13.000621795654297, 14.4575834274292, 15.914545059204102, 17.371505737304688, 18.828466415405273, 20.285429000854492, 21.742389678955078, 23.199352264404297, 24.656312942504883, 26.11327362060547, 27.570236206054688, 29.027198791503906]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 6.0, 5.0, 22.0, 24.0, 32.0, 48.0, 61.0, 78.0, 87.0, 99.0, 120.0, 88.0, 84.0, 68.0, 42.0, 31.0, 21.0, 16.0, 9.0, 5.0, 8.0, 5.0, 4.0, 0.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.642147064208984, -16.961448669433594, -16.28074836730957, -15.60004997253418, -14.919351577758789, -14.238652229309082, -13.557952880859375, -12.877254486083984, -12.196555137634277, -11.51585578918457, -10.83515739440918, -10.154458045959473, -9.473758697509766, -8.793060302734375, -8.112360954284668, -7.431662082672119, -6.75096321105957, -6.0702643394470215, -5.389565467834473, -4.708866119384766, -4.028167247772217, -3.347468376159668, -2.666769027709961, -1.986070156097412, -1.3053712844848633, -0.6246722936630249, 0.05602669715881348, 0.7367258071899414, 1.4174246788024902, 2.098123550415039, 2.778822898864746, 3.459521770477295, 4.140220642089844, 4.820919513702393, 5.501618385314941, 6.182317733764648, 6.863016605377197, 7.543715476989746, 8.224414825439453, 8.905113220214844, 9.58581256866455, 10.266511917114258, 10.947210311889648, 11.627909660339355, 12.308609008789062, 12.989307403564453, 13.67000675201416, 14.350706100463867, 15.031404495239258, 15.712103843688965, 16.392803192138672, 17.073501586914062, 17.754199981689453, 18.434898376464844, 19.115598678588867, 19.796297073364258, 20.47699737548828, 21.157695770263672, 21.838396072387695, 22.519094467163086, 23.199792861938477, 23.8804931640625, 24.56119155883789, 25.24188995361328, 25.922588348388672]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 5.0, 5.0, 1.0, 5.0, 9.0, 7.0, 17.0, 13.0, 25.0, 31.0, 27.0, 38.0, 50.0, 102.0, 128.0, 202.0, 246.0, 457.0, 860.0, 1714.0, 4538.0, 21146.0, 3456535.0, 684292.0, 16599.0, 3964.0, 1554.0, 649.0, 355.0, 206.0, 144.0, 111.0, 77.0, 52.0, 35.0, 20.0, 15.0, 15.0, 4.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0], "bins": [-11.2265625, -10.9306640625, -10.634765625, -10.3388671875, -10.04296875, -9.7470703125, -9.451171875, -9.1552734375, -8.859375, -8.5634765625, -8.267578125, -7.9716796875, -7.67578125, -7.3798828125, -7.083984375, -6.7880859375, -6.4921875, -6.1962890625, -5.900390625, -5.6044921875, -5.30859375, -5.0126953125, -4.716796875, -4.4208984375, -4.125, -3.8291015625, -3.533203125, -3.2373046875, -2.94140625, -2.6455078125, -2.349609375, -2.0537109375, -1.7578125, -1.4619140625, -1.166015625, -0.8701171875, -0.57421875, -0.2783203125, 0.017578125, 0.3134765625, 0.609375, 0.9052734375, 1.201171875, 1.4970703125, 1.79296875, 2.0888671875, 2.384765625, 2.6806640625, 2.9765625, 3.2724609375, 3.568359375, 3.8642578125, 4.16015625, 4.4560546875, 4.751953125, 5.0478515625, 5.34375, 5.6396484375, 5.935546875, 6.2314453125, 6.52734375, 6.8232421875, 7.119140625, 7.4150390625, 7.7109375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 12.0, 14.0, 33.0, 56.0, 135.0, 233.0, 239.0, 123.0, 59.0, 31.0, 22.0, 12.0, 6.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7678680419921875, -0.745208740234375, -0.7225494384765625, -0.69989013671875, -0.6772308349609375, -0.654571533203125, -0.6319122314453125, -0.6092529296875, -0.5865936279296875, -0.563934326171875, -0.5412750244140625, -0.51861572265625, -0.4959564208984375, -0.473297119140625, -0.4506378173828125, -0.427978515625, -0.4053192138671875, -0.382659912109375, -0.3600006103515625, -0.33734130859375, -0.3146820068359375, -0.292022705078125, -0.2693634033203125, -0.2467041015625, -0.2240447998046875, -0.201385498046875, -0.1787261962890625, -0.15606689453125, -0.1334075927734375, -0.110748291015625, -0.0880889892578125, -0.0654296875, -0.0427703857421875, -0.020111083984375, 0.0025482177734375, 0.02520751953125, 0.0478668212890625, 0.070526123046875, 0.0931854248046875, 0.1158447265625, 0.1385040283203125, 0.161163330078125, 0.1838226318359375, 0.20648193359375, 0.2291412353515625, 0.251800537109375, 0.2744598388671875, 0.297119140625, 0.3197784423828125, 0.342437744140625, 0.3650970458984375, 0.38775634765625, 0.4104156494140625, 0.433074951171875, 0.4557342529296875, 0.4783935546875, 0.5010528564453125, 0.523712158203125, 0.5463714599609375, 0.56903076171875, 0.5916900634765625, 0.614349365234375, 0.6370086669921875, 0.65966796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 8.0, 20.0, 27.0, 42.0, 129.0, 362.0, 2109.0, 59471.0, 4115126.0, 15477.0, 1029.0, 254.0, 89.0, 53.0, 27.0, 17.0, 8.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.140625, -10.68310546875, -10.2255859375, -9.76806640625, -9.310546875, -8.85302734375, -8.3955078125, -7.93798828125, -7.48046875, -7.02294921875, -6.5654296875, -6.10791015625, -5.650390625, -5.19287109375, -4.7353515625, -4.27783203125, -3.8203125, -3.36279296875, -2.9052734375, -2.44775390625, -1.990234375, -1.53271484375, -1.0751953125, -0.61767578125, -0.16015625, 0.29736328125, 0.7548828125, 1.21240234375, 1.669921875, 2.12744140625, 2.5849609375, 3.04248046875, 3.5, 3.95751953125, 4.4150390625, 4.87255859375, 5.330078125, 5.78759765625, 6.2451171875, 6.70263671875, 7.16015625, 7.61767578125, 8.0751953125, 8.53271484375, 8.990234375, 9.44775390625, 9.9052734375, 10.36279296875, 10.8203125, 11.27783203125, 11.7353515625, 12.19287109375, 12.650390625, 13.10791015625, 13.5654296875, 14.02294921875, 14.48046875, 14.93798828125, 15.3955078125, 15.85302734375, 16.310546875, 16.76806640625, 17.2255859375, 17.68310546875, 18.140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 10.0, 6.0, 26.0, 31.0, 45.0, 88.0, 166.0, 420.0, 1559.0, 1024.0, 345.0, 155.0, 78.0, 41.0, 22.0, 14.0, 13.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.0808181762695312, -1.0522613525390625, -1.0237045288085938, -0.995147705078125, -0.9665908813476562, -0.9380340576171875, -0.9094772338867188, -0.88092041015625, -0.8523635864257812, -0.8238067626953125, -0.7952499389648438, -0.766693115234375, -0.7381362915039062, -0.7095794677734375, -0.6810226440429688, -0.6524658203125, -0.6239089965820312, -0.5953521728515625, -0.5667953491210938, -0.538238525390625, -0.5096817016601562, -0.4811248779296875, -0.45256805419921875, -0.42401123046875, -0.39545440673828125, -0.3668975830078125, -0.33834075927734375, -0.309783935546875, -0.28122711181640625, -0.2526702880859375, -0.22411346435546875, -0.195556640625, -0.16699981689453125, -0.1384429931640625, -0.10988616943359375, -0.081329345703125, -0.05277252197265625, -0.0242156982421875, 0.00434112548828125, 0.03289794921875, 0.06145477294921875, 0.0900115966796875, 0.11856842041015625, 0.147125244140625, 0.17568206787109375, 0.2042388916015625, 0.23279571533203125, 0.2613525390625, 0.28990936279296875, 0.3184661865234375, 0.34702301025390625, 0.375579833984375, 0.40413665771484375, 0.4326934814453125, 0.46125030517578125, 0.48980712890625, 0.5183639526367188, 0.5469207763671875, 0.5754776000976562, 0.604034423828125, 0.6325912475585938, 0.6611480712890625, 0.6897048950195312, 0.71826171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 19.0, 29.0, 121.0, 267.0, 316.0, 169.0, 56.0, 17.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1326751708984375, -6.911565780639648, -6.690456390380859, -6.46934700012207, -6.248237609863281, -6.027128219604492, -5.806018829345703, -5.584909439086914, -5.363800048828125, -5.142690658569336, -4.921581268310547, -4.700471878051758, -4.479362487792969, -4.25825309753418, -4.037143707275391, -3.8160340785980225, -3.5949244499206543, -3.3738150596618652, -3.152705669403076, -2.931596279144287, -2.710486888885498, -2.489377498626709, -2.268267869949341, -2.0471584796905518, -1.8260490894317627, -1.6049396991729736, -1.3838303089141846, -1.162720799446106, -0.9416114091873169, -0.7205020189285278, -0.4993925094604492, -0.27828311920166016, -0.05717325210571289, 0.16393616795539856, 0.38504558801651, 0.6061550378799438, 0.8272644281387329, 1.048373818397522, 1.2694833278656006, 1.4905927181243896, 1.7117021083831787, 1.9328114986419678, 2.153920888900757, 2.375030517578125, 2.596139907836914, 2.817249298095703, 3.038358688354492, 3.2594680786132812, 3.4805774688720703, 3.7016868591308594, 3.9227962493896484, 4.1439056396484375, 4.365015029907227, 4.586124420166016, 4.807233810424805, 5.028343200683594, 5.249452590942383, 5.470561981201172, 5.691671371459961, 5.91278076171875, 6.133890151977539, 6.354999542236328, 6.576108932495117, 6.797218322753906, 7.0183281898498535]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 4.0, 17.0, 22.0, 27.0, 30.0, 40.0, 46.0, 50.0, 59.0, 72.0, 71.0, 54.0, 61.0, 69.0, 72.0, 58.0, 42.0, 45.0, 29.0, 24.0, 23.0, 22.0, 12.0, 8.0, 1.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6822056770324707, -2.595564126968384, -2.5089223384857178, -2.422280788421631, -2.335638999938965, -2.248997449874878, -2.162355661392212, -2.075714111328125, -1.989072322845459, -1.9024306535720825, -1.815788984298706, -1.7291473150253296, -1.6425056457519531, -1.5558639764785767, -1.4692223072052002, -1.3825807571411133, -1.2959390878677368, -1.2092974185943604, -1.1226557493209839, -1.0360140800476074, -0.949372410774231, -0.8627307415008545, -0.7760891318321228, -0.6894474625587463, -0.6028057932853699, -0.5161641240119934, -0.42952245473861694, -0.34288081526756287, -0.2562391459941864, -0.16959747672080994, -0.08295583724975586, 0.0036858320236206055, 0.09032750129699707, 0.17696917057037354, 0.26361083984375, 0.3502524793148041, 0.43689414858818054, 0.5235358476638794, 0.6101774573326111, 0.6968191266059875, 0.783460795879364, 0.8701024651527405, 0.9567441344261169, 1.0433857440948486, 1.130027413368225, 1.2166690826416016, 1.303310751914978, 1.3899524211883545, 1.476594090461731, 1.5632357597351074, 1.6498774290084839, 1.7365190982818604, 1.8231607675552368, 1.9098024368286133, 1.9964439868927002, 2.083085775375366, 2.169727325439453, 2.25636887550354, 2.343010663986206, 2.429652214050293, 2.516294002532959, 2.602935552597046, 2.689577341079712, 2.776218891143799, 2.862860679626465]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 9.0, 15.0, 23.0, 33.0, 55.0, 74.0, 152.0, 236.0, 457.0, 891.0, 2119.0, 6225.0, 30885.0, 450671.0, 511681.0, 34211.0, 6492.0, 2263.0, 965.0, 469.0, 254.0, 141.0, 89.0, 47.0, 27.0, 23.0, 13.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.80859375, -4.6484375, -4.48828125, -4.328125, -4.16796875, -4.0078125, -3.84765625, -3.6875, -3.52734375, -3.3671875, -3.20703125, -3.046875, -2.88671875, -2.7265625, -2.56640625, -2.40625, -2.24609375, -2.0859375, -1.92578125, -1.765625, -1.60546875, -1.4453125, -1.28515625, -1.125, -0.96484375, -0.8046875, -0.64453125, -0.484375, -0.32421875, -0.1640625, -0.00390625, 0.15625, 0.31640625, 0.4765625, 0.63671875, 0.796875, 0.95703125, 1.1171875, 1.27734375, 1.4375, 1.59765625, 1.7578125, 1.91796875, 2.078125, 2.23828125, 2.3984375, 2.55859375, 2.71875, 2.87890625, 3.0390625, 3.19921875, 3.359375, 3.51953125, 3.6796875, 3.83984375, 4.0, 4.16015625, 4.3203125, 4.48046875, 4.640625, 4.80078125, 4.9609375, 5.12109375, 5.28125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 2.0, 8.0, 14.0, 40.0, 72.0, 148.0, 189.0, 217.0, 147.0, 80.0, 40.0, 20.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7037353515625, -0.682373046875, -0.6610107421875, -0.6396484375, -0.6182861328125, -0.596923828125, -0.5755615234375, -0.55419921875, -0.5328369140625, -0.511474609375, -0.4901123046875, -0.46875, -0.4473876953125, -0.426025390625, -0.4046630859375, -0.38330078125, -0.3619384765625, -0.340576171875, -0.3192138671875, -0.2978515625, -0.2764892578125, -0.255126953125, -0.2337646484375, -0.21240234375, -0.1910400390625, -0.169677734375, -0.1483154296875, -0.126953125, -0.1055908203125, -0.084228515625, -0.0628662109375, -0.04150390625, -0.0201416015625, 0.001220703125, 0.0225830078125, 0.0439453125, 0.0653076171875, 0.086669921875, 0.1080322265625, 0.12939453125, 0.1507568359375, 0.172119140625, 0.1934814453125, 0.21484375, 0.2362060546875, 0.257568359375, 0.2789306640625, 0.30029296875, 0.3216552734375, 0.343017578125, 0.3643798828125, 0.3857421875, 0.4071044921875, 0.428466796875, 0.4498291015625, 0.47119140625, 0.4925537109375, 0.513916015625, 0.5352783203125, 0.556640625, 0.5780029296875, 0.599365234375, 0.6207275390625, 0.64208984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 9.0, 8.0, 13.0, 10.0, 17.0, 37.0, 42.0, 38.0, 58.0, 65.0, 109.0, 136.0, 177.0, 316.0, 504.0, 765.0, 1351.0, 2960.0, 7710.0, 25821.0, 100511.0, 341131.0, 390064.0, 127565.0, 32543.0, 9134.0, 3365.0, 1527.0, 840.0, 539.0, 332.0, 263.0, 171.0, 111.0, 80.0, 59.0, 37.0, 25.0, 26.0, 16.0, 21.0, 6.0, 6.0, 10.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.53515625, -2.456146240234375, -2.37713623046875, -2.298126220703125, -2.2191162109375, -2.140106201171875, -2.06109619140625, -1.982086181640625, -1.903076171875, -1.824066162109375, -1.74505615234375, -1.666046142578125, -1.5870361328125, -1.508026123046875, -1.42901611328125, -1.350006103515625, -1.27099609375, -1.191986083984375, -1.11297607421875, -1.033966064453125, -0.9549560546875, -0.875946044921875, -0.79693603515625, -0.717926025390625, -0.638916015625, -0.559906005859375, -0.48089599609375, -0.401885986328125, -0.3228759765625, -0.243865966796875, -0.16485595703125, -0.085845947265625, -0.0068359375, 0.072174072265625, 0.15118408203125, 0.230194091796875, 0.3092041015625, 0.388214111328125, 0.46722412109375, 0.546234130859375, 0.625244140625, 0.704254150390625, 0.78326416015625, 0.862274169921875, 0.9412841796875, 1.020294189453125, 1.09930419921875, 1.178314208984375, 1.25732421875, 1.336334228515625, 1.41534423828125, 1.494354248046875, 1.5733642578125, 1.652374267578125, 1.73138427734375, 1.810394287109375, 1.889404296875, 1.968414306640625, 2.04742431640625, 2.126434326171875, 2.2054443359375, 2.284454345703125, 2.36346435546875, 2.442474365234375, 2.521484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 11.0, 13.0, 16.0, 16.0, 14.0, 20.0, 29.0, 19.0, 29.0, 20.0, 28.0, 23.0, 34.0, 30.0, 38.0, 42.0, 47.0, 51.0, 31.0, 43.0, 39.0, 29.0, 35.0, 29.0, 32.0, 28.0, 29.0, 32.0, 23.0, 23.0, 19.0, 18.0, 15.0, 16.0, 10.0, 6.0, 6.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.388671875, -1.3437652587890625, -1.298858642578125, -1.2539520263671875, -1.20904541015625, -1.1641387939453125, -1.119232177734375, -1.0743255615234375, -1.0294189453125, -0.9845123291015625, -0.939605712890625, -0.8946990966796875, -0.84979248046875, -0.8048858642578125, -0.759979248046875, -0.7150726318359375, -0.670166015625, -0.6252593994140625, -0.580352783203125, -0.5354461669921875, -0.49053955078125, -0.4456329345703125, -0.400726318359375, -0.3558197021484375, -0.3109130859375, -0.2660064697265625, -0.221099853515625, -0.1761932373046875, -0.13128662109375, -0.0863800048828125, -0.041473388671875, 0.0034332275390625, 0.04833984375, 0.0932464599609375, 0.138153076171875, 0.1830596923828125, 0.22796630859375, 0.2728729248046875, 0.317779541015625, 0.3626861572265625, 0.4075927734375, 0.4524993896484375, 0.497406005859375, 0.5423126220703125, 0.58721923828125, 0.6321258544921875, 0.677032470703125, 0.7219390869140625, 0.766845703125, 0.8117523193359375, 0.856658935546875, 0.9015655517578125, 0.94647216796875, 0.9913787841796875, 1.036285400390625, 1.0811920166015625, 1.1260986328125, 1.1710052490234375, 1.215911865234375, 1.2608184814453125, 1.30572509765625, 1.3506317138671875, 1.395538330078125, 1.4404449462890625, 1.4853515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 11.0, 12.0, 2.0, 19.0, 33.0, 62.0, 89.0, 174.0, 318.0, 631.0, 1755.0, 5806.0, 30783.0, 362505.0, 586523.0, 48042.0, 7931.0, 2208.0, 818.0, 361.0, 179.0, 107.0, 56.0, 32.0, 32.0, 18.0, 8.0, 11.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.13787841796875, -2.0491943359375, -1.96051025390625, -1.871826171875, -1.78314208984375, -1.6944580078125, -1.60577392578125, -1.51708984375, -1.42840576171875, -1.3397216796875, -1.25103759765625, -1.162353515625, -1.07366943359375, -0.9849853515625, -0.89630126953125, -0.8076171875, -0.71893310546875, -0.6302490234375, -0.54156494140625, -0.452880859375, -0.36419677734375, -0.2755126953125, -0.18682861328125, -0.09814453125, -0.00946044921875, 0.0792236328125, 0.16790771484375, 0.256591796875, 0.34527587890625, 0.4339599609375, 0.52264404296875, 0.611328125, 0.70001220703125, 0.7886962890625, 0.87738037109375, 0.966064453125, 1.05474853515625, 1.1434326171875, 1.23211669921875, 1.32080078125, 1.40948486328125, 1.4981689453125, 1.58685302734375, 1.675537109375, 1.76422119140625, 1.8529052734375, 1.94158935546875, 2.0302734375, 2.11895751953125, 2.2076416015625, 2.29632568359375, 2.385009765625, 2.47369384765625, 2.5623779296875, 2.65106201171875, 2.73974609375, 2.82843017578125, 2.9171142578125, 3.00579833984375, 3.094482421875, 3.18316650390625, 3.2718505859375, 3.36053466796875, 3.44921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 2.0, 7.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 19.0, 12.0, 25.0, 23.0, 31.0, 28.0, 42.0, 57.0, 69.0, 73.0, 85.0, 79.0, 90.0, 72.0, 47.0, 44.0, 31.0, 31.0, 29.0, 14.0, 9.0, 11.0, 9.0, 9.0, 9.0, 3.0, 6.0, 3.0, 0.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022077560424804688, -0.0002140924334526062, -0.00020740926265716553, -0.00020072609186172485, -0.00019404292106628418, -0.0001873597502708435, -0.00018067657947540283, -0.00017399340867996216, -0.00016731023788452148, -0.0001606270670890808, -0.00015394389629364014, -0.00014726072549819946, -0.0001405775547027588, -0.00013389438390731812, -0.00012721121311187744, -0.00012052804231643677, -0.0001138448715209961, -0.00010716170072555542, -0.00010047852993011475, -9.379535913467407e-05, -8.71121883392334e-05, -8.042901754379272e-05, -7.374584674835205e-05, -6.706267595291138e-05, -6.03795051574707e-05, -5.369633436203003e-05, -4.7013163566589355e-05, -4.032999277114868e-05, -3.364682197570801e-05, -2.6963651180267334e-05, -2.028048038482666e-05, -1.3597309589385986e-05, -6.9141387939453125e-06, -2.3096799850463867e-07, 6.452202796936035e-06, 1.3135373592376709e-05, 1.9818544387817383e-05, 2.6501715183258057e-05, 3.318488597869873e-05, 3.9868056774139404e-05, 4.655122756958008e-05, 5.323439836502075e-05, 5.9917569160461426e-05, 6.66007399559021e-05, 7.328391075134277e-05, 7.996708154678345e-05, 8.665025234222412e-05, 9.33334231376648e-05, 0.00010001659393310547, 0.00010669976472854614, 0.00011338293552398682, 0.00012006610631942749, 0.00012674927711486816, 0.00013343244791030884, 0.0001401156187057495, 0.00014679878950119019, 0.00015348196029663086, 0.00016016513109207153, 0.0001668483018875122, 0.00017353147268295288, 0.00018021464347839355, 0.00018689781427383423, 0.0001935809850692749, 0.00020026415586471558, 0.00020694732666015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 15.0, 11.0, 28.0, 28.0, 41.0, 73.0, 100.0, 192.0, 346.0, 700.0, 1856.0, 6654.0, 37443.0, 455198.0, 495675.0, 39599.0, 7019.0, 1966.0, 696.0, 390.0, 191.0, 101.0, 62.0, 51.0, 29.0, 24.0, 14.0, 8.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.658203125, -2.559814453125, -2.46142578125, -2.363037109375, -2.2646484375, -2.166259765625, -2.06787109375, -1.969482421875, -1.87109375, -1.772705078125, -1.67431640625, -1.575927734375, -1.4775390625, -1.379150390625, -1.28076171875, -1.182373046875, -1.083984375, -0.985595703125, -0.88720703125, -0.788818359375, -0.6904296875, -0.592041015625, -0.49365234375, -0.395263671875, -0.296875, -0.198486328125, -0.10009765625, -0.001708984375, 0.0966796875, 0.195068359375, 0.29345703125, 0.391845703125, 0.490234375, 0.588623046875, 0.68701171875, 0.785400390625, 0.8837890625, 0.982177734375, 1.08056640625, 1.178955078125, 1.27734375, 1.375732421875, 1.47412109375, 1.572509765625, 1.6708984375, 1.769287109375, 1.86767578125, 1.966064453125, 2.064453125, 2.162841796875, 2.26123046875, 2.359619140625, 2.4580078125, 2.556396484375, 2.65478515625, 2.753173828125, 2.8515625, 2.949951171875, 3.04833984375, 3.146728515625, 3.2451171875, 3.343505859375, 3.44189453125, 3.540283203125, 3.638671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 5.0, 6.0, 5.0, 13.0, 18.0, 16.0, 21.0, 31.0, 26.0, 58.0, 55.0, 69.0, 104.0, 103.0, 94.0, 70.0, 68.0, 60.0, 28.0, 31.0, 23.0, 18.0, 17.0, 14.0, 12.0, 5.0, 2.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3642578125, -1.3237457275390625, -1.283233642578125, -1.2427215576171875, -1.20220947265625, -1.1616973876953125, -1.121185302734375, -1.0806732177734375, -1.0401611328125, -0.9996490478515625, -0.959136962890625, -0.9186248779296875, -0.87811279296875, -0.8376007080078125, -0.797088623046875, -0.7565765380859375, -0.716064453125, -0.6755523681640625, -0.635040283203125, -0.5945281982421875, -0.55401611328125, -0.5135040283203125, -0.472991943359375, -0.4324798583984375, -0.3919677734375, -0.3514556884765625, -0.310943603515625, -0.2704315185546875, -0.22991943359375, -0.1894073486328125, -0.148895263671875, -0.1083831787109375, -0.06787109375, -0.0273590087890625, 0.013153076171875, 0.0536651611328125, 0.09417724609375, 0.1346893310546875, 0.175201416015625, 0.2157135009765625, 0.2562255859375, 0.2967376708984375, 0.337249755859375, 0.3777618408203125, 0.41827392578125, 0.4587860107421875, 0.499298095703125, 0.5398101806640625, 0.580322265625, 0.6208343505859375, 0.661346435546875, 0.7018585205078125, 0.74237060546875, 0.7828826904296875, 0.823394775390625, 0.8639068603515625, 0.9044189453125, 0.9449310302734375, 0.985443115234375, 1.0259552001953125, 1.06646728515625, 1.1069793701171875, 1.147491455078125, 1.1880035400390625, 1.228515625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 24.0, 65.0, 202.0, 331.0, 246.0, 72.0, 36.0, 5.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.010255813598633, -13.82130241394043, -12.63234806060791, -11.443394660949707, -10.254440307617188, -9.065486907958984, -7.876533508300781, -6.687579154968262, -5.498625755310059, -4.309671878814697, -3.120718240737915, -1.9317646026611328, -0.7428107261657715, 0.44614315032958984, 1.635096549987793, 2.8240509033203125, 4.013004302978516, 5.201958179473877, 6.390912055969238, 7.579865455627441, 8.768819808959961, 9.957773208618164, 11.146726608276367, 12.335680961608887, 13.52463436126709, 14.713587760925293, 15.902542114257812, 17.091495513916016, 18.28044891357422, 19.469402313232422, 20.658355712890625, 21.84731101989746, 23.036266326904297, 24.2252197265625, 25.414173126220703, 26.603126525878906, 27.792081832885742, 28.981035232543945, 30.16998863220215, 31.358943939208984, 32.54789733886719, 33.73685073852539, 34.925804138183594, 36.1147575378418, 37.3037109375, 38.49266815185547, 39.681617736816406, 40.870574951171875, 42.05952453613281, 43.248477935791016, 44.43743133544922, 45.62638473510742, 46.815338134765625, 48.004295349121094, 49.19324493408203, 50.3822021484375, 51.5711555480957, 52.760108947753906, 53.94906234741211, 55.13801574707031, 56.326969146728516, 57.51592254638672, 58.70487976074219, 59.89383316040039, 61.082786560058594]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 8.0, 15.0, 25.0, 32.0, 40.0, 40.0, 56.0, 47.0, 60.0, 87.0, 79.0, 70.0, 64.0, 57.0, 52.0, 48.0, 44.0, 37.0, 26.0, 27.0, 14.0, 18.0, 13.0, 2.0, 7.0, 0.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-28.47422218322754, -27.817100524902344, -27.159976959228516, -26.50285530090332, -25.845733642578125, -25.188610076904297, -24.5314884185791, -23.874366760253906, -23.217243194580078, -22.560121536254883, -21.902997970581055, -21.24587631225586, -20.58875274658203, -19.931631088256836, -19.27450942993164, -18.617385864257812, -17.960264205932617, -17.303142547607422, -16.646018981933594, -15.988897323608398, -15.331774711608887, -14.674652099609375, -14.01753044128418, -13.360407829284668, -12.703285217285156, -12.046162605285645, -11.389039993286133, -10.731918334960938, -10.074795722961426, -9.417673110961914, -8.760551452636719, -8.103428840637207, -7.4463043212890625, -6.789181709289551, -6.132059574127197, -5.474937438964844, -4.817814826965332, -4.16069221496582, -3.503570079803467, -2.8464479446411133, -2.1893253326416016, -1.532202959060669, -0.8750805854797363, -0.2179582118988037, 0.4391641616821289, 1.0962865352630615, 1.7534089088439941, 2.4105310440063477, 3.0676536560058594, 3.724776029586792, 4.381898403167725, 5.039020538330078, 5.69614315032959, 6.353265762329102, 7.010387897491455, 7.667510032653809, 8.32463264465332, 8.981755256652832, 9.638877868652344, 10.295999526977539, 10.95312213897705, 11.610244750976562, 12.267366409301758, 12.92448902130127, 13.581611633300781]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 17.0, 18.0, 43.0, 80.0, 181.0, 657.0, 6286.0, 4176971.0, 9200.0, 514.0, 177.0, 64.0, 37.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.796875, -30.876953125, -29.95703125, -29.037109375, -28.1171875, -27.197265625, -26.27734375, -25.357421875, -24.4375, -23.517578125, -22.59765625, -21.677734375, -20.7578125, -19.837890625, -18.91796875, -17.998046875, -17.078125, -16.158203125, -15.23828125, -14.318359375, -13.3984375, -12.478515625, -11.55859375, -10.638671875, -9.71875, -8.798828125, -7.87890625, -6.958984375, -6.0390625, -5.119140625, -4.19921875, -3.279296875, -2.359375, -1.439453125, -0.51953125, 0.400390625, 1.3203125, 2.240234375, 3.16015625, 4.080078125, 5.0, 5.919921875, 6.83984375, 7.759765625, 8.6796875, 9.599609375, 10.51953125, 11.439453125, 12.359375, 13.279296875, 14.19921875, 15.119140625, 16.0390625, 16.958984375, 17.87890625, 18.798828125, 19.71875, 20.638671875, 21.55859375, 22.478515625, 23.3984375, 24.318359375, 25.23828125, 26.158203125, 27.078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 16.0, 23.0, 40.0, 90.0, 155.0, 147.0, 194.0, 133.0, 81.0, 59.0, 23.0, 11.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.953125, -0.9249801635742188, -0.8968353271484375, -0.8686904907226562, -0.840545654296875, -0.8124008178710938, -0.7842559814453125, -0.7561111450195312, -0.72796630859375, -0.6998214721679688, -0.6716766357421875, -0.6435317993164062, -0.615386962890625, -0.5872421264648438, -0.5590972900390625, -0.5309524536132812, -0.5028076171875, -0.47466278076171875, -0.4465179443359375, -0.41837310791015625, -0.390228271484375, -0.36208343505859375, -0.3339385986328125, -0.30579376220703125, -0.27764892578125, -0.24950408935546875, -0.2213592529296875, -0.19321441650390625, -0.165069580078125, -0.13692474365234375, -0.1087799072265625, -0.08063507080078125, -0.052490234375, -0.02434539794921875, 0.0037994384765625, 0.03194427490234375, 0.060089111328125, 0.08823394775390625, 0.1163787841796875, 0.14452362060546875, 0.17266845703125, 0.20081329345703125, 0.2289581298828125, 0.25710296630859375, 0.285247802734375, 0.31339263916015625, 0.3415374755859375, 0.36968231201171875, 0.3978271484375, 0.42597198486328125, 0.4541168212890625, 0.48226165771484375, 0.510406494140625, 0.5385513305664062, 0.5666961669921875, 0.5948410034179688, 0.62298583984375, 0.6511306762695312, 0.6792755126953125, 0.7074203491210938, 0.735565185546875, 0.7637100219726562, 0.7918548583984375, 0.8199996948242188, 0.84814453125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 8.0, 12.0, 15.0, 23.0, 24.0, 46.0, 88.0, 176.0, 398.0, 1144.0, 4255.0, 19691.0, 170593.0, 3616043.0, 341041.0, 31284.0, 6493.0, 1790.0, 575.0, 237.0, 134.0, 82.0, 41.0, 20.0, 20.0, 11.0, 6.0, 9.0, 7.0, 7.0, 5.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.091796875, -2.971099853515625, -2.85040283203125, -2.729705810546875, -2.6090087890625, -2.488311767578125, -2.36761474609375, -2.246917724609375, -2.126220703125, -2.005523681640625, -1.88482666015625, -1.764129638671875, -1.6434326171875, -1.522735595703125, -1.40203857421875, -1.281341552734375, -1.16064453125, -1.039947509765625, -0.91925048828125, -0.798553466796875, -0.6778564453125, -0.557159423828125, -0.43646240234375, -0.315765380859375, -0.195068359375, -0.074371337890625, 0.04632568359375, 0.167022705078125, 0.2877197265625, 0.408416748046875, 0.52911376953125, 0.649810791015625, 0.7705078125, 0.891204833984375, 1.01190185546875, 1.132598876953125, 1.2532958984375, 1.373992919921875, 1.49468994140625, 1.615386962890625, 1.736083984375, 1.856781005859375, 1.97747802734375, 2.098175048828125, 2.2188720703125, 2.339569091796875, 2.46026611328125, 2.580963134765625, 2.70166015625, 2.822357177734375, 2.94305419921875, 3.063751220703125, 3.1844482421875, 3.305145263671875, 3.42584228515625, 3.546539306640625, 3.667236328125, 3.787933349609375, 3.90863037109375, 4.029327392578125, 4.1500244140625, 4.270721435546875, 4.39141845703125, 4.512115478515625, 4.6328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 8.0, 4.0, 7.0, 12.0, 15.0, 22.0, 23.0, 56.0, 92.0, 131.0, 208.0, 339.0, 753.0, 1240.0, 462.0, 250.0, 133.0, 87.0, 58.0, 38.0, 30.0, 33.0, 12.0, 13.0, 4.0, 12.0, 3.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6179046630859375, -0.598114013671875, -0.5783233642578125, -0.55853271484375, -0.5387420654296875, -0.518951416015625, -0.4991607666015625, -0.4793701171875, -0.4595794677734375, -0.439788818359375, -0.4199981689453125, -0.40020751953125, -0.3804168701171875, -0.360626220703125, -0.3408355712890625, -0.321044921875, -0.3012542724609375, -0.281463623046875, -0.2616729736328125, -0.24188232421875, -0.2220916748046875, -0.202301025390625, -0.1825103759765625, -0.1627197265625, -0.1429290771484375, -0.123138427734375, -0.1033477783203125, -0.08355712890625, -0.0637664794921875, -0.043975830078125, -0.0241851806640625, -0.00439453125, 0.0153961181640625, 0.035186767578125, 0.0549774169921875, 0.07476806640625, 0.0945587158203125, 0.114349365234375, 0.1341400146484375, 0.1539306640625, 0.1737213134765625, 0.193511962890625, 0.2133026123046875, 0.23309326171875, 0.2528839111328125, 0.272674560546875, 0.2924652099609375, 0.312255859375, 0.3320465087890625, 0.351837158203125, 0.3716278076171875, 0.39141845703125, 0.4112091064453125, 0.430999755859375, 0.4507904052734375, 0.4705810546875, 0.4903717041015625, 0.510162353515625, 0.5299530029296875, 0.54974365234375, 0.5695343017578125, 0.589324951171875, 0.6091156005859375, 0.62890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 15.0, 29.0, 46.0, 93.0, 158.0, 228.0, 165.0, 138.0, 68.0, 30.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2774910926818848, -3.1247718334198, -2.972052574157715, -2.81933331489563, -2.666614055633545, -2.51389479637146, -2.361175537109375, -2.208456516265869, -2.055737018585205, -1.9030177593231201, -1.7502985000610352, -1.5975792407989502, -1.4448599815368652, -1.2921407222747803, -1.1394215822219849, -0.9867023229598999, -0.8339831829071045, -0.6812639236450195, -0.5285446643829346, -0.3758254647254944, -0.22310620546340942, -0.07038694620132446, 0.08233225345611572, 0.23505151271820068, 0.38777077198028564, 0.5404900312423706, 0.6932092905044556, 0.8459284901618958, 0.9986477494239807, 1.151366949081421, 1.3040862083435059, 1.4568054676055908, 1.6095247268676758, 1.7622439861297607, 1.9149632453918457, 2.0676825046539307, 2.2204017639160156, 2.3731210231781006, 2.5258402824401855, 2.6785593032836914, 2.8312788009643555, 2.9839980602264404, 3.1367173194885254, 3.2894365787506104, 3.4421558380126953, 3.5948750972747803, 3.7475943565368652, 3.900313377380371, 4.053032875061035, 4.205751895904541, 4.358471393585205, 4.511190414428711, 4.663909912109375, 4.816628932952881, 4.969348430633545, 5.122067451477051, 5.274786472320557, 5.4275054931640625, 5.580224990844727, 5.732944011688232, 5.8856635093688965, 6.038382530212402, 6.191102027893066, 6.343821048736572, 6.496540546417236]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 14.0, 10.0, 11.0, 15.0, 13.0, 25.0, 28.0, 36.0, 33.0, 30.0, 46.0, 42.0, 54.0, 55.0, 54.0, 45.0, 42.0, 52.0, 43.0, 45.0, 43.0, 43.0, 32.0, 19.0, 37.0, 27.0, 23.0, 12.0, 16.0, 6.0, 8.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.2708489894866943, -2.2000014781951904, -2.1291539669036865, -2.0583064556121826, -1.9874589443206787, -1.9166114330291748, -1.845763921737671, -1.774916410446167, -1.704068899154663, -1.6332213878631592, -1.5623738765716553, -1.4915263652801514, -1.4206788539886475, -1.3498313426971436, -1.2789838314056396, -1.2081363201141357, -1.1372888088226318, -1.066441297531128, -0.995593786239624, -0.9247462749481201, -0.8538987636566162, -0.7830512523651123, -0.7122037410736084, -0.6413562297821045, -0.5705087184906006, -0.4996612071990967, -0.4288136959075928, -0.35796618461608887, -0.28711867332458496, -0.21627116203308105, -0.14542365074157715, -0.07457613945007324, -0.003728628158569336, 0.06711888313293457, 0.13796639442443848, 0.20881390571594238, 0.2796614170074463, 0.3505089282989502, 0.4213564395904541, 0.492203950881958, 0.5630514621734619, 0.6338989734649658, 0.7047464847564697, 0.7755939960479736, 0.8464415073394775, 0.9172890186309814, 0.9881365299224854, 1.0589840412139893, 1.1298315525054932, 1.200679063796997, 1.271526575088501, 1.3423740863800049, 1.4132215976715088, 1.4840691089630127, 1.5549166202545166, 1.6257641315460205, 1.6966116428375244, 1.7674591541290283, 1.8383066654205322, 1.9091541767120361, 1.98000168800354, 2.050849199295044, 2.121696710586548, 2.1925442218780518, 2.2633917331695557]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 9.0, 8.0, 12.0, 17.0, 32.0, 50.0, 80.0, 141.0, 261.0, 540.0, 1127.0, 2724.0, 8274.0, 69579.0, 725778.0, 218001.0, 15044.0, 3808.0, 1562.0, 755.0, 329.0, 174.0, 92.0, 54.0, 24.0, 20.0, 14.0, 7.0, 7.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.95947265625, -4.7978515625, -4.63623046875, -4.474609375, -4.31298828125, -4.1513671875, -3.98974609375, -3.828125, -3.66650390625, -3.5048828125, -3.34326171875, -3.181640625, -3.02001953125, -2.8583984375, -2.69677734375, -2.53515625, -2.37353515625, -2.2119140625, -2.05029296875, -1.888671875, -1.72705078125, -1.5654296875, -1.40380859375, -1.2421875, -1.08056640625, -0.9189453125, -0.75732421875, -0.595703125, -0.43408203125, -0.2724609375, -0.11083984375, 0.05078125, 0.21240234375, 0.3740234375, 0.53564453125, 0.697265625, 0.85888671875, 1.0205078125, 1.18212890625, 1.34375, 1.50537109375, 1.6669921875, 1.82861328125, 1.990234375, 2.15185546875, 2.3134765625, 2.47509765625, 2.63671875, 2.79833984375, 2.9599609375, 3.12158203125, 3.283203125, 3.44482421875, 3.6064453125, 3.76806640625, 3.9296875, 4.09130859375, 4.2529296875, 4.41455078125, 4.576171875, 4.73779296875, 4.8994140625, 5.06103515625, 5.22265625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 25.0, 52.0, 85.0, 133.0, 164.0, 184.0, 142.0, 108.0, 46.0, 22.0, 12.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94580078125, -0.9179153442382812, -0.8900299072265625, -0.8621444702148438, -0.834259033203125, -0.8063735961914062, -0.7784881591796875, -0.7506027221679688, -0.72271728515625, -0.6948318481445312, -0.6669464111328125, -0.6390609741210938, -0.611175537109375, -0.5832901000976562, -0.5554046630859375, -0.5275192260742188, -0.4996337890625, -0.47174835205078125, -0.4438629150390625, -0.41597747802734375, -0.388092041015625, -0.36020660400390625, -0.3323211669921875, -0.30443572998046875, -0.27655029296875, -0.24866485595703125, -0.2207794189453125, -0.19289398193359375, -0.165008544921875, -0.13712310791015625, -0.1092376708984375, -0.08135223388671875, -0.053466796875, -0.02558135986328125, 0.0023040771484375, 0.03018951416015625, 0.058074951171875, 0.08596038818359375, 0.1138458251953125, 0.14173126220703125, 0.16961669921875, 0.19750213623046875, 0.2253875732421875, 0.25327301025390625, 0.281158447265625, 0.30904388427734375, 0.3369293212890625, 0.36481475830078125, 0.3927001953125, 0.42058563232421875, 0.4484710693359375, 0.47635650634765625, 0.504241943359375, 0.5321273803710938, 0.5600128173828125, 0.5878982543945312, 0.61578369140625, 0.6436691284179688, 0.6715545654296875, 0.6994400024414062, 0.727325439453125, 0.7552108764648438, 0.7830963134765625, 0.8109817504882812, 0.8388671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 11.0, 13.0, 17.0, 38.0, 47.0, 65.0, 90.0, 122.0, 205.0, 278.0, 445.0, 827.0, 1652.0, 3791.0, 11065.0, 42449.0, 194061.0, 463074.0, 250685.0, 57353.0, 13760.0, 4321.0, 1810.0, 927.0, 513.0, 313.0, 190.0, 121.0, 83.0, 70.0, 44.0, 24.0, 24.0, 16.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.178558349609375, -2.09344482421875, -2.008331298828125, -1.9232177734375, -1.838104248046875, -1.75299072265625, -1.667877197265625, -1.582763671875, -1.497650146484375, -1.41253662109375, -1.327423095703125, -1.2423095703125, -1.157196044921875, -1.07208251953125, -0.986968994140625, -0.90185546875, -0.816741943359375, -0.73162841796875, -0.646514892578125, -0.5614013671875, -0.476287841796875, -0.39117431640625, -0.306060791015625, -0.220947265625, -0.135833740234375, -0.05072021484375, 0.034393310546875, 0.1195068359375, 0.204620361328125, 0.28973388671875, 0.374847412109375, 0.4599609375, 0.545074462890625, 0.63018798828125, 0.715301513671875, 0.8004150390625, 0.885528564453125, 0.97064208984375, 1.055755615234375, 1.140869140625, 1.225982666015625, 1.31109619140625, 1.396209716796875, 1.4813232421875, 1.566436767578125, 1.65155029296875, 1.736663818359375, 1.82177734375, 1.906890869140625, 1.99200439453125, 2.077117919921875, 2.1622314453125, 2.247344970703125, 2.33245849609375, 2.417572021484375, 2.502685546875, 2.587799072265625, 2.67291259765625, 2.758026123046875, 2.8431396484375, 2.928253173828125, 3.01336669921875, 3.098480224609375, 3.18359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 4.0, 10.0, 12.0, 13.0, 14.0, 11.0, 13.0, 22.0, 30.0, 23.0, 40.0, 42.0, 31.0, 65.0, 47.0, 65.0, 58.0, 56.0, 59.0, 49.0, 42.0, 54.0, 51.0, 42.0, 36.0, 16.0, 18.0, 16.0, 17.0, 12.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.1077880859375, -2.031982421875, -1.9561767578125, -1.88037109375, -1.8045654296875, -1.728759765625, -1.6529541015625, -1.5771484375, -1.5013427734375, -1.425537109375, -1.3497314453125, -1.27392578125, -1.1981201171875, -1.122314453125, -1.0465087890625, -0.970703125, -0.8948974609375, -0.819091796875, -0.7432861328125, -0.66748046875, -0.5916748046875, -0.515869140625, -0.4400634765625, -0.3642578125, -0.2884521484375, -0.212646484375, -0.1368408203125, -0.06103515625, 0.0147705078125, 0.090576171875, 0.1663818359375, 0.2421875, 0.3179931640625, 0.393798828125, 0.4696044921875, 0.54541015625, 0.6212158203125, 0.697021484375, 0.7728271484375, 0.8486328125, 0.9244384765625, 1.000244140625, 1.0760498046875, 1.15185546875, 1.2276611328125, 1.303466796875, 1.3792724609375, 1.455078125, 1.5308837890625, 1.606689453125, 1.6824951171875, 1.75830078125, 1.8341064453125, 1.909912109375, 1.9857177734375, 2.0615234375, 2.1373291015625, 2.213134765625, 2.2889404296875, 2.36474609375, 2.4405517578125, 2.516357421875, 2.5921630859375, 2.66796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 2.0, 5.0, 8.0, 10.0, 22.0, 43.0, 62.0, 125.0, 231.0, 493.0, 1501.0, 5584.0, 29377.0, 247921.0, 644279.0, 100084.0, 14067.0, 3071.0, 938.0, 380.0, 138.0, 86.0, 39.0, 36.0, 21.0, 8.0, 5.0, 7.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.435546875, -2.373565673828125, -2.31158447265625, -2.249603271484375, -2.1876220703125, -2.125640869140625, -2.06365966796875, -2.001678466796875, -1.939697265625, -1.877716064453125, -1.81573486328125, -1.753753662109375, -1.6917724609375, -1.629791259765625, -1.56781005859375, -1.505828857421875, -1.44384765625, -1.381866455078125, -1.31988525390625, -1.257904052734375, -1.1959228515625, -1.133941650390625, -1.07196044921875, -1.009979248046875, -0.947998046875, -0.886016845703125, -0.82403564453125, -0.762054443359375, -0.7000732421875, -0.638092041015625, -0.57611083984375, -0.514129638671875, -0.4521484375, -0.390167236328125, -0.32818603515625, -0.266204833984375, -0.2042236328125, -0.142242431640625, -0.08026123046875, -0.018280029296875, 0.043701171875, 0.105682373046875, 0.16766357421875, 0.229644775390625, 0.2916259765625, 0.353607177734375, 0.41558837890625, 0.477569580078125, 0.53955078125, 0.601531982421875, 0.66351318359375, 0.725494384765625, 0.7874755859375, 0.849456787109375, 0.91143798828125, 0.973419189453125, 1.035400390625, 1.097381591796875, 1.15936279296875, 1.221343994140625, 1.2833251953125, 1.345306396484375, 1.40728759765625, 1.469268798828125, 1.53125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 12.0, 13.0, 4.0, 13.0, 15.0, 22.0, 17.0, 32.0, 41.0, 53.0, 52.0, 71.0, 92.0, 103.0, 95.0, 56.0, 56.0, 53.0, 37.0, 30.0, 29.0, 19.0, 13.0, 12.0, 11.0, 9.0, 12.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021351128816604614, -0.00020767748355865479, -0.00020184367895126343, -0.00019600987434387207, -0.0001901760697364807, -0.00018434226512908936, -0.000178508460521698, -0.00017267465591430664, -0.00016684085130691528, -0.00016100704669952393, -0.00015517324209213257, -0.0001493394374847412, -0.00014350563287734985, -0.0001376718282699585, -0.00013183802366256714, -0.00012600421905517578, -0.00012017041444778442, -0.00011433660984039307, -0.00010850280523300171, -0.00010266900062561035, -9.6835196018219e-05, -9.100139141082764e-05, -8.516758680343628e-05, -7.933378219604492e-05, -7.349997758865356e-05, -6.766617298126221e-05, -6.183236837387085e-05, -5.599856376647949e-05, -5.0164759159088135e-05, -4.433095455169678e-05, -3.849714994430542e-05, -3.266334533691406e-05, -2.6829540729522705e-05, -2.0995736122131348e-05, -1.516193151473999e-05, -9.328126907348633e-06, -3.4943222999572754e-06, 2.339482307434082e-06, 8.17328691482544e-06, 1.4007091522216797e-05, 1.9840896129608154e-05, 2.5674700736999512e-05, 3.150850534439087e-05, 3.7342309951782227e-05, 4.3176114559173584e-05, 4.900991916656494e-05, 5.48437237739563e-05, 6.0677528381347656e-05, 6.651133298873901e-05, 7.234513759613037e-05, 7.817894220352173e-05, 8.401274681091309e-05, 8.984655141830444e-05, 9.56803560256958e-05, 0.00010151416063308716, 0.00010734796524047852, 0.00011318176984786987, 0.00011901557445526123, 0.0001248493790626526, 0.00013068318367004395, 0.0001365169882774353, 0.00014235079288482666, 0.00014818459749221802, 0.00015401840209960938]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 4.0, 6.0, 9.0, 16.0, 13.0, 27.0, 25.0, 48.0, 68.0, 86.0, 126.0, 165.0, 260.0, 344.0, 663.0, 1156.0, 2543.0, 6193.0, 19096.0, 68777.0, 293039.0, 494105.0, 114710.0, 30721.0, 9242.0, 3368.0, 1440.0, 794.0, 484.0, 296.0, 187.0, 143.0, 110.0, 72.0, 52.0, 40.0, 31.0, 21.0, 18.0, 12.0, 7.0, 4.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3369140625, -1.2911224365234375, -1.245330810546875, -1.1995391845703125, -1.15374755859375, -1.1079559326171875, -1.062164306640625, -1.0163726806640625, -0.9705810546875, -0.9247894287109375, -0.878997802734375, -0.8332061767578125, -0.78741455078125, -0.7416229248046875, -0.695831298828125, -0.6500396728515625, -0.604248046875, -0.5584564208984375, -0.512664794921875, -0.4668731689453125, -0.42108154296875, -0.3752899169921875, -0.329498291015625, -0.2837066650390625, -0.2379150390625, -0.1921234130859375, -0.146331787109375, -0.1005401611328125, -0.05474853515625, -0.0089569091796875, 0.036834716796875, 0.0826263427734375, 0.12841796875, 0.1742095947265625, 0.220001220703125, 0.2657928466796875, 0.31158447265625, 0.3573760986328125, 0.403167724609375, 0.4489593505859375, 0.4947509765625, 0.5405426025390625, 0.586334228515625, 0.6321258544921875, 0.67791748046875, 0.7237091064453125, 0.769500732421875, 0.8152923583984375, 0.861083984375, 0.9068756103515625, 0.952667236328125, 0.9984588623046875, 1.04425048828125, 1.0900421142578125, 1.135833740234375, 1.1816253662109375, 1.2274169921875, 1.2732086181640625, 1.319000244140625, 1.3647918701171875, 1.41058349609375, 1.4563751220703125, 1.502166748046875, 1.5479583740234375, 1.59375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 7.0, 11.0, 12.0, 13.0, 21.0, 21.0, 26.0, 28.0, 31.0, 40.0, 37.0, 68.0, 79.0, 99.0, 90.0, 87.0, 72.0, 50.0, 38.0, 29.0, 23.0, 24.0, 14.0, 20.0, 10.0, 8.0, 9.0, 5.0, 11.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0185546875, -0.9834747314453125, -0.948394775390625, -0.9133148193359375, -0.87823486328125, -0.8431549072265625, -0.808074951171875, -0.7729949951171875, -0.7379150390625, -0.7028350830078125, -0.667755126953125, -0.6326751708984375, -0.59759521484375, -0.5625152587890625, -0.527435302734375, -0.4923553466796875, -0.457275390625, -0.4221954345703125, -0.387115478515625, -0.3520355224609375, -0.31695556640625, -0.2818756103515625, -0.246795654296875, -0.2117156982421875, -0.1766357421875, -0.1415557861328125, -0.106475830078125, -0.0713958740234375, -0.03631591796875, -0.0012359619140625, 0.033843994140625, 0.0689239501953125, 0.10400390625, 0.1390838623046875, 0.174163818359375, 0.2092437744140625, 0.24432373046875, 0.2794036865234375, 0.314483642578125, 0.3495635986328125, 0.3846435546875, 0.4197235107421875, 0.454803466796875, 0.4898834228515625, 0.52496337890625, 0.5600433349609375, 0.595123291015625, 0.6302032470703125, 0.665283203125, 0.7003631591796875, 0.735443115234375, 0.7705230712890625, 0.80560302734375, 0.8406829833984375, 0.875762939453125, 0.9108428955078125, 0.9459228515625, 0.9810028076171875, 1.016082763671875, 1.0511627197265625, 1.08624267578125, 1.1213226318359375, 1.156402587890625, 1.1914825439453125, 1.2265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 14.0, 16.0, 18.0, 33.0, 76.0, 110.0, 170.0, 168.0, 155.0, 103.0, 53.0, 31.0, 22.0, 6.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.83820915222168, -15.279619216918945, -14.721029281616211, -14.162439346313477, -13.603849411010742, -13.045259475708008, -12.486669540405273, -11.928079605102539, -11.369489669799805, -10.81089973449707, -10.252309799194336, -9.693719863891602, -9.135129928588867, -8.576539993286133, -8.017950057983398, -7.459360122680664, -6.90077018737793, -6.342180252075195, -5.783590316772461, -5.225000381469727, -4.666410446166992, -4.107820510864258, -3.5492305755615234, -2.990640640258789, -2.4320507049560547, -1.8734607696533203, -1.314870834350586, -0.7562808990478516, -0.1976909637451172, 0.3608989715576172, 0.9194889068603516, 1.478078842163086, 2.0366668701171875, 2.595256805419922, 3.1538467407226562, 3.7124366760253906, 4.271026611328125, 4.829616546630859, 5.388206481933594, 5.946796417236328, 6.5053863525390625, 7.063976287841797, 7.622566223144531, 8.181156158447266, 8.73974609375, 9.298336029052734, 9.856925964355469, 10.415515899658203, 10.974105834960938, 11.532695770263672, 12.091285705566406, 12.64987564086914, 13.208465576171875, 13.76705551147461, 14.325645446777344, 14.884235382080078, 15.442825317382812, 16.001415252685547, 16.56000518798828, 17.118595123291016, 17.67718505859375, 18.235774993896484, 18.79436492919922, 19.352954864501953, 19.911544799804688]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 1.0, 7.0, 13.0, 10.0, 9.0, 18.0, 19.0, 21.0, 21.0, 26.0, 22.0, 30.0, 32.0, 29.0, 35.0, 35.0, 36.0, 50.0, 47.0, 38.0, 46.0, 43.0, 38.0, 38.0, 44.0, 41.0, 32.0, 42.0, 24.0, 23.0, 22.0, 23.0, 15.0, 9.0, 13.0, 7.0, 7.0, 7.0, 3.0, 6.0, 8.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-13.540027618408203, -13.131022453308105, -12.722017288208008, -12.31301212310791, -11.904006958007812, -11.495001792907715, -11.085996627807617, -10.67699146270752, -10.267986297607422, -9.858981132507324, -9.449975967407227, -9.040970802307129, -8.631965637207031, -8.222960472106934, -7.813955307006836, -7.404950141906738, -6.995944976806641, -6.586939811706543, -6.177934646606445, -5.768929481506348, -5.35992431640625, -4.950919151306152, -4.541913986206055, -4.132908821105957, -3.7239036560058594, -3.3148984909057617, -2.905893325805664, -2.4968881607055664, -2.0878829956054688, -1.678877830505371, -1.2698726654052734, -0.8608675003051758, -0.4518613815307617, -0.04285621643066406, 0.3661489486694336, 0.7751541137695312, 1.184159278869629, 1.5931644439697266, 2.002169609069824, 2.411174774169922, 2.8201799392700195, 3.229185104370117, 3.638190269470215, 4.0471954345703125, 4.45620059967041, 4.865205764770508, 5.2742109298706055, 5.683216094970703, 6.092221260070801, 6.501226425170898, 6.910231590270996, 7.319236755371094, 7.728241920471191, 8.137247085571289, 8.546252250671387, 8.955257415771484, 9.364262580871582, 9.77326774597168, 10.182272911071777, 10.591278076171875, 11.000283241271973, 11.40928840637207, 11.818293571472168, 12.227298736572266, 12.636303901672363]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 2.0, 2.0, 8.0, 7.0, 9.0, 20.0, 26.0, 39.0, 72.0, 103.0, 203.0, 409.0, 886.0, 2600.0, 16300.0, 3387539.0, 772024.0, 11097.0, 1740.0, 617.0, 254.0, 143.0, 63.0, 43.0, 16.0, 14.0, 12.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.56640625, -7.361572265625, -7.15673828125, -6.951904296875, -6.7470703125, -6.542236328125, -6.33740234375, -6.132568359375, -5.927734375, -5.722900390625, -5.51806640625, -5.313232421875, -5.1083984375, -4.903564453125, -4.69873046875, -4.493896484375, -4.2890625, -4.084228515625, -3.87939453125, -3.674560546875, -3.4697265625, -3.264892578125, -3.06005859375, -2.855224609375, -2.650390625, -2.445556640625, -2.24072265625, -2.035888671875, -1.8310546875, -1.626220703125, -1.42138671875, -1.216552734375, -1.01171875, -0.806884765625, -0.60205078125, -0.397216796875, -0.1923828125, 0.012451171875, 0.21728515625, 0.422119140625, 0.626953125, 0.831787109375, 1.03662109375, 1.241455078125, 1.4462890625, 1.651123046875, 1.85595703125, 2.060791015625, 2.265625, 2.470458984375, 2.67529296875, 2.880126953125, 3.0849609375, 3.289794921875, 3.49462890625, 3.699462890625, 3.904296875, 4.109130859375, 4.31396484375, 4.518798828125, 4.7236328125, 4.928466796875, 5.13330078125, 5.338134765625, 5.54296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 15.0, 19.0, 44.0, 80.0, 86.0, 98.0, 127.0, 156.0, 125.0, 91.0, 71.0, 41.0, 13.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.001953125, -0.972320556640625, -0.94268798828125, -0.913055419921875, -0.8834228515625, -0.853790283203125, -0.82415771484375, -0.794525146484375, -0.764892578125, -0.735260009765625, -0.70562744140625, -0.675994873046875, -0.6463623046875, -0.616729736328125, -0.58709716796875, -0.557464599609375, -0.52783203125, -0.498199462890625, -0.46856689453125, -0.438934326171875, -0.4093017578125, -0.379669189453125, -0.35003662109375, -0.320404052734375, -0.290771484375, -0.261138916015625, -0.23150634765625, -0.201873779296875, -0.1722412109375, -0.142608642578125, -0.11297607421875, -0.083343505859375, -0.0537109375, -0.024078369140625, 0.00555419921875, 0.035186767578125, 0.0648193359375, 0.094451904296875, 0.12408447265625, 0.153717041015625, 0.183349609375, 0.212982177734375, 0.24261474609375, 0.272247314453125, 0.3018798828125, 0.331512451171875, 0.36114501953125, 0.390777587890625, 0.42041015625, 0.450042724609375, 0.47967529296875, 0.509307861328125, 0.5389404296875, 0.568572998046875, 0.59820556640625, 0.627838134765625, 0.657470703125, 0.687103271484375, 0.71673583984375, 0.746368408203125, 0.7760009765625, 0.805633544921875, 0.83526611328125, 0.864898681640625, 0.89453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 5.0, 9.0, 9.0, 13.0, 18.0, 36.0, 49.0, 59.0, 111.0, 195.0, 335.0, 875.0, 2549.0, 9995.0, 65856.0, 2864351.0, 1193775.0, 45027.0, 7425.0, 1993.0, 704.0, 360.0, 201.0, 113.0, 69.0, 43.0, 23.0, 24.0, 15.0, 14.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-4.0390625, -3.94036865234375, -3.8416748046875, -3.74298095703125, -3.644287109375, -3.54559326171875, -3.4468994140625, -3.34820556640625, -3.24951171875, -3.15081787109375, -3.0521240234375, -2.95343017578125, -2.854736328125, -2.75604248046875, -2.6573486328125, -2.55865478515625, -2.4599609375, -2.36126708984375, -2.2625732421875, -2.16387939453125, -2.065185546875, -1.96649169921875, -1.8677978515625, -1.76910400390625, -1.67041015625, -1.57171630859375, -1.4730224609375, -1.37432861328125, -1.275634765625, -1.17694091796875, -1.0782470703125, -0.97955322265625, -0.880859375, -0.78216552734375, -0.6834716796875, -0.58477783203125, -0.486083984375, -0.38739013671875, -0.2886962890625, -0.19000244140625, -0.09130859375, 0.00738525390625, 0.1060791015625, 0.20477294921875, 0.303466796875, 0.40216064453125, 0.5008544921875, 0.59954833984375, 0.6982421875, 0.79693603515625, 0.8956298828125, 0.99432373046875, 1.093017578125, 1.19171142578125, 1.2904052734375, 1.38909912109375, 1.48779296875, 1.58648681640625, 1.6851806640625, 1.78387451171875, 1.882568359375, 1.98126220703125, 2.0799560546875, 2.17864990234375, 2.27734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 10.0, 13.0, 15.0, 23.0, 28.0, 59.0, 87.0, 159.0, 320.0, 889.0, 1539.0, 457.0, 202.0, 106.0, 61.0, 35.0, 24.0, 9.0, 9.0, 10.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76318359375, -0.7379074096679688, -0.7126312255859375, -0.6873550415039062, -0.662078857421875, -0.6368026733398438, -0.6115264892578125, -0.5862503051757812, -0.56097412109375, -0.5356979370117188, -0.5104217529296875, -0.48514556884765625, -0.459869384765625, -0.43459320068359375, -0.4093170166015625, -0.38404083251953125, -0.3587646484375, -0.33348846435546875, -0.3082122802734375, -0.28293609619140625, -0.257659912109375, -0.23238372802734375, -0.2071075439453125, -0.18183135986328125, -0.15655517578125, -0.13127899169921875, -0.1060028076171875, -0.08072662353515625, -0.055450439453125, -0.03017425537109375, -0.0048980712890625, 0.02037811279296875, 0.045654296875, 0.07093048095703125, 0.0962066650390625, 0.12148284912109375, 0.146759033203125, 0.17203521728515625, 0.1973114013671875, 0.22258758544921875, 0.24786376953125, 0.27313995361328125, 0.2984161376953125, 0.32369232177734375, 0.348968505859375, 0.37424468994140625, 0.3995208740234375, 0.42479705810546875, 0.4500732421875, 0.47534942626953125, 0.5006256103515625, 0.5259017944335938, 0.551177978515625, 0.5764541625976562, 0.6017303466796875, 0.6270065307617188, 0.65228271484375, 0.6775588989257812, 0.7028350830078125, 0.7281112670898438, 0.753387451171875, 0.7786636352539062, 0.8039398193359375, 0.8292160034179688, 0.8544921875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 55.0, 302.0, 407.0, 188.0, 30.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.475329875946045, -3.1382718086242676, -2.8012137413024902, -2.464155673980713, -2.1270976066589355, -1.7900395393371582, -1.4529814720153809, -1.1159234046936035, -0.7788653373718262, -0.44180727005004883, -0.10474920272827148, 0.23230886459350586, 0.5693669319152832, 0.9064249992370605, 1.243483066558838, 1.5805411338806152, 1.9175992012023926, 2.25465726852417, 2.5917153358459473, 2.9287734031677246, 3.265831470489502, 3.6028895378112793, 3.9399476051330566, 4.277005672454834, 4.614063739776611, 4.951121807098389, 5.288179874420166, 5.625237941741943, 5.962296009063721, 6.299354076385498, 6.636412143707275, 6.973470211029053, 7.310527801513672, 7.647585868835449, 7.984643936157227, 8.321702003479004, 8.658760070800781, 8.995818138122559, 9.332876205444336, 9.669934272766113, 10.00699234008789, 10.344050407409668, 10.681108474731445, 11.018166542053223, 11.355224609375, 11.692282676696777, 12.029340744018555, 12.366398811340332, 12.70345687866211, 13.040514945983887, 13.377573013305664, 13.714631080627441, 14.051689147949219, 14.388747215270996, 14.725805282592773, 15.06286334991455, 15.399921417236328, 15.736979484558105, 16.074037551879883, 16.411094665527344, 16.748153686523438, 17.08521270751953, 17.422269821166992, 17.759326934814453, 18.096385955810547]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 10.0, 7.0, 4.0, 18.0, 15.0, 21.0, 22.0, 29.0, 44.0, 43.0, 34.0, 41.0, 44.0, 62.0, 50.0, 56.0, 51.0, 53.0, 46.0, 60.0, 46.0, 42.0, 21.0, 39.0, 33.0, 18.0, 19.0, 22.0, 9.0, 11.0, 9.0, 8.0, 1.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.707866668701172, -2.6279401779174805, -2.548013925552368, -2.4680874347686768, -2.3881611824035645, -2.308234691619873, -2.2283082008361816, -2.1483817100524902, -2.068455457687378, -1.988529086112976, -1.9086027145385742, -1.8286762237548828, -1.748749852180481, -1.668823480606079, -1.5888969898223877, -1.5089706182479858, -1.429044246673584, -1.3491178750991821, -1.2691915035247803, -1.1892650127410889, -1.109338641166687, -1.0294122695922852, -0.9494858384132385, -0.8695594072341919, -0.78963303565979, -0.7097066640853882, -0.6297802329063416, -0.5498538017272949, -0.46992743015289307, -0.3900010287761688, -0.3100746273994446, -0.23014819622039795, -0.1502220630645752, -0.07029566168785095, 0.009630739688873291, 0.08955714106559753, 0.16948354244232178, 0.24940994381904602, 0.32933634519577026, 0.4092627763748169, 0.48918914794921875, 0.5691155195236206, 0.6490419507026672, 0.7289683818817139, 0.8088947534561157, 0.8888211250305176, 0.9687475562095642, 1.0486739873886108, 1.1286003589630127, 1.2085267305374146, 1.2884531021118164, 1.3683795928955078, 1.4483059644699097, 1.5282323360443115, 1.608158826828003, 1.6880851984024048, 1.7680115699768066, 1.8479379415512085, 1.9278643131256104, 2.0077908039093018, 2.087717056274414, 2.1676435470581055, 2.247570037841797, 2.3274965286254883, 2.4074227809906006]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 11.0, 14.0, 18.0, 30.0, 39.0, 46.0, 60.0, 84.0, 123.0, 177.0, 234.0, 299.0, 472.0, 667.0, 989.0, 1630.0, 3105.0, 6546.0, 17095.0, 54392.0, 172851.0, 351328.0, 279559.0, 104950.0, 31984.0, 10866.0, 4467.0, 2293.0, 1324.0, 870.0, 565.0, 404.0, 277.0, 191.0, 147.0, 107.0, 72.0, 68.0, 41.0, 31.0, 27.0, 19.0, 17.0, 9.0, 14.0, 11.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.5830078125, -1.5315704345703125, -1.480133056640625, -1.4286956787109375, -1.37725830078125, -1.3258209228515625, -1.274383544921875, -1.2229461669921875, -1.1715087890625, -1.1200714111328125, -1.068634033203125, -1.0171966552734375, -0.96575927734375, -0.9143218994140625, -0.862884521484375, -0.8114471435546875, -0.760009765625, -0.7085723876953125, -0.657135009765625, -0.6056976318359375, -0.55426025390625, -0.5028228759765625, -0.451385498046875, -0.3999481201171875, -0.3485107421875, -0.2970733642578125, -0.245635986328125, -0.1941986083984375, -0.14276123046875, -0.0913238525390625, -0.039886474609375, 0.0115509033203125, 0.06298828125, 0.1144256591796875, 0.165863037109375, 0.2173004150390625, 0.26873779296875, 0.3201751708984375, 0.371612548828125, 0.4230499267578125, 0.4744873046875, 0.5259246826171875, 0.577362060546875, 0.6287994384765625, 0.68023681640625, 0.7316741943359375, 0.783111572265625, 0.8345489501953125, 0.885986328125, 0.9374237060546875, 0.988861083984375, 1.0402984619140625, 1.09173583984375, 1.1431732177734375, 1.194610595703125, 1.2460479736328125, 1.2974853515625, 1.3489227294921875, 1.400360107421875, 1.4517974853515625, 1.50323486328125, 1.5546722412109375, 1.606109619140625, 1.6575469970703125, 1.708984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 7.0, 5.0, 4.0, 13.0, 25.0, 41.0, 69.0, 105.0, 119.0, 130.0, 148.0, 142.0, 77.0, 63.0, 33.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0223617553710938, -0.9919891357421875, -0.9616165161132812, -0.931243896484375, -0.9008712768554688, -0.8704986572265625, -0.8401260375976562, -0.80975341796875, -0.7793807983398438, -0.7490081787109375, -0.7186355590820312, -0.688262939453125, -0.6578903198242188, -0.6275177001953125, -0.5971450805664062, -0.5667724609375, -0.5363998413085938, -0.5060272216796875, -0.47565460205078125, -0.445281982421875, -0.41490936279296875, -0.3845367431640625, -0.35416412353515625, -0.32379150390625, -0.29341888427734375, -0.2630462646484375, -0.23267364501953125, -0.202301025390625, -0.17192840576171875, -0.1415557861328125, -0.11118316650390625, -0.080810546875, -0.05043792724609375, -0.0200653076171875, 0.01030731201171875, 0.040679931640625, 0.07105255126953125, 0.1014251708984375, 0.13179779052734375, 0.16217041015625, 0.19254302978515625, 0.2229156494140625, 0.25328826904296875, 0.283660888671875, 0.31403350830078125, 0.3444061279296875, 0.37477874755859375, 0.4051513671875, 0.43552398681640625, 0.4658966064453125, 0.49626922607421875, 0.526641845703125, 0.5570144653320312, 0.5873870849609375, 0.6177597045898438, 0.64813232421875, 0.6785049438476562, 0.7088775634765625, 0.7392501831054688, 0.769622802734375, 0.7999954223632812, 0.8303680419921875, 0.8607406616210938, 0.89111328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 11.0, 12.0, 36.0, 39.0, 54.0, 103.0, 137.0, 213.0, 397.0, 718.0, 1469.0, 3886.0, 13458.0, 59709.0, 273798.0, 471625.0, 173420.0, 35510.0, 8625.0, 2757.0, 1173.0, 536.0, 292.0, 221.0, 122.0, 74.0, 56.0, 24.0, 22.0, 12.0, 10.0, 10.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.453125, -2.37725830078125, -2.3013916015625, -2.22552490234375, -2.149658203125, -2.07379150390625, -1.9979248046875, -1.92205810546875, -1.84619140625, -1.77032470703125, -1.6944580078125, -1.61859130859375, -1.542724609375, -1.46685791015625, -1.3909912109375, -1.31512451171875, -1.2392578125, -1.16339111328125, -1.0875244140625, -1.01165771484375, -0.935791015625, -0.85992431640625, -0.7840576171875, -0.70819091796875, -0.63232421875, -0.55645751953125, -0.4805908203125, -0.40472412109375, -0.328857421875, -0.25299072265625, -0.1771240234375, -0.10125732421875, -0.025390625, 0.05047607421875, 0.1263427734375, 0.20220947265625, 0.278076171875, 0.35394287109375, 0.4298095703125, 0.50567626953125, 0.58154296875, 0.65740966796875, 0.7332763671875, 0.80914306640625, 0.885009765625, 0.96087646484375, 1.0367431640625, 1.11260986328125, 1.1884765625, 1.26434326171875, 1.3402099609375, 1.41607666015625, 1.491943359375, 1.56781005859375, 1.6436767578125, 1.71954345703125, 1.79541015625, 1.87127685546875, 1.9471435546875, 2.02301025390625, 2.098876953125, 2.17474365234375, 2.2506103515625, 2.32647705078125, 2.40234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 1.0, 9.0, 4.0, 7.0, 6.0, 8.0, 11.0, 10.0, 16.0, 26.0, 26.0, 33.0, 43.0, 41.0, 63.0, 49.0, 50.0, 58.0, 59.0, 51.0, 51.0, 43.0, 55.0, 49.0, 39.0, 34.0, 23.0, 25.0, 26.0, 20.0, 13.0, 10.0, 5.0, 9.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.6484375, -2.571990966796875, -2.49554443359375, -2.419097900390625, -2.3426513671875, -2.266204833984375, -2.18975830078125, -2.113311767578125, -2.036865234375, -1.960418701171875, -1.88397216796875, -1.807525634765625, -1.7310791015625, -1.654632568359375, -1.57818603515625, -1.501739501953125, -1.42529296875, -1.348846435546875, -1.27239990234375, -1.195953369140625, -1.1195068359375, -1.043060302734375, -0.96661376953125, -0.890167236328125, -0.813720703125, -0.737274169921875, -0.66082763671875, -0.584381103515625, -0.5079345703125, -0.431488037109375, -0.35504150390625, -0.278594970703125, -0.2021484375, -0.125701904296875, -0.04925537109375, 0.027191162109375, 0.1036376953125, 0.180084228515625, 0.25653076171875, 0.332977294921875, 0.409423828125, 0.485870361328125, 0.56231689453125, 0.638763427734375, 0.7152099609375, 0.791656494140625, 0.86810302734375, 0.944549560546875, 1.02099609375, 1.097442626953125, 1.17388916015625, 1.250335693359375, 1.3267822265625, 1.403228759765625, 1.47967529296875, 1.556121826171875, 1.632568359375, 1.709014892578125, 1.78546142578125, 1.861907958984375, 1.9383544921875, 2.014801025390625, 2.09124755859375, 2.167694091796875, 2.244140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 4.0, 9.0, 8.0, 15.0, 24.0, 37.0, 42.0, 69.0, 104.0, 150.0, 256.0, 541.0, 1145.0, 3201.0, 10528.0, 51522.0, 316447.0, 524181.0, 111909.0, 19916.0, 5157.0, 1702.0, 664.0, 374.0, 207.0, 104.0, 74.0, 41.0, 39.0, 22.0, 24.0, 14.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90625, -0.8797607421875, -0.853271484375, -0.8267822265625, -0.80029296875, -0.7738037109375, -0.747314453125, -0.7208251953125, -0.6943359375, -0.6678466796875, -0.641357421875, -0.6148681640625, -0.58837890625, -0.5618896484375, -0.535400390625, -0.5089111328125, -0.482421875, -0.4559326171875, -0.429443359375, -0.4029541015625, -0.37646484375, -0.3499755859375, -0.323486328125, -0.2969970703125, -0.2705078125, -0.2440185546875, -0.217529296875, -0.1910400390625, -0.16455078125, -0.1380615234375, -0.111572265625, -0.0850830078125, -0.05859375, -0.0321044921875, -0.005615234375, 0.0208740234375, 0.04736328125, 0.0738525390625, 0.100341796875, 0.1268310546875, 0.1533203125, 0.1798095703125, 0.206298828125, 0.2327880859375, 0.25927734375, 0.2857666015625, 0.312255859375, 0.3387451171875, 0.365234375, 0.3917236328125, 0.418212890625, 0.4447021484375, 0.47119140625, 0.4976806640625, 0.524169921875, 0.5506591796875, 0.5771484375, 0.6036376953125, 0.630126953125, 0.6566162109375, 0.68310546875, 0.7095947265625, 0.736083984375, 0.7625732421875, 0.7890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 7.0, 19.0, 21.0, 25.0, 26.0, 38.0, 58.0, 50.0, 85.0, 111.0, 107.0, 86.0, 64.0, 67.0, 49.0, 30.0, 22.0, 21.0, 16.0, 15.0, 12.0, 8.0, 11.0, 6.0, 2.0, 3.0, 0.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0001666545867919922, -0.00016201846301555634, -0.00015738233923912048, -0.00015274621546268463, -0.00014811009168624878, -0.00014347396790981293, -0.00013883784413337708, -0.00013420172035694122, -0.00012956559658050537, -0.00012492947280406952, -0.00012029334902763367, -0.00011565722525119781, -0.00011102110147476196, -0.00010638497769832611, -0.00010174885392189026, -9.71127301454544e-05, -9.247660636901855e-05, -8.78404825925827e-05, -8.320435881614685e-05, -7.8568235039711e-05, -7.393211126327515e-05, -6.92959874868393e-05, -6.465986371040344e-05, -6.002373993396759e-05, -5.538761615753174e-05, -5.0751492381095886e-05, -4.6115368604660034e-05, -4.147924482822418e-05, -3.684312105178833e-05, -3.220699727535248e-05, -2.7570873498916626e-05, -2.2934749722480774e-05, -1.8298625946044922e-05, -1.366250216960907e-05, -9.026378393173218e-06, -4.390254616737366e-06, 2.4586915969848633e-07, 4.881992936134338e-06, 9.51811671257019e-06, 1.4154240489006042e-05, 1.8790364265441895e-05, 2.3426488041877747e-05, 2.80626118183136e-05, 3.269873559474945e-05, 3.73348593711853e-05, 4.1970983147621155e-05, 4.660710692405701e-05, 5.124323070049286e-05, 5.587935447692871e-05, 6.051547825336456e-05, 6.515160202980042e-05, 6.978772580623627e-05, 7.442384958267212e-05, 7.905997335910797e-05, 8.369609713554382e-05, 8.833222091197968e-05, 9.296834468841553e-05, 9.760446846485138e-05, 0.00010224059224128723, 0.00010687671601772308, 0.00011151283979415894, 0.00011614896357059479, 0.00012078508734703064, 0.0001254212111234665, 0.00013005733489990234]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 8.0, 8.0, 14.0, 19.0, 21.0, 34.0, 44.0, 64.0, 87.0, 111.0, 194.0, 313.0, 547.0, 925.0, 2002.0, 4651.0, 12851.0, 46689.0, 204470.0, 495319.0, 210323.0, 47342.0, 13283.0, 4675.0, 2063.0, 990.0, 584.0, 313.0, 202.0, 123.0, 71.0, 58.0, 35.0, 27.0, 21.0, 21.0, 11.0, 8.0, 7.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.720703125, -0.6978302001953125, -0.674957275390625, -0.6520843505859375, -0.62921142578125, -0.6063385009765625, -0.583465576171875, -0.5605926513671875, -0.5377197265625, -0.5148468017578125, -0.491973876953125, -0.4691009521484375, -0.44622802734375, -0.4233551025390625, -0.400482177734375, -0.3776092529296875, -0.354736328125, -0.3318634033203125, -0.308990478515625, -0.2861175537109375, -0.26324462890625, -0.2403717041015625, -0.217498779296875, -0.1946258544921875, -0.1717529296875, -0.1488800048828125, -0.126007080078125, -0.1031341552734375, -0.08026123046875, -0.0573883056640625, -0.034515380859375, -0.0116424560546875, 0.01123046875, 0.0341033935546875, 0.056976318359375, 0.0798492431640625, 0.10272216796875, 0.1255950927734375, 0.148468017578125, 0.1713409423828125, 0.1942138671875, 0.2170867919921875, 0.239959716796875, 0.2628326416015625, 0.28570556640625, 0.3085784912109375, 0.331451416015625, 0.3543243408203125, 0.377197265625, 0.4000701904296875, 0.422943115234375, 0.4458160400390625, 0.46868896484375, 0.4915618896484375, 0.514434814453125, 0.5373077392578125, 0.5601806640625, 0.5830535888671875, 0.605926513671875, 0.6287994384765625, 0.65167236328125, 0.6745452880859375, 0.697418212890625, 0.7202911376953125, 0.7431640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 6.0, 9.0, 14.0, 23.0, 34.0, 61.0, 79.0, 125.0, 114.0, 104.0, 115.0, 102.0, 72.0, 37.0, 36.0, 22.0, 8.0, 7.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0220794677734375, -0.989471435546875, -0.9568634033203125, -0.92425537109375, -0.8916473388671875, -0.859039306640625, -0.8264312744140625, -0.7938232421875, -0.7612152099609375, -0.728607177734375, -0.6959991455078125, -0.66339111328125, -0.6307830810546875, -0.598175048828125, -0.5655670166015625, -0.532958984375, -0.5003509521484375, -0.467742919921875, -0.4351348876953125, -0.40252685546875, -0.3699188232421875, -0.337310791015625, -0.3047027587890625, -0.2720947265625, -0.2394866943359375, -0.206878662109375, -0.1742706298828125, -0.14166259765625, -0.1090545654296875, -0.076446533203125, -0.0438385009765625, -0.01123046875, 0.0213775634765625, 0.053985595703125, 0.0865936279296875, 0.11920166015625, 0.1518096923828125, 0.184417724609375, 0.2170257568359375, 0.2496337890625, 0.2822418212890625, 0.314849853515625, 0.3474578857421875, 0.38006591796875, 0.4126739501953125, 0.445281982421875, 0.4778900146484375, 0.510498046875, 0.5431060791015625, 0.575714111328125, 0.6083221435546875, 0.64093017578125, 0.6735382080078125, 0.706146240234375, 0.7387542724609375, 0.7713623046875, 0.8039703369140625, 0.836578369140625, 0.8691864013671875, 0.90179443359375, 0.9344024658203125, 0.967010498046875, 0.9996185302734375, 1.0322265625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 16.0, 31.0, 53.0, 91.0, 149.0, 186.0, 178.0, 131.0, 88.0, 37.0, 6.0, 13.0, 9.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.739856719970703, -14.190048217773438, -13.640240669250488, -13.090432167053223, -12.540623664855957, -11.990816116333008, -11.441007614135742, -10.891199111938477, -10.341390609741211, -9.791582107543945, -9.241774559020996, -8.69196605682373, -8.142157554626465, -7.592349529266357, -7.04254150390625, -6.492733001708984, -5.942925453186035, -5.393117427825928, -4.843308925628662, -4.293500900268555, -3.743692636489868, -3.1938843727111816, -2.644076347351074, -2.0942680835723877, -1.5444598197937012, -0.9946516156196594, -0.4448434114456177, 0.1049647331237793, 0.6547729969024658, 1.2045812606811523, 1.7543892860412598, 2.3041975498199463, 2.854005813598633, 3.4038140773773193, 3.953622341156006, 4.503430366516113, 5.053238868713379, 5.603046894073486, 6.152854919433594, 6.702663421630859, 7.252471446990967, 7.802279472351074, 8.35208797454834, 8.901895523071289, 9.451704025268555, 10.00151252746582, 10.551321029663086, 11.101128578186035, 11.6509370803833, 12.200745582580566, 12.750553131103516, 13.300361633300781, 13.850170135498047, 14.399978637695312, 14.949786186218262, 15.499594688415527, 16.049402236938477, 16.599210739135742, 17.149019241333008, 17.69882583618164, 18.248634338378906, 18.798442840576172, 19.348251342773438, 19.898059844970703, 20.44786834716797]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 12.0, 13.0, 18.0, 19.0, 29.0, 25.0, 20.0, 44.0, 48.0, 53.0, 45.0, 66.0, 58.0, 51.0, 54.0, 44.0, 52.0, 45.0, 39.0, 40.0, 47.0, 29.0, 38.0, 23.0, 21.0, 18.0, 15.0, 10.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8074951171875, -16.326919555664062, -15.846343040466309, -15.365766525268555, -14.885190963745117, -14.40461540222168, -13.924038887023926, -13.443462371826172, -12.962886810302734, -12.482311248779297, -12.001734733581543, -11.521158218383789, -11.040582656860352, -10.560007095336914, -10.07943058013916, -9.598854064941406, -9.118278503417969, -8.637702941894531, -8.157126426696777, -7.676550388336182, -7.195974349975586, -6.71539831161499, -6.2348222732543945, -5.754246234893799, -5.273670196533203, -4.793094158172607, -4.312518119812012, -3.831942081451416, -3.3513660430908203, -2.8707900047302246, -2.390213966369629, -1.9096379280090332, -1.429062843322754, -0.9484868049621582, -0.4679107666015625, 0.012665271759033203, 0.4932413101196289, 0.9738173484802246, 1.4543933868408203, 1.934969425201416, 2.4155454635620117, 2.8961215019226074, 3.376697540283203, 3.857273578643799, 4.3378496170043945, 4.81842565536499, 5.299001693725586, 5.779577732086182, 6.260153770446777, 6.740729808807373, 7.221305847167969, 7.7018818855285645, 8.18245792388916, 8.663034439086914, 9.143610000610352, 9.624185562133789, 10.104762077331543, 10.585338592529297, 11.065914154052734, 11.546489715576172, 12.027066230773926, 12.50764274597168, 12.988218307495117, 13.468793869018555, 13.949370384216309]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 6.0, 6.0, 23.0, 25.0, 49.0, 79.0, 130.0, 231.0, 516.0, 1416.0, 5986.0, 51478.0, 4016076.0, 107683.0, 8087.0, 1591.0, 460.0, 208.0, 93.0, 57.0, 34.0, 15.0, 10.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0816650390625, -3.960205078125, -3.8387451171875, -3.71728515625, -3.5958251953125, -3.474365234375, -3.3529052734375, -3.2314453125, -3.1099853515625, -2.988525390625, -2.8670654296875, -2.74560546875, -2.6241455078125, -2.502685546875, -2.3812255859375, -2.259765625, -2.1383056640625, -2.016845703125, -1.8953857421875, -1.77392578125, -1.6524658203125, -1.531005859375, -1.4095458984375, -1.2880859375, -1.1666259765625, -1.045166015625, -0.9237060546875, -0.80224609375, -0.6807861328125, -0.559326171875, -0.4378662109375, -0.31640625, -0.1949462890625, -0.073486328125, 0.0479736328125, 0.16943359375, 0.2908935546875, 0.412353515625, 0.5338134765625, 0.6552734375, 0.7767333984375, 0.898193359375, 1.0196533203125, 1.14111328125, 1.2625732421875, 1.384033203125, 1.5054931640625, 1.626953125, 1.7484130859375, 1.869873046875, 1.9913330078125, 2.11279296875, 2.2342529296875, 2.355712890625, 2.4771728515625, 2.5986328125, 2.7200927734375, 2.841552734375, 2.9630126953125, 3.08447265625, 3.2059326171875, 3.327392578125, 3.4488525390625, 3.5703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 8.0, 12.0, 16.0, 21.0, 54.0, 61.0, 81.0, 101.0, 101.0, 106.0, 100.0, 100.0, 86.0, 65.0, 38.0, 22.0, 9.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8783340454101562, -0.8518829345703125, -0.8254318237304688, -0.798980712890625, -0.7725296020507812, -0.7460784912109375, -0.7196273803710938, -0.69317626953125, -0.6667251586914062, -0.6402740478515625, -0.6138229370117188, -0.587371826171875, -0.5609207153320312, -0.5344696044921875, -0.5080184936523438, -0.4815673828125, -0.45511627197265625, -0.4286651611328125, -0.40221405029296875, -0.375762939453125, -0.34931182861328125, -0.3228607177734375, -0.29640960693359375, -0.26995849609375, -0.24350738525390625, -0.2170562744140625, -0.19060516357421875, -0.164154052734375, -0.13770294189453125, -0.1112518310546875, -0.08480072021484375, -0.058349609375, -0.03189849853515625, -0.0054473876953125, 0.02100372314453125, 0.047454833984375, 0.07390594482421875, 0.1003570556640625, 0.12680816650390625, 0.15325927734375, 0.17971038818359375, 0.2061614990234375, 0.23261260986328125, 0.259063720703125, 0.28551483154296875, 0.3119659423828125, 0.33841705322265625, 0.3648681640625, 0.39131927490234375, 0.4177703857421875, 0.44422149658203125, 0.470672607421875, 0.49712371826171875, 0.5235748291015625, 0.5500259399414062, 0.57647705078125, 0.6029281616210938, 0.6293792724609375, 0.6558303833007812, 0.682281494140625, 0.7087326049804688, 0.7351837158203125, 0.7616348266601562, 0.7880859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 8.0, 18.0, 26.0, 43.0, 79.0, 106.0, 194.0, 317.0, 537.0, 1186.0, 3374.0, 14301.0, 115202.0, 3660704.0, 362776.0, 26519.0, 5414.0, 1695.0, 741.0, 382.0, 244.0, 145.0, 76.0, 64.0, 34.0, 24.0, 21.0, 12.0, 6.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.306640625, -2.236053466796875, -2.16546630859375, -2.094879150390625, -2.0242919921875, -1.953704833984375, -1.88311767578125, -1.812530517578125, -1.741943359375, -1.671356201171875, -1.60076904296875, -1.530181884765625, -1.4595947265625, -1.389007568359375, -1.31842041015625, -1.247833251953125, -1.17724609375, -1.106658935546875, -1.03607177734375, -0.965484619140625, -0.8948974609375, -0.824310302734375, -0.75372314453125, -0.683135986328125, -0.612548828125, -0.541961669921875, -0.47137451171875, -0.400787353515625, -0.3302001953125, -0.259613037109375, -0.18902587890625, -0.118438720703125, -0.0478515625, 0.022735595703125, 0.09332275390625, 0.163909912109375, 0.2344970703125, 0.305084228515625, 0.37567138671875, 0.446258544921875, 0.516845703125, 0.587432861328125, 0.65802001953125, 0.728607177734375, 0.7991943359375, 0.869781494140625, 0.94036865234375, 1.010955810546875, 1.08154296875, 1.152130126953125, 1.22271728515625, 1.293304443359375, 1.3638916015625, 1.434478759765625, 1.50506591796875, 1.575653076171875, 1.646240234375, 1.716827392578125, 1.78741455078125, 1.858001708984375, 1.9285888671875, 1.999176025390625, 2.06976318359375, 2.140350341796875, 2.2109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 7.0, 9.0, 10.0, 21.0, 33.0, 57.0, 77.0, 146.0, 379.0, 1150.0, 1376.0, 414.0, 168.0, 80.0, 49.0, 24.0, 19.0, 16.0, 13.0, 8.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.5184326171875, -0.499267578125, -0.4801025390625, -0.4609375, -0.4417724609375, -0.422607421875, -0.4034423828125, -0.38427734375, -0.3651123046875, -0.345947265625, -0.3267822265625, -0.3076171875, -0.2884521484375, -0.269287109375, -0.2501220703125, -0.23095703125, -0.2117919921875, -0.192626953125, -0.1734619140625, -0.154296875, -0.1351318359375, -0.115966796875, -0.0968017578125, -0.07763671875, -0.0584716796875, -0.039306640625, -0.0201416015625, -0.0009765625, 0.0181884765625, 0.037353515625, 0.0565185546875, 0.07568359375, 0.0948486328125, 0.114013671875, 0.1331787109375, 0.15234375, 0.1715087890625, 0.190673828125, 0.2098388671875, 0.22900390625, 0.2481689453125, 0.267333984375, 0.2864990234375, 0.3056640625, 0.3248291015625, 0.343994140625, 0.3631591796875, 0.38232421875, 0.4014892578125, 0.420654296875, 0.4398193359375, 0.458984375, 0.4781494140625, 0.497314453125, 0.5164794921875, 0.53564453125, 0.5548095703125, 0.573974609375, 0.5931396484375, 0.6123046875, 0.6314697265625, 0.650634765625, 0.6697998046875, 0.68896484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 10.0, 14.0, 38.0, 89.0, 198.0, 277.0, 192.0, 125.0, 48.0, 17.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2038841247558594, -3.039778709411621, -2.8756730556488037, -2.7115676403045654, -2.547462224960327, -2.3833565711975098, -2.2192511558532715, -2.055145740509033, -1.8910402059555054, -1.7269346714019775, -1.5628292560577393, -1.3987237215042114, -1.2346181869506836, -1.0705127716064453, -0.9064072370529175, -0.7423018217086792, -0.5781962871551514, -0.4140908122062683, -0.24998530745506287, -0.08587980270385742, 0.07822567224502563, 0.2423311471939087, 0.4064366817474365, 0.5705420970916748, 0.7346476316452026, 0.8987531065940857, 1.0628585815429688, 1.2269641160964966, 1.3910696506500244, 1.5551750659942627, 1.7192806005477905, 1.8833860158920288, 2.0474915504455566, 2.211596965789795, 2.3757026195526123, 2.5398080348968506, 2.703913450241089, 2.8680191040039062, 3.0321245193481445, 3.196229934692383, 3.360335350036621, 3.5244407653808594, 3.6885464191436768, 3.852651834487915, 4.016757488250732, 4.180862903594971, 4.344968318939209, 4.509073734283447, 4.673179626464844, 4.837285041809082, 5.00139045715332, 5.165495872497559, 5.329601764678955, 5.493707180023193, 5.657812595367432, 5.82191801071167, 5.986023426055908, 6.1501288414001465, 6.314234256744385, 6.478340148925781, 6.6424455642700195, 6.806550979614258, 6.970656394958496, 7.134761810302734, 7.298867225646973]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 6.0, 5.0, 11.0, 14.0, 12.0, 9.0, 24.0, 16.0, 17.0, 25.0, 28.0, 33.0, 34.0, 36.0, 30.0, 45.0, 35.0, 28.0, 35.0, 44.0, 46.0, 31.0, 32.0, 33.0, 32.0, 38.0, 31.0, 35.0, 35.0, 26.0, 24.0, 18.0, 20.0, 19.0, 19.0, 11.0, 17.0, 12.0, 6.0, 3.0, 9.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4982706308364868, -1.4535040855407715, -1.4087375402450562, -1.3639709949493408, -1.3192044496536255, -1.2744379043579102, -1.2296714782714844, -1.1849048137664795, -1.1401383876800537, -1.0953718423843384, -1.050605297088623, -1.0058387517929077, -0.9610722064971924, -0.916305661201477, -0.8715391755104065, -0.8267726302146912, -0.782006025314331, -0.7372394800186157, -0.6924729347229004, -0.6477063894271851, -0.6029398441314697, -0.5581732988357544, -0.5134068131446838, -0.4686402678489685, -0.4238737225532532, -0.37910717725753784, -0.3343406319618225, -0.28957411646842957, -0.24480757117271423, -0.2000410258769989, -0.15527451038360596, -0.11050796508789062, -0.06574130058288574, -0.020974762737751007, 0.023791775107383728, 0.06855830550193787, 0.1133248507976532, 0.15809139609336853, 0.20285791158676147, 0.2476244568824768, 0.29239100217819214, 0.33715754747390747, 0.3819240927696228, 0.42669060826301575, 0.4714571535587311, 0.516223669052124, 0.5609902143478394, 0.6057567596435547, 0.65052330493927, 0.6952898502349854, 0.7400563955307007, 0.784822940826416, 0.8295894861221313, 0.8743560314178467, 0.9191225171089172, 0.9638890624046326, 1.0086555480957031, 1.0534220933914185, 1.0981886386871338, 1.1429551839828491, 1.1877217292785645, 1.2324882745742798, 1.2772548198699951, 1.322021245956421, 1.3667879104614258]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 14.0, 8.0, 20.0, 31.0, 60.0, 94.0, 130.0, 193.0, 305.0, 483.0, 869.0, 1542.0, 3223.0, 8184.0, 27075.0, 108077.0, 340280.0, 374844.0, 132868.0, 33154.0, 9506.0, 3503.0, 1768.0, 922.0, 545.0, 286.0, 198.0, 111.0, 86.0, 59.0, 44.0, 28.0, 10.0, 8.0, 6.0, 6.0, 1.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9560546875, -1.89691162109375, -1.8377685546875, -1.77862548828125, -1.719482421875, -1.66033935546875, -1.6011962890625, -1.54205322265625, -1.48291015625, -1.42376708984375, -1.3646240234375, -1.30548095703125, -1.246337890625, -1.18719482421875, -1.1280517578125, -1.06890869140625, -1.009765625, -0.95062255859375, -0.8914794921875, -0.83233642578125, -0.773193359375, -0.71405029296875, -0.6549072265625, -0.59576416015625, -0.53662109375, -0.47747802734375, -0.4183349609375, -0.35919189453125, -0.300048828125, -0.24090576171875, -0.1817626953125, -0.12261962890625, -0.0634765625, -0.00433349609375, 0.0548095703125, 0.11395263671875, 0.173095703125, 0.23223876953125, 0.2913818359375, 0.35052490234375, 0.40966796875, 0.46881103515625, 0.5279541015625, 0.58709716796875, 0.646240234375, 0.70538330078125, 0.7645263671875, 0.82366943359375, 0.8828125, 0.94195556640625, 1.0010986328125, 1.06024169921875, 1.119384765625, 1.17852783203125, 1.2376708984375, 1.29681396484375, 1.35595703125, 1.41510009765625, 1.4742431640625, 1.53338623046875, 1.592529296875, 1.65167236328125, 1.7108154296875, 1.76995849609375, 1.8291015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 17.0, 19.0, 27.0, 59.0, 74.0, 85.0, 98.0, 101.0, 101.0, 97.0, 83.0, 88.0, 52.0, 34.0, 19.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.8537063598632812, -0.8285064697265625, -0.8033065795898438, -0.778106689453125, -0.7529067993164062, -0.7277069091796875, -0.7025070190429688, -0.67730712890625, -0.6521072387695312, -0.6269073486328125, -0.6017074584960938, -0.576507568359375, -0.5513076782226562, -0.5261077880859375, -0.5009078979492188, -0.4757080078125, -0.45050811767578125, -0.4253082275390625, -0.40010833740234375, -0.374908447265625, -0.34970855712890625, -0.3245086669921875, -0.29930877685546875, -0.27410888671875, -0.24890899658203125, -0.2237091064453125, -0.19850921630859375, -0.173309326171875, -0.14810943603515625, -0.1229095458984375, -0.09770965576171875, -0.072509765625, -0.04730987548828125, -0.0221099853515625, 0.00308990478515625, 0.028289794921875, 0.05348968505859375, 0.0786895751953125, 0.10388946533203125, 0.12908935546875, 0.15428924560546875, 0.1794891357421875, 0.20468902587890625, 0.229888916015625, 0.25508880615234375, 0.2802886962890625, 0.30548858642578125, 0.3306884765625, 0.35588836669921875, 0.3810882568359375, 0.40628814697265625, 0.431488037109375, 0.45668792724609375, 0.4818878173828125, 0.5070877075195312, 0.53228759765625, 0.5574874877929688, 0.5826873779296875, 0.6078872680664062, 0.633087158203125, 0.6582870483398438, 0.6834869384765625, 0.7086868286132812, 0.73388671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 4.0, 13.0, 20.0, 32.0, 39.0, 54.0, 88.0, 143.0, 199.0, 277.0, 464.0, 808.0, 1561.0, 4016.0, 13871.0, 60890.0, 253855.0, 448853.0, 200580.0, 45255.0, 10682.0, 3418.0, 1402.0, 742.0, 420.0, 294.0, 166.0, 140.0, 88.0, 62.0, 36.0, 34.0, 10.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.013671875, -1.949554443359375, -1.88543701171875, -1.821319580078125, -1.7572021484375, -1.693084716796875, -1.62896728515625, -1.564849853515625, -1.500732421875, -1.436614990234375, -1.37249755859375, -1.308380126953125, -1.2442626953125, -1.180145263671875, -1.11602783203125, -1.051910400390625, -0.98779296875, -0.923675537109375, -0.85955810546875, -0.795440673828125, -0.7313232421875, -0.667205810546875, -0.60308837890625, -0.538970947265625, -0.474853515625, -0.410736083984375, -0.34661865234375, -0.282501220703125, -0.2183837890625, -0.154266357421875, -0.09014892578125, -0.026031494140625, 0.0380859375, 0.102203369140625, 0.16632080078125, 0.230438232421875, 0.2945556640625, 0.358673095703125, 0.42279052734375, 0.486907958984375, 0.551025390625, 0.615142822265625, 0.67926025390625, 0.743377685546875, 0.8074951171875, 0.871612548828125, 0.93572998046875, 0.999847412109375, 1.06396484375, 1.128082275390625, 1.19219970703125, 1.256317138671875, 1.3204345703125, 1.384552001953125, 1.44866943359375, 1.512786865234375, 1.576904296875, 1.641021728515625, 1.70513916015625, 1.769256591796875, 1.8333740234375, 1.897491455078125, 1.96160888671875, 2.025726318359375, 2.08984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 8.0, 7.0, 12.0, 10.0, 10.0, 20.0, 23.0, 30.0, 38.0, 32.0, 35.0, 36.0, 39.0, 41.0, 46.0, 46.0, 45.0, 55.0, 46.0, 38.0, 55.0, 46.0, 42.0, 28.0, 36.0, 29.0, 20.0, 19.0, 16.0, 14.0, 12.0, 15.0, 16.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.9853515625, -1.9228668212890625, -1.860382080078125, -1.7978973388671875, -1.73541259765625, -1.6729278564453125, -1.610443115234375, -1.5479583740234375, -1.4854736328125, -1.4229888916015625, -1.360504150390625, -1.2980194091796875, -1.23553466796875, -1.1730499267578125, -1.110565185546875, -1.0480804443359375, -0.985595703125, -0.9231109619140625, -0.860626220703125, -0.7981414794921875, -0.73565673828125, -0.6731719970703125, -0.610687255859375, -0.5482025146484375, -0.4857177734375, -0.4232330322265625, -0.360748291015625, -0.2982635498046875, -0.23577880859375, -0.1732940673828125, -0.110809326171875, -0.0483245849609375, 0.01416015625, 0.0766448974609375, 0.139129638671875, 0.2016143798828125, 0.26409912109375, 0.3265838623046875, 0.389068603515625, 0.4515533447265625, 0.5140380859375, 0.5765228271484375, 0.639007568359375, 0.7014923095703125, 0.76397705078125, 0.8264617919921875, 0.888946533203125, 0.9514312744140625, 1.013916015625, 1.0764007568359375, 1.138885498046875, 1.2013702392578125, 1.26385498046875, 1.3263397216796875, 1.388824462890625, 1.4513092041015625, 1.5137939453125, 1.5762786865234375, 1.638763427734375, 1.7012481689453125, 1.76373291015625, 1.8262176513671875, 1.888702392578125, 1.9511871337890625, 2.013671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 7.0, 9.0, 16.0, 21.0, 39.0, 61.0, 90.0, 168.0, 353.0, 759.0, 1868.0, 5959.0, 28721.0, 194935.0, 605035.0, 175690.0, 26111.0, 5546.0, 1796.0, 673.0, 299.0, 149.0, 91.0, 59.0, 43.0, 19.0, 10.0, 10.0, 12.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54931640625, -0.5268707275390625, -0.504425048828125, -0.4819793701171875, -0.45953369140625, -0.4370880126953125, -0.414642333984375, -0.3921966552734375, -0.3697509765625, -0.3473052978515625, -0.324859619140625, -0.3024139404296875, -0.27996826171875, -0.2575225830078125, -0.235076904296875, -0.2126312255859375, -0.190185546875, -0.1677398681640625, -0.145294189453125, -0.1228485107421875, -0.10040283203125, -0.0779571533203125, -0.055511474609375, -0.0330657958984375, -0.0106201171875, 0.0118255615234375, 0.034271240234375, 0.0567169189453125, 0.07916259765625, 0.1016082763671875, 0.124053955078125, 0.1464996337890625, 0.1689453125, 0.1913909912109375, 0.213836669921875, 0.2362823486328125, 0.25872802734375, 0.2811737060546875, 0.303619384765625, 0.3260650634765625, 0.3485107421875, 0.3709564208984375, 0.393402099609375, 0.4158477783203125, 0.43829345703125, 0.4607391357421875, 0.483184814453125, 0.5056304931640625, 0.528076171875, 0.5505218505859375, 0.572967529296875, 0.5954132080078125, 0.61785888671875, 0.6403045654296875, 0.662750244140625, 0.6851959228515625, 0.7076416015625, 0.7300872802734375, 0.752532958984375, 0.7749786376953125, 0.79742431640625, 0.8198699951171875, 0.842315673828125, 0.8647613525390625, 0.88720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 13.0, 6.0, 12.0, 19.0, 19.0, 17.0, 29.0, 43.0, 45.0, 61.0, 69.0, 82.0, 110.0, 77.0, 56.0, 65.0, 42.0, 30.0, 31.0, 26.0, 17.0, 22.0, 15.0, 5.0, 12.0, 9.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0001430511474609375, -0.0001390017569065094, -0.0001349523663520813, -0.0001309029757976532, -0.0001268535852432251, -0.000122804194688797, -0.0001187548041343689, -0.0001147054135799408, -0.0001106560230255127, -0.0001066066324710846, -0.0001025572419166565, -9.85078513622284e-05, -9.445846080780029e-05, -9.040907025337219e-05, -8.635967969894409e-05, -8.231028914451599e-05, -7.826089859008789e-05, -7.421150803565979e-05, -7.016211748123169e-05, -6.611272692680359e-05, -6.206333637237549e-05, -5.801394581794739e-05, -5.396455526351929e-05, -4.9915164709091187e-05, -4.5865774154663086e-05, -4.1816383600234985e-05, -3.7766993045806885e-05, -3.3717602491378784e-05, -2.9668211936950684e-05, -2.5618821382522583e-05, -2.1569430828094482e-05, -1.7520040273666382e-05, -1.3470649719238281e-05, -9.42125916481018e-06, -5.37186861038208e-06, -1.3224780559539795e-06, 2.726912498474121e-06, 6.776303052902222e-06, 1.0825693607330322e-05, 1.4875084161758423e-05, 1.8924474716186523e-05, 2.2973865270614624e-05, 2.7023255825042725e-05, 3.1072646379470825e-05, 3.5122036933898926e-05, 3.9171427488327026e-05, 4.322081804275513e-05, 4.727020859718323e-05, 5.131959915161133e-05, 5.536898970603943e-05, 5.941838026046753e-05, 6.346777081489563e-05, 6.751716136932373e-05, 7.156655192375183e-05, 7.561594247817993e-05, 7.966533303260803e-05, 8.371472358703613e-05, 8.776411414146423e-05, 9.181350469589233e-05, 9.586289525032043e-05, 9.991228580474854e-05, 0.00010396167635917664, 0.00010801106691360474, 0.00011206045746803284, 0.00011610984802246094]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 10.0, 23.0, 31.0, 38.0, 53.0, 85.0, 121.0, 219.0, 368.0, 744.0, 1668.0, 4714.0, 17907.0, 94684.0, 496949.0, 354172.0, 58447.0, 12047.0, 3526.0, 1277.0, 623.0, 332.0, 211.0, 99.0, 67.0, 46.0, 22.0, 26.0, 12.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5517578125, -0.530426025390625, -0.50909423828125, -0.487762451171875, -0.4664306640625, -0.445098876953125, -0.42376708984375, -0.402435302734375, -0.381103515625, -0.359771728515625, -0.33843994140625, -0.317108154296875, -0.2957763671875, -0.274444580078125, -0.25311279296875, -0.231781005859375, -0.21044921875, -0.189117431640625, -0.16778564453125, -0.146453857421875, -0.1251220703125, -0.103790283203125, -0.08245849609375, -0.061126708984375, -0.039794921875, -0.018463134765625, 0.00286865234375, 0.024200439453125, 0.0455322265625, 0.066864013671875, 0.08819580078125, 0.109527587890625, 0.130859375, 0.152191162109375, 0.17352294921875, 0.194854736328125, 0.2161865234375, 0.237518310546875, 0.25885009765625, 0.280181884765625, 0.301513671875, 0.322845458984375, 0.34417724609375, 0.365509033203125, 0.3868408203125, 0.408172607421875, 0.42950439453125, 0.450836181640625, 0.47216796875, 0.493499755859375, 0.51483154296875, 0.536163330078125, 0.5574951171875, 0.578826904296875, 0.60015869140625, 0.621490478515625, 0.642822265625, 0.664154052734375, 0.68548583984375, 0.706817626953125, 0.7281494140625, 0.749481201171875, 0.77081298828125, 0.792144775390625, 0.8134765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 11.0, 17.0, 18.0, 13.0, 26.0, 36.0, 41.0, 52.0, 61.0, 55.0, 60.0, 78.0, 53.0, 67.0, 63.0, 63.0, 46.0, 42.0, 34.0, 34.0, 21.0, 16.0, 11.0, 14.0, 5.0, 10.0, 7.0, 5.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.419189453125, -0.4047966003417969, -0.39040374755859375, -0.3760108947753906, -0.3616180419921875, -0.3472251892089844, -0.33283233642578125, -0.3184394836425781, -0.304046630859375, -0.2896537780761719, -0.27526092529296875, -0.2608680725097656, -0.2464752197265625, -0.23208236694335938, -0.21768951416015625, -0.20329666137695312, -0.18890380859375, -0.17451095581054688, -0.16011810302734375, -0.14572525024414062, -0.1313323974609375, -0.11693954467773438, -0.10254669189453125, -0.08815383911132812, -0.073760986328125, -0.059368133544921875, -0.04497528076171875, -0.030582427978515625, -0.0161895751953125, -0.001796722412109375, 0.01259613037109375, 0.026988983154296875, 0.0413818359375, 0.055774688720703125, 0.07016754150390625, 0.08456039428710938, 0.0989532470703125, 0.11334609985351562, 0.12773895263671875, 0.14213180541992188, 0.156524658203125, 0.17091751098632812, 0.18531036376953125, 0.19970321655273438, 0.2140960693359375, 0.22848892211914062, 0.24288177490234375, 0.2572746276855469, 0.27166748046875, 0.2860603332519531, 0.30045318603515625, 0.3148460388183594, 0.3292388916015625, 0.3436317443847656, 0.35802459716796875, 0.3724174499511719, 0.386810302734375, 0.4012031555175781, 0.41559600830078125, 0.4299888610839844, 0.4443817138671875, 0.4587745666503906, 0.47316741943359375, 0.4875602722167969, 0.501953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 6.0, 3.0, 6.0, 24.0, 41.0, 56.0, 96.0, 158.0, 175.0, 163.0, 128.0, 63.0, 38.0, 19.0, 10.0, 7.0, 6.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.49753189086914, -23.99467658996582, -23.491823196411133, -22.988967895507812, -22.486114501953125, -21.983259201049805, -21.480405807495117, -20.977550506591797, -20.47469711303711, -19.97184181213379, -19.4689884185791, -18.96613311767578, -18.463279724121094, -17.960424423217773, -17.457571029663086, -16.954715728759766, -16.451862335205078, -15.949007987976074, -15.44615364074707, -14.943299293518066, -14.440444946289062, -13.937590599060059, -13.434736251831055, -12.931880950927734, -12.429025650024414, -11.92617130279541, -11.423316955566406, -10.920462608337402, -10.417608261108398, -9.914753913879395, -9.41189956665039, -8.90904426574707, -8.4061918258667, -7.903337478637695, -7.400483131408691, -6.8976287841796875, -6.394774436950684, -5.89192008972168, -5.389065265655518, -4.886210918426514, -4.38335657119751, -3.880502223968506, -3.377647876739502, -2.874793291091919, -2.371938943862915, -1.8690845966339111, -1.3662300109863281, -0.8633756637573242, -0.3605213165283203, 0.14233309030532837, 0.645187497138977, 1.1480419635772705, 1.6508963108062744, 2.1537506580352783, 2.6566052436828613, 3.1594595909118652, 3.662313938140869, 4.165168285369873, 4.668022632598877, 5.170877456665039, 5.673731803894043, 6.176586151123047, 6.679440498352051, 7.182294845581055, 7.685149192810059]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 6.0, 11.0, 13.0, 11.0, 10.0, 22.0, 19.0, 17.0, 26.0, 23.0, 48.0, 52.0, 45.0, 55.0, 50.0, 53.0, 52.0, 63.0, 54.0, 58.0, 51.0, 37.0, 47.0, 38.0, 41.0, 30.0, 12.0, 18.0, 16.0, 5.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.735824584960938, -18.293418884277344, -17.85101318359375, -17.408605575561523, -16.96619987487793, -16.523794174194336, -16.08138656616211, -15.638980865478516, -15.196575164794922, -14.754169464111328, -14.311762809753418, -13.869356155395508, -13.426950454711914, -12.98454475402832, -12.54213809967041, -12.0997314453125, -11.657325744628906, -11.214920043945312, -10.772513389587402, -10.330106735229492, -9.887701034545898, -9.445295333862305, -9.002888679504395, -8.560482025146484, -8.11807632446289, -7.675670146942139, -7.233263969421387, -6.790857791900635, -6.348451614379883, -5.906045436859131, -5.463639259338379, -5.021233081817627, -4.578826904296875, -4.136420726776123, -3.694014549255371, -3.251608371734619, -2.809202194213867, -2.3667960166931152, -1.9243898391723633, -1.4819836616516113, -1.0395774841308594, -0.5971713066101074, -0.15476512908935547, 0.2876410484313965, 0.7300472259521484, 1.1724534034729004, 1.6148595809936523, 2.0572657585144043, 2.4996719360351562, 2.942078113555908, 3.38448429107666, 3.826890468597412, 4.269296646118164, 4.711702823638916, 5.154109001159668, 5.59651517868042, 6.038921356201172, 6.481327533721924, 6.923733711242676, 7.366139888763428, 7.80854606628418, 8.250951766967773, 8.693358421325684, 9.135765075683594, 9.578170776367188]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 15.0, 7.0, 13.0, 17.0, 21.0, 37.0, 29.0, 74.0, 88.0, 167.0, 328.0, 571.0, 1126.0, 2643.0, 9099.0, 63691.0, 3744410.0, 344823.0, 20281.0, 4067.0, 1389.0, 629.0, 328.0, 178.0, 92.0, 57.0, 38.0, 13.0, 8.0, 6.0, 6.0, 0.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.5234375, -3.42755126953125, -3.3316650390625, -3.23577880859375, -3.139892578125, -3.04400634765625, -2.9481201171875, -2.85223388671875, -2.75634765625, -2.66046142578125, -2.5645751953125, -2.46868896484375, -2.372802734375, -2.27691650390625, -2.1810302734375, -2.08514404296875, -1.9892578125, -1.89337158203125, -1.7974853515625, -1.70159912109375, -1.605712890625, -1.50982666015625, -1.4139404296875, -1.31805419921875, -1.22216796875, -1.12628173828125, -1.0303955078125, -0.93450927734375, -0.838623046875, -0.74273681640625, -0.6468505859375, -0.55096435546875, -0.455078125, -0.35919189453125, -0.2633056640625, -0.16741943359375, -0.071533203125, 0.02435302734375, 0.1202392578125, 0.21612548828125, 0.31201171875, 0.40789794921875, 0.5037841796875, 0.59967041015625, 0.695556640625, 0.79144287109375, 0.8873291015625, 0.98321533203125, 1.0791015625, 1.17498779296875, 1.2708740234375, 1.36676025390625, 1.462646484375, 1.55853271484375, 1.6544189453125, 1.75030517578125, 1.84619140625, 1.94207763671875, 2.0379638671875, 2.13385009765625, 2.229736328125, 2.32562255859375, 2.4215087890625, 2.51739501953125, 2.61328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 17.0, 28.0, 47.0, 73.0, 77.0, 91.0, 109.0, 119.0, 89.0, 85.0, 89.0, 60.0, 43.0, 26.0, 10.0, 7.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.0537109375, -1.025390625, -0.9970703125, -0.96875, -0.9404296875, -0.912109375, -0.8837890625, -0.85546875, -0.8271484375, -0.798828125, -0.7705078125, -0.7421875, -0.7138671875, -0.685546875, -0.6572265625, -0.62890625, -0.6005859375, -0.572265625, -0.5439453125, -0.515625, -0.4873046875, -0.458984375, -0.4306640625, -0.40234375, -0.3740234375, -0.345703125, -0.3173828125, -0.2890625, -0.2607421875, -0.232421875, -0.2041015625, -0.17578125, -0.1474609375, -0.119140625, -0.0908203125, -0.0625, -0.0341796875, -0.005859375, 0.0224609375, 0.05078125, 0.0791015625, 0.107421875, 0.1357421875, 0.1640625, 0.1923828125, 0.220703125, 0.2490234375, 0.27734375, 0.3056640625, 0.333984375, 0.3623046875, 0.390625, 0.4189453125, 0.447265625, 0.4755859375, 0.50390625, 0.5322265625, 0.560546875, 0.5888671875, 0.6171875, 0.6455078125, 0.673828125, 0.7021484375, 0.73046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 8.0, 16.0, 39.0, 58.0, 146.0, 330.0, 838.0, 2543.0, 11314.0, 156617.0, 3877653.0, 130045.0, 10710.0, 2501.0, 810.0, 318.0, 144.0, 77.0, 40.0, 21.0, 12.0, 13.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.5723876953125, -2.478759765625, -2.3851318359375, -2.29150390625, -2.1978759765625, -2.104248046875, -2.0106201171875, -1.9169921875, -1.8233642578125, -1.729736328125, -1.6361083984375, -1.54248046875, -1.4488525390625, -1.355224609375, -1.2615966796875, -1.16796875, -1.0743408203125, -0.980712890625, -0.8870849609375, -0.79345703125, -0.6998291015625, -0.606201171875, -0.5125732421875, -0.4189453125, -0.3253173828125, -0.231689453125, -0.1380615234375, -0.04443359375, 0.0491943359375, 0.142822265625, 0.2364501953125, 0.330078125, 0.4237060546875, 0.517333984375, 0.6109619140625, 0.70458984375, 0.7982177734375, 0.891845703125, 0.9854736328125, 1.0791015625, 1.1727294921875, 1.266357421875, 1.3599853515625, 1.45361328125, 1.5472412109375, 1.640869140625, 1.7344970703125, 1.828125, 1.9217529296875, 2.015380859375, 2.1090087890625, 2.20263671875, 2.2962646484375, 2.389892578125, 2.4835205078125, 2.5771484375, 2.6707763671875, 2.764404296875, 2.8580322265625, 2.95166015625, 3.0452880859375, 3.138916015625, 3.2325439453125, 3.326171875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 9.0, 15.0, 31.0, 39.0, 65.0, 135.0, 308.0, 845.0, 1562.0, 580.0, 208.0, 106.0, 65.0, 31.0, 19.0, 15.0, 7.0, 6.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0219573974609375, -0.988250732421875, -0.9545440673828125, -0.92083740234375, -0.8871307373046875, -0.853424072265625, -0.8197174072265625, -0.7860107421875, -0.7523040771484375, -0.718597412109375, -0.6848907470703125, -0.65118408203125, -0.6174774169921875, -0.583770751953125, -0.5500640869140625, -0.516357421875, -0.4826507568359375, -0.448944091796875, -0.4152374267578125, -0.38153076171875, -0.3478240966796875, -0.314117431640625, -0.2804107666015625, -0.2467041015625, -0.2129974365234375, -0.179290771484375, -0.1455841064453125, -0.11187744140625, -0.0781707763671875, -0.044464111328125, -0.0107574462890625, 0.02294921875, 0.0566558837890625, 0.090362548828125, 0.1240692138671875, 0.15777587890625, 0.1914825439453125, 0.225189208984375, 0.2588958740234375, 0.2926025390625, 0.3263092041015625, 0.360015869140625, 0.3937225341796875, 0.42742919921875, 0.4611358642578125, 0.494842529296875, 0.5285491943359375, 0.562255859375, 0.5959625244140625, 0.629669189453125, 0.6633758544921875, 0.69708251953125, 0.7307891845703125, 0.764495849609375, 0.7982025146484375, 0.8319091796875, 0.8656158447265625, 0.899322509765625, 0.9330291748046875, 0.96673583984375, 1.0004425048828125, 1.034149169921875, 1.0678558349609375, 1.1015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 21.0, 46.0, 155.0, 261.0, 269.0, 140.0, 64.0, 21.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.197665214538574, -5.940758228302002, -5.683851718902588, -5.426944732666016, -5.170038223266602, -4.913131237030029, -4.656224250793457, -4.399317741394043, -4.142410755157471, -3.8855040073394775, -3.6285972595214844, -3.371690273284912, -3.114783525466919, -2.857876777648926, -2.6009697914123535, -2.3440630435943604, -2.087156295776367, -1.830249547958374, -1.5733426809310913, -1.3164358139038086, -1.0595290660858154, -0.8026223182678223, -0.5457154512405396, -0.28880858421325684, -0.03190183639526367, 0.22500497102737427, 0.4819117784500122, 0.7388185858726501, 0.9957253932952881, 1.2526321411132812, 1.509539008140564, 1.7664458751678467, 2.02335262298584, 2.280259370803833, 2.537166118621826, 2.7940731048583984, 3.0509798526763916, 3.3078866004943848, 3.564793586730957, 3.82170033454895, 4.078607082366943, 4.335514068603516, 4.59242057800293, 4.849327564239502, 5.106234550476074, 5.363141059875488, 5.6200480461120605, 5.876955032348633, 6.133861541748047, 6.390768527984619, 6.647675037384033, 6.9045820236206055, 7.1614885330200195, 7.418395519256592, 7.675302505493164, 7.932209014892578, 8.189115524291992, 8.446022033691406, 8.702929496765137, 8.95983600616455, 9.216742515563965, 9.473649978637695, 9.73055648803711, 9.987462997436523, 10.244370460510254]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 22.0, 12.0, 21.0, 27.0, 35.0, 27.0, 56.0, 54.0, 62.0, 88.0, 79.0, 70.0, 75.0, 75.0, 67.0, 62.0, 42.0, 38.0, 23.0, 17.0, 12.0, 10.0, 10.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.913640022277832, -4.780762672424316, -4.647884845733643, -4.515007495880127, -4.382129669189453, -4.2492523193359375, -4.116374969482422, -3.983497381210327, -3.8506197929382324, -3.7177422046661377, -3.584864616394043, -3.4519872665405273, -3.3191096782684326, -3.186232089996338, -3.0533547401428223, -2.9204771518707275, -2.787599563598633, -2.654721975326538, -2.5218443870544434, -2.3889670372009277, -2.256089448928833, -2.1232118606567383, -1.990334391593933, -1.857456922531128, -1.7245793342590332, -1.5917017459869385, -1.4588242769241333, -1.3259468078613281, -1.1930692195892334, -1.0601916313171387, -0.9273141622543335, -0.7944366335868835, -0.6615591049194336, -0.5286815762519836, -0.3958040475845337, -0.26292651891708374, -0.1300489902496338, 0.002828538417816162, 0.1357060670852661, 0.26858359575271606, 0.401461124420166, 0.534338653087616, 0.6672161817550659, 0.8000937104225159, 0.9329712390899658, 1.0658488273620605, 1.1987262964248657, 1.331603765487671, 1.4644813537597656, 1.5973589420318604, 1.7302364110946655, 1.8631138801574707, 1.9959914684295654, 2.12886905670166, 2.261746406555176, 2.3946239948272705, 2.5275015830993652, 2.66037917137146, 2.7932567596435547, 2.9261341094970703, 3.059011697769165, 3.1918892860412598, 3.3247666358947754, 3.45764422416687, 3.590521812438965]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 11.0, 11.0, 13.0, 35.0, 46.0, 89.0, 147.0, 254.0, 495.0, 984.0, 2333.0, 6496.0, 29391.0, 202197.0, 571990.0, 194824.0, 28576.0, 6344.0, 2292.0, 963.0, 448.0, 273.0, 127.0, 83.0, 52.0, 34.0, 18.0, 10.0, 10.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.63787841796875, -2.5452880859375, -2.45269775390625, -2.360107421875, -2.26751708984375, -2.1749267578125, -2.08233642578125, -1.98974609375, -1.89715576171875, -1.8045654296875, -1.71197509765625, -1.619384765625, -1.52679443359375, -1.4342041015625, -1.34161376953125, -1.2490234375, -1.15643310546875, -1.0638427734375, -0.97125244140625, -0.878662109375, -0.78607177734375, -0.6934814453125, -0.60089111328125, -0.50830078125, -0.41571044921875, -0.3231201171875, -0.23052978515625, -0.137939453125, -0.04534912109375, 0.0472412109375, 0.13983154296875, 0.232421875, 0.32501220703125, 0.4176025390625, 0.51019287109375, 0.602783203125, 0.69537353515625, 0.7879638671875, 0.88055419921875, 0.97314453125, 1.06573486328125, 1.1583251953125, 1.25091552734375, 1.343505859375, 1.43609619140625, 1.5286865234375, 1.62127685546875, 1.7138671875, 1.80645751953125, 1.8990478515625, 1.99163818359375, 2.084228515625, 2.17681884765625, 2.2694091796875, 2.36199951171875, 2.45458984375, 2.54718017578125, 2.6397705078125, 2.73236083984375, 2.824951171875, 2.91754150390625, 3.0101318359375, 3.10272216796875, 3.1953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 9.0, 19.0, 42.0, 68.0, 80.0, 111.0, 110.0, 121.0, 108.0, 88.0, 99.0, 51.0, 35.0, 17.0, 13.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.26171875, -1.2311553955078125, -1.200592041015625, -1.1700286865234375, -1.13946533203125, -1.1089019775390625, -1.078338623046875, -1.0477752685546875, -1.0172119140625, -0.9866485595703125, -0.956085205078125, -0.9255218505859375, -0.89495849609375, -0.8643951416015625, -0.833831787109375, -0.8032684326171875, -0.772705078125, -0.7421417236328125, -0.711578369140625, -0.6810150146484375, -0.65045166015625, -0.6198883056640625, -0.589324951171875, -0.5587615966796875, -0.5281982421875, -0.4976348876953125, -0.467071533203125, -0.4365081787109375, -0.40594482421875, -0.3753814697265625, -0.344818115234375, -0.3142547607421875, -0.28369140625, -0.2531280517578125, -0.222564697265625, -0.1920013427734375, -0.16143798828125, -0.1308746337890625, -0.100311279296875, -0.0697479248046875, -0.0391845703125, -0.0086212158203125, 0.021942138671875, 0.0525054931640625, 0.08306884765625, 0.1136322021484375, 0.144195556640625, 0.1747589111328125, 0.205322265625, 0.2358856201171875, 0.266448974609375, 0.2970123291015625, 0.32757568359375, 0.3581390380859375, 0.388702392578125, 0.4192657470703125, 0.4498291015625, 0.4803924560546875, 0.510955810546875, 0.5415191650390625, 0.57208251953125, 0.6026458740234375, 0.633209228515625, 0.6637725830078125, 0.6943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 13.0, 8.0, 14.0, 16.0, 29.0, 45.0, 56.0, 85.0, 110.0, 158.0, 229.0, 362.0, 649.0, 1145.0, 2122.0, 4954.0, 12826.0, 36022.0, 102697.0, 237448.0, 319107.0, 202029.0, 81386.0, 28345.0, 10276.0, 4022.0, 1785.0, 990.0, 501.0, 311.0, 242.0, 161.0, 102.0, 84.0, 63.0, 43.0, 30.0, 18.0, 17.0, 12.0, 6.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.541015625, -1.497467041015625, -1.45391845703125, -1.410369873046875, -1.3668212890625, -1.323272705078125, -1.27972412109375, -1.236175537109375, -1.192626953125, -1.149078369140625, -1.10552978515625, -1.061981201171875, -1.0184326171875, -0.974884033203125, -0.93133544921875, -0.887786865234375, -0.84423828125, -0.800689697265625, -0.75714111328125, -0.713592529296875, -0.6700439453125, -0.626495361328125, -0.58294677734375, -0.539398193359375, -0.495849609375, -0.452301025390625, -0.40875244140625, -0.365203857421875, -0.3216552734375, -0.278106689453125, -0.23455810546875, -0.191009521484375, -0.1474609375, -0.103912353515625, -0.06036376953125, -0.016815185546875, 0.0267333984375, 0.070281982421875, 0.11383056640625, 0.157379150390625, 0.200927734375, 0.244476318359375, 0.28802490234375, 0.331573486328125, 0.3751220703125, 0.418670654296875, 0.46221923828125, 0.505767822265625, 0.54931640625, 0.592864990234375, 0.63641357421875, 0.679962158203125, 0.7235107421875, 0.767059326171875, 0.81060791015625, 0.854156494140625, 0.897705078125, 0.941253662109375, 0.98480224609375, 1.028350830078125, 1.0718994140625, 1.115447998046875, 1.15899658203125, 1.202545166015625, 1.24609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 6.0, 4.0, 13.0, 14.0, 17.0, 18.0, 17.0, 23.0, 30.0, 37.0, 27.0, 30.0, 46.0, 39.0, 44.0, 44.0, 41.0, 59.0, 45.0, 57.0, 41.0, 40.0, 43.0, 37.0, 38.0, 25.0, 24.0, 22.0, 17.0, 22.0, 7.0, 8.0, 8.0, 8.0, 12.0, 12.0, 6.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.726531982421875, -1.66400146484375, -1.601470947265625, -1.5389404296875, -1.476409912109375, -1.41387939453125, -1.351348876953125, -1.288818359375, -1.226287841796875, -1.16375732421875, -1.101226806640625, -1.0386962890625, -0.976165771484375, -0.91363525390625, -0.851104736328125, -0.78857421875, -0.726043701171875, -0.66351318359375, -0.600982666015625, -0.5384521484375, -0.475921630859375, -0.41339111328125, -0.350860595703125, -0.288330078125, -0.225799560546875, -0.16326904296875, -0.100738525390625, -0.0382080078125, 0.024322509765625, 0.08685302734375, 0.149383544921875, 0.2119140625, 0.274444580078125, 0.33697509765625, 0.399505615234375, 0.4620361328125, 0.524566650390625, 0.58709716796875, 0.649627685546875, 0.712158203125, 0.774688720703125, 0.83721923828125, 0.899749755859375, 0.9622802734375, 1.024810791015625, 1.08734130859375, 1.149871826171875, 1.21240234375, 1.274932861328125, 1.33746337890625, 1.399993896484375, 1.4625244140625, 1.525054931640625, 1.58758544921875, 1.650115966796875, 1.712646484375, 1.775177001953125, 1.83770751953125, 1.900238037109375, 1.9627685546875, 2.025299072265625, 2.08782958984375, 2.150360107421875, 2.212890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 5.0, 10.0, 12.0, 20.0, 25.0, 42.0, 50.0, 78.0, 202.0, 515.0, 1867.0, 9234.0, 124383.0, 830600.0, 72350.0, 6879.0, 1463.0, 426.0, 151.0, 81.0, 52.0, 35.0, 20.0, 13.0, 9.0, 8.0, 7.0, 7.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.486328125, -1.4404754638671875, -1.394622802734375, -1.3487701416015625, -1.30291748046875, -1.2570648193359375, -1.211212158203125, -1.1653594970703125, -1.1195068359375, -1.0736541748046875, -1.027801513671875, -0.9819488525390625, -0.93609619140625, -0.8902435302734375, -0.844390869140625, -0.7985382080078125, -0.752685546875, -0.7068328857421875, -0.660980224609375, -0.6151275634765625, -0.56927490234375, -0.5234222412109375, -0.477569580078125, -0.4317169189453125, -0.3858642578125, -0.3400115966796875, -0.294158935546875, -0.2483062744140625, -0.20245361328125, -0.1566009521484375, -0.110748291015625, -0.0648956298828125, -0.01904296875, 0.0268096923828125, 0.072662353515625, 0.1185150146484375, 0.16436767578125, 0.2102203369140625, 0.256072998046875, 0.3019256591796875, 0.3477783203125, 0.3936309814453125, 0.439483642578125, 0.4853363037109375, 0.53118896484375, 0.5770416259765625, 0.622894287109375, 0.6687469482421875, 0.714599609375, 0.7604522705078125, 0.806304931640625, 0.8521575927734375, 0.89801025390625, 0.9438629150390625, 0.989715576171875, 1.0355682373046875, 1.0814208984375, 1.1272735595703125, 1.173126220703125, 1.2189788818359375, 1.26483154296875, 1.3106842041015625, 1.356536865234375, 1.4023895263671875, 1.4482421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 9.0, 4.0, 5.0, 6.0, 8.0, 17.0, 30.0, 28.0, 23.0, 36.0, 35.0, 56.0, 96.0, 90.0, 107.0, 93.0, 72.0, 60.0, 39.0, 33.0, 28.0, 24.0, 19.0, 17.0, 10.0, 9.0, 7.0, 6.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010347366333007812, -9.994953870773315e-05, -9.642541408538818e-05, -9.290128946304321e-05, -8.937716484069824e-05, -8.585304021835327e-05, -8.23289155960083e-05, -7.880479097366333e-05, -7.528066635131836e-05, -7.175654172897339e-05, -6.823241710662842e-05, -6.470829248428345e-05, -6.118416786193848e-05, -5.7660043239593506e-05, -5.4135918617248535e-05, -5.0611793994903564e-05, -4.7087669372558594e-05, -4.356354475021362e-05, -4.003942012786865e-05, -3.651529550552368e-05, -3.299117088317871e-05, -2.946704626083374e-05, -2.594292163848877e-05, -2.24187970161438e-05, -1.8894672393798828e-05, -1.5370547771453857e-05, -1.1846423149108887e-05, -8.322298526763916e-06, -4.798173904418945e-06, -1.2740492820739746e-06, 2.250075340270996e-06, 5.774199962615967e-06, 9.298324584960938e-06, 1.2822449207305908e-05, 1.634657382965088e-05, 1.987069845199585e-05, 2.339482307434082e-05, 2.691894769668579e-05, 3.0443072319030762e-05, 3.396719694137573e-05, 3.74913215637207e-05, 4.1015446186065674e-05, 4.4539570808410645e-05, 4.8063695430755615e-05, 5.1587820053100586e-05, 5.511194467544556e-05, 5.863606929779053e-05, 6.21601939201355e-05, 6.568431854248047e-05, 6.920844316482544e-05, 7.273256778717041e-05, 7.625669240951538e-05, 7.978081703186035e-05, 8.330494165420532e-05, 8.682906627655029e-05, 9.035319089889526e-05, 9.387731552124023e-05, 9.74014401435852e-05, 0.00010092556476593018, 0.00010444968938827515, 0.00010797381401062012, 0.00011149793863296509, 0.00011502206325531006, 0.00011854618787765503, 0.0001220703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 8.0, 1.0, 13.0, 10.0, 12.0, 30.0, 58.0, 87.0, 158.0, 345.0, 852.0, 2432.0, 11143.0, 169637.0, 803983.0, 51006.0, 6030.0, 1582.0, 580.0, 257.0, 130.0, 66.0, 42.0, 23.0, 18.0, 11.0, 10.0, 1.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.6435546875, -1.598297119140625, -1.55303955078125, -1.507781982421875, -1.4625244140625, -1.417266845703125, -1.37200927734375, -1.326751708984375, -1.281494140625, -1.236236572265625, -1.19097900390625, -1.145721435546875, -1.1004638671875, -1.055206298828125, -1.00994873046875, -0.964691162109375, -0.91943359375, -0.874176025390625, -0.82891845703125, -0.783660888671875, -0.7384033203125, -0.693145751953125, -0.64788818359375, -0.602630615234375, -0.557373046875, -0.512115478515625, -0.46685791015625, -0.421600341796875, -0.3763427734375, -0.331085205078125, -0.28582763671875, -0.240570068359375, -0.1953125, -0.150054931640625, -0.10479736328125, -0.059539794921875, -0.0142822265625, 0.030975341796875, 0.07623291015625, 0.121490478515625, 0.166748046875, 0.212005615234375, 0.25726318359375, 0.302520751953125, 0.3477783203125, 0.393035888671875, 0.43829345703125, 0.483551025390625, 0.52880859375, 0.574066162109375, 0.61932373046875, 0.664581298828125, 0.7098388671875, 0.755096435546875, 0.80035400390625, 0.845611572265625, 0.890869140625, 0.936126708984375, 0.98138427734375, 1.026641845703125, 1.0718994140625, 1.117156982421875, 1.16241455078125, 1.207672119140625, 1.2529296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 8.0, 20.0, 26.0, 26.0, 44.0, 72.0, 73.0, 99.0, 139.0, 118.0, 101.0, 80.0, 66.0, 33.0, 29.0, 21.0, 10.0, 9.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -1.0023651123046875, -0.974456787109375, -0.9465484619140625, -0.91864013671875, -0.8907318115234375, -0.862823486328125, -0.8349151611328125, -0.8070068359375, -0.7790985107421875, -0.751190185546875, -0.7232818603515625, -0.69537353515625, -0.6674652099609375, -0.639556884765625, -0.6116485595703125, -0.583740234375, -0.5558319091796875, -0.527923583984375, -0.5000152587890625, -0.47210693359375, -0.4441986083984375, -0.416290283203125, -0.3883819580078125, -0.3604736328125, -0.3325653076171875, -0.304656982421875, -0.2767486572265625, -0.24884033203125, -0.2209320068359375, -0.193023681640625, -0.1651153564453125, -0.13720703125, -0.1092987060546875, -0.081390380859375, -0.0534820556640625, -0.02557373046875, 0.0023345947265625, 0.030242919921875, 0.0581512451171875, 0.0860595703125, 0.1139678955078125, 0.141876220703125, 0.1697845458984375, 0.19769287109375, 0.2256011962890625, 0.253509521484375, 0.2814178466796875, 0.309326171875, 0.3372344970703125, 0.365142822265625, 0.3930511474609375, 0.42095947265625, 0.4488677978515625, 0.476776123046875, 0.5046844482421875, 0.5325927734375, 0.5605010986328125, 0.588409423828125, 0.6163177490234375, 0.64422607421875, 0.6721343994140625, 0.700042724609375, 0.7279510498046875, 0.755859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 12.0, 21.0, 37.0, 39.0, 69.0, 88.0, 126.0, 109.0, 126.0, 113.0, 83.0, 55.0, 36.0, 25.0, 13.0, 15.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.431795120239258, -11.075295448303223, -10.718795776367188, -10.362295150756836, -10.0057954788208, -9.649295806884766, -9.29279613494873, -8.936296463012695, -8.579795837402344, -8.223296165466309, -7.866796016693115, -7.51029634475708, -7.153796195983887, -6.797296524047852, -6.440796852111816, -6.084296703338623, -5.727797031402588, -5.371297359466553, -5.014797210693359, -4.658297538757324, -4.301797389984131, -3.9452977180480957, -3.5887978076934814, -3.232297897338867, -2.875797986984253, -2.5192980766296387, -2.1627981662750244, -1.8062983751296997, -1.4497984647750854, -1.0932985544204712, -0.7367987632751465, -0.3802988529205322, -0.02379894256591797, 0.3327009379863739, 0.6892008185386658, 1.0457006692886353, 1.4022005796432495, 1.7587004899978638, 2.1152002811431885, 2.4717001914978027, 2.828200101852417, 3.1847000122070312, 3.5411999225616455, 3.8976998329162598, 4.254199504852295, 4.610699653625488, 4.967199325561523, 5.323698997497559, 5.680199146270752, 6.036698818206787, 6.3931989669799805, 6.749698638916016, 7.106198787689209, 7.462698459625244, 7.8191986083984375, 8.175698280334473, 8.532197952270508, 8.888697624206543, 9.245197296142578, 9.60169792175293, 9.958197593688965, 10.314697265625, 10.671196937561035, 11.02769660949707, 11.384197235107422]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 7.0, 14.0, 13.0, 25.0, 23.0, 20.0, 31.0, 34.0, 38.0, 54.0, 64.0, 61.0, 51.0, 63.0, 55.0, 52.0, 63.0, 47.0, 52.0, 45.0, 44.0, 38.0, 21.0, 18.0, 19.0, 14.0, 13.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.21365737915039, -16.74615478515625, -16.278654098510742, -15.811151504516602, -15.343649864196777, -14.876148223876953, -14.408645629882812, -13.941143989562988, -13.473642349243164, -13.00614070892334, -12.5386381149292, -12.071136474609375, -11.60363483428955, -11.136133193969727, -10.668630599975586, -10.201128959655762, -9.733626365661621, -9.266124725341797, -8.798622131347656, -8.331120491027832, -7.863618850708008, -7.396116733551025, -6.928614616394043, -6.461112976074219, -5.993610858917236, -5.526108741760254, -5.05860710144043, -4.591104984283447, -4.123602867126465, -3.6561012268066406, -3.188599109649658, -2.721097230911255, -2.2535953521728516, -1.7860934734344482, -1.3185914754867554, -0.8510894775390625, -0.3835875988006592, 0.08391427993774414, 0.5514163970947266, 1.0189182758331299, 1.4864201545715332, 1.9539220333099365, 2.42142391204834, 2.8889260292053223, 3.3564279079437256, 3.823929786682129, 4.291431903839111, 4.758934020996094, 5.226435661315918, 5.6939377784729, 6.161439418792725, 6.628941535949707, 7.096443176269531, 7.563945293426514, 8.031447410583496, 8.49894905090332, 8.966451644897461, 9.433953285217285, 9.901455879211426, 10.36895751953125, 10.836459159851074, 11.303960800170898, 11.771463394165039, 12.238965034484863, 12.706466674804688]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 7.0, 6.0, 11.0, 22.0, 23.0, 48.0, 71.0, 142.0, 237.0, 448.0, 1149.0, 4122.0, 26049.0, 3124567.0, 1011315.0, 21323.0, 3219.0, 868.0, 337.0, 144.0, 83.0, 46.0, 17.0, 15.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.294921875, -3.200653076171875, -3.10638427734375, -3.012115478515625, -2.9178466796875, -2.823577880859375, -2.72930908203125, -2.635040283203125, -2.540771484375, -2.446502685546875, -2.35223388671875, -2.257965087890625, -2.1636962890625, -2.069427490234375, -1.97515869140625, -1.880889892578125, -1.78662109375, -1.692352294921875, -1.59808349609375, -1.503814697265625, -1.4095458984375, -1.315277099609375, -1.22100830078125, -1.126739501953125, -1.032470703125, -0.938201904296875, -0.84393310546875, -0.749664306640625, -0.6553955078125, -0.561126708984375, -0.46685791015625, -0.372589111328125, -0.2783203125, -0.184051513671875, -0.08978271484375, 0.004486083984375, 0.0987548828125, 0.193023681640625, 0.28729248046875, 0.381561279296875, 0.475830078125, 0.570098876953125, 0.66436767578125, 0.758636474609375, 0.8529052734375, 0.947174072265625, 1.04144287109375, 1.135711669921875, 1.22998046875, 1.324249267578125, 1.41851806640625, 1.512786865234375, 1.6070556640625, 1.701324462890625, 1.79559326171875, 1.889862060546875, 1.984130859375, 2.078399658203125, 2.17266845703125, 2.266937255859375, 2.3612060546875, 2.455474853515625, 2.54974365234375, 2.644012451171875, 2.73828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 13.0, 19.0, 24.0, 53.0, 61.0, 85.0, 90.0, 105.0, 112.0, 97.0, 85.0, 75.0, 58.0, 48.0, 26.0, 18.0, 13.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.25, -1.2197113037109375, -1.189422607421875, -1.1591339111328125, -1.12884521484375, -1.0985565185546875, -1.068267822265625, -1.0379791259765625, -1.0076904296875, -0.9774017333984375, -0.947113037109375, -0.9168243408203125, -0.88653564453125, -0.8562469482421875, -0.825958251953125, -0.7956695556640625, -0.765380859375, -0.7350921630859375, -0.704803466796875, -0.6745147705078125, -0.64422607421875, -0.6139373779296875, -0.583648681640625, -0.5533599853515625, -0.5230712890625, -0.4927825927734375, -0.462493896484375, -0.4322052001953125, -0.40191650390625, -0.3716278076171875, -0.341339111328125, -0.3110504150390625, -0.28076171875, -0.2504730224609375, -0.220184326171875, -0.1898956298828125, -0.15960693359375, -0.1293182373046875, -0.099029541015625, -0.0687408447265625, -0.0384521484375, -0.0081634521484375, 0.022125244140625, 0.0524139404296875, 0.08270263671875, 0.1129913330078125, 0.143280029296875, 0.1735687255859375, 0.203857421875, 0.2341461181640625, 0.264434814453125, 0.2947235107421875, 0.32501220703125, 0.3553009033203125, 0.385589599609375, 0.4158782958984375, 0.4461669921875, 0.4764556884765625, 0.506744384765625, 0.5370330810546875, 0.56732177734375, 0.5976104736328125, 0.627899169921875, 0.6581878662109375, 0.6884765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 20.0, 45.0, 66.0, 172.0, 469.0, 1383.0, 5585.0, 36514.0, 1223651.0, 2866069.0, 50795.0, 6838.0, 1646.0, 570.0, 227.0, 96.0, 44.0, 39.0, 15.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8125, -1.74554443359375, -1.6785888671875, -1.61163330078125, -1.544677734375, -1.47772216796875, -1.4107666015625, -1.34381103515625, -1.27685546875, -1.20989990234375, -1.1429443359375, -1.07598876953125, -1.009033203125, -0.94207763671875, -0.8751220703125, -0.80816650390625, -0.7412109375, -0.67425537109375, -0.6072998046875, -0.54034423828125, -0.473388671875, -0.40643310546875, -0.3394775390625, -0.27252197265625, -0.20556640625, -0.13861083984375, -0.0716552734375, -0.00469970703125, 0.062255859375, 0.12921142578125, 0.1961669921875, 0.26312255859375, 0.330078125, 0.39703369140625, 0.4639892578125, 0.53094482421875, 0.597900390625, 0.66485595703125, 0.7318115234375, 0.79876708984375, 0.86572265625, 0.93267822265625, 0.9996337890625, 1.06658935546875, 1.133544921875, 1.20050048828125, 1.2674560546875, 1.33441162109375, 1.4013671875, 1.46832275390625, 1.5352783203125, 1.60223388671875, 1.669189453125, 1.73614501953125, 1.8031005859375, 1.87005615234375, 1.93701171875, 2.00396728515625, 2.0709228515625, 2.13787841796875, 2.204833984375, 2.27178955078125, 2.3387451171875, 2.40570068359375, 2.47265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 16.0, 18.0, 29.0, 37.0, 65.0, 139.0, 302.0, 986.0, 1525.0, 506.0, 195.0, 101.0, 49.0, 32.0, 24.0, 13.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.599609375, -0.5775680541992188, -0.5555267333984375, -0.5334854125976562, -0.511444091796875, -0.48940277099609375, -0.4673614501953125, -0.44532012939453125, -0.42327880859375, -0.40123748779296875, -0.3791961669921875, -0.35715484619140625, -0.335113525390625, -0.31307220458984375, -0.2910308837890625, -0.26898956298828125, -0.2469482421875, -0.22490692138671875, -0.2028656005859375, -0.18082427978515625, -0.158782958984375, -0.13674163818359375, -0.1147003173828125, -0.09265899658203125, -0.07061767578125, -0.04857635498046875, -0.0265350341796875, -0.00449371337890625, 0.017547607421875, 0.03958892822265625, 0.0616302490234375, 0.08367156982421875, 0.105712890625, 0.12775421142578125, 0.1497955322265625, 0.17183685302734375, 0.193878173828125, 0.21591949462890625, 0.2379608154296875, 0.26000213623046875, 0.28204345703125, 0.30408477783203125, 0.3261260986328125, 0.34816741943359375, 0.370208740234375, 0.39225006103515625, 0.4142913818359375, 0.43633270263671875, 0.4583740234375, 0.48041534423828125, 0.5024566650390625, 0.5244979858398438, 0.546539306640625, 0.5685806274414062, 0.5906219482421875, 0.6126632690429688, 0.63470458984375, 0.6567459106445312, 0.6787872314453125, 0.7008285522460938, 0.722869873046875, 0.7449111938476562, 0.7669525146484375, 0.7889938354492188, 0.81103515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 12.0, 36.0, 110.0, 240.0, 299.0, 197.0, 76.0, 23.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.980940818786621, -1.7667518854141235, -1.552562952041626, -1.338374137878418, -1.1241850852966309, -0.9099962711334229, -0.6958073377609253, -0.48161840438842773, -0.2674294710159302, -0.05324055254459381, 0.16094836592674255, 0.3751372694969177, 0.5893262028694153, 0.8035150766372681, 1.0177040100097656, 1.2318929433822632, 1.4460818767547607, 1.6602708101272583, 1.8744597434997559, 2.088648557662964, 2.302837610244751, 2.517026424407959, 2.731215476989746, 2.945404291152954, 3.159593105316162, 3.37378191947937, 3.5879709720611572, 3.8021597862243652, 4.016348838806152, 4.230537414550781, 4.444726467132568, 4.6589155197143555, 4.873104572296143, 5.08729362487793, 5.301482200622559, 5.515671253204346, 5.729860305786133, 5.944048881530762, 6.158237934112549, 6.372426986694336, 6.586616039276123, 6.80080509185791, 7.014993667602539, 7.229182720184326, 7.443371772766113, 7.657560348510742, 7.871749401092529, 8.085938453674316, 8.300127029418945, 8.514315605163574, 8.72850513458252, 8.942693710327148, 9.156882286071777, 9.371071815490723, 9.585260391235352, 9.799449920654297, 10.013638496398926, 10.227827072143555, 10.4420166015625, 10.656205177307129, 10.870393753051758, 11.084583282470703, 11.298771858215332, 11.512960433959961, 11.727149963378906]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 3.0, 7.0, 6.0, 10.0, 19.0, 26.0, 18.0, 29.0, 28.0, 19.0, 41.0, 44.0, 40.0, 49.0, 56.0, 54.0, 44.0, 51.0, 54.0, 41.0, 46.0, 37.0, 49.0, 33.0, 39.0, 22.0, 21.0, 25.0, 11.0, 18.0, 14.0, 3.0, 5.0, 5.0, 5.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.728029489517212, -1.6730456352233887, -1.6180616617202759, -1.5630778074264526, -1.5080938339233398, -1.4531099796295166, -1.3981261253356934, -1.3431422710418701, -1.2881582975387573, -1.233174443244934, -1.1781904697418213, -1.123206615447998, -1.0682227611541748, -1.013238787651062, -0.9582549333572388, -0.9032710194587708, -0.8482871055603027, -0.7933031916618347, -0.7383192777633667, -0.6833354234695435, -0.6283515095710754, -0.5733675956726074, -0.5183837413787842, -0.46339982748031616, -0.40841591358184814, -0.3534319996833801, -0.2984481155872345, -0.24346421658992767, -0.18848031759262085, -0.13349640369415283, -0.0785125195980072, -0.023528635501861572, 0.031455397605895996, 0.08643929660320282, 0.14142319560050964, 0.19640709459781647, 0.2513909935951233, 0.3063749074935913, 0.36135879158973694, 0.41634267568588257, 0.4713265895843506, 0.5263105034828186, 0.5812944173812866, 0.6362782716751099, 0.6912621855735779, 0.7462460994720459, 0.8012299537658691, 0.8562138676643372, 0.9111977815628052, 0.9661816954612732, 1.0211656093597412, 1.0761494636535645, 1.1311333179473877, 1.1861172914505005, 1.2411011457443237, 1.2960851192474365, 1.3510689735412598, 1.406052827835083, 1.4610368013381958, 1.516020655632019, 1.5710046291351318, 1.625988483428955, 1.6809723377227783, 1.7359561920166016, 1.7909401655197144]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 15.0, 15.0, 29.0, 42.0, 53.0, 77.0, 111.0, 175.0, 268.0, 380.0, 658.0, 1192.0, 2209.0, 4927.0, 12625.0, 39427.0, 130074.0, 324978.0, 332354.0, 134337.0, 40852.0, 13152.0, 5094.0, 2379.0, 1197.0, 679.0, 398.0, 268.0, 170.0, 118.0, 69.0, 61.0, 46.0, 33.0, 18.0, 17.0, 11.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7724609375, -1.7153167724609375, -1.658172607421875, -1.6010284423828125, -1.54388427734375, -1.4867401123046875, -1.429595947265625, -1.3724517822265625, -1.3153076171875, -1.2581634521484375, -1.201019287109375, -1.1438751220703125, -1.08673095703125, -1.0295867919921875, -0.972442626953125, -0.9152984619140625, -0.858154296875, -0.8010101318359375, -0.743865966796875, -0.6867218017578125, -0.62957763671875, -0.5724334716796875, -0.515289306640625, -0.4581451416015625, -0.4010009765625, -0.3438568115234375, -0.286712646484375, -0.2295684814453125, -0.17242431640625, -0.1152801513671875, -0.058135986328125, -0.0009918212890625, 0.05615234375, 0.1132965087890625, 0.170440673828125, 0.2275848388671875, 0.28472900390625, 0.3418731689453125, 0.399017333984375, 0.4561614990234375, 0.5133056640625, 0.5704498291015625, 0.627593994140625, 0.6847381591796875, 0.74188232421875, 0.7990264892578125, 0.856170654296875, 0.9133148193359375, 0.970458984375, 1.0276031494140625, 1.084747314453125, 1.1418914794921875, 1.19903564453125, 1.2561798095703125, 1.313323974609375, 1.3704681396484375, 1.4276123046875, 1.4847564697265625, 1.541900634765625, 1.5990447998046875, 1.65618896484375, 1.7133331298828125, 1.770477294921875, 1.8276214599609375, 1.884765625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 14.0, 32.0, 41.0, 65.0, 92.0, 99.0, 103.0, 114.0, 115.0, 81.0, 72.0, 61.0, 41.0, 21.0, 17.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3330078125, -1.3013992309570312, -1.2697906494140625, -1.2381820678710938, -1.206573486328125, -1.1749649047851562, -1.1433563232421875, -1.1117477416992188, -1.08013916015625, -1.0485305786132812, -1.0169219970703125, -0.9853134155273438, -0.953704833984375, -0.9220962524414062, -0.8904876708984375, -0.8588790893554688, -0.8272705078125, -0.7956619262695312, -0.7640533447265625, -0.7324447631835938, -0.700836181640625, -0.6692276000976562, -0.6376190185546875, -0.6060104370117188, -0.57440185546875, -0.5427932739257812, -0.5111846923828125, -0.47957611083984375, -0.447967529296875, -0.41635894775390625, -0.3847503662109375, -0.35314178466796875, -0.321533203125, -0.28992462158203125, -0.2583160400390625, -0.22670745849609375, -0.195098876953125, -0.16349029541015625, -0.1318817138671875, -0.10027313232421875, -0.06866455078125, -0.03705596923828125, -0.0054473876953125, 0.02616119384765625, 0.057769775390625, 0.08937835693359375, 0.1209869384765625, 0.15259552001953125, 0.1842041015625, 0.21581268310546875, 0.2474212646484375, 0.27902984619140625, 0.310638427734375, 0.34224700927734375, 0.3738555908203125, 0.40546417236328125, 0.43707275390625, 0.46868133544921875, 0.5002899169921875, 0.5318984985351562, 0.563507080078125, 0.5951156616210938, 0.6267242431640625, 0.6583328247070312, 0.68994140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 7.0, 5.0, 10.0, 15.0, 10.0, 21.0, 26.0, 36.0, 51.0, 73.0, 83.0, 133.0, 204.0, 308.0, 461.0, 777.0, 1533.0, 3614.0, 10707.0, 35140.0, 118021.0, 302253.0, 345028.0, 157970.0, 48771.0, 14275.0, 4713.0, 1794.0, 877.0, 537.0, 327.0, 206.0, 162.0, 108.0, 99.0, 47.0, 44.0, 36.0, 27.0, 11.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.51953125, -1.4707183837890625, -1.421905517578125, -1.3730926513671875, -1.32427978515625, -1.2754669189453125, -1.226654052734375, -1.1778411865234375, -1.1290283203125, -1.0802154541015625, -1.031402587890625, -0.9825897216796875, -0.93377685546875, -0.8849639892578125, -0.836151123046875, -0.7873382568359375, -0.738525390625, -0.6897125244140625, -0.640899658203125, -0.5920867919921875, -0.54327392578125, -0.4944610595703125, -0.445648193359375, -0.3968353271484375, -0.3480224609375, -0.2992095947265625, -0.250396728515625, -0.2015838623046875, -0.15277099609375, -0.1039581298828125, -0.055145263671875, -0.0063323974609375, 0.04248046875, 0.0912933349609375, 0.140106201171875, 0.1889190673828125, 0.23773193359375, 0.2865447998046875, 0.335357666015625, 0.3841705322265625, 0.4329833984375, 0.4817962646484375, 0.530609130859375, 0.5794219970703125, 0.62823486328125, 0.6770477294921875, 0.725860595703125, 0.7746734619140625, 0.823486328125, 0.8722991943359375, 0.921112060546875, 0.9699249267578125, 1.01873779296875, 1.0675506591796875, 1.116363525390625, 1.1651763916015625, 1.2139892578125, 1.2628021240234375, 1.311614990234375, 1.3604278564453125, 1.40924072265625, 1.4580535888671875, 1.506866455078125, 1.5556793212890625, 1.6044921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 3.0, 6.0, 5.0, 7.0, 5.0, 10.0, 10.0, 18.0, 24.0, 21.0, 22.0, 24.0, 25.0, 36.0, 45.0, 40.0, 52.0, 45.0, 55.0, 58.0, 52.0, 40.0, 50.0, 39.0, 31.0, 32.0, 23.0, 31.0, 32.0, 26.0, 23.0, 10.0, 19.0, 11.0, 11.0, 9.0, 10.0, 11.0, 5.0, 9.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9150390625, -1.8537445068359375, -1.792449951171875, -1.7311553955078125, -1.66986083984375, -1.6085662841796875, -1.547271728515625, -1.4859771728515625, -1.4246826171875, -1.3633880615234375, -1.302093505859375, -1.2407989501953125, -1.17950439453125, -1.1182098388671875, -1.056915283203125, -0.9956207275390625, -0.934326171875, -0.8730316162109375, -0.811737060546875, -0.7504425048828125, -0.68914794921875, -0.6278533935546875, -0.566558837890625, -0.5052642822265625, -0.4439697265625, -0.3826751708984375, -0.321380615234375, -0.2600860595703125, -0.19879150390625, -0.1374969482421875, -0.076202392578125, -0.0149078369140625, 0.04638671875, 0.1076812744140625, 0.168975830078125, 0.2302703857421875, 0.29156494140625, 0.3528594970703125, 0.414154052734375, 0.4754486083984375, 0.5367431640625, 0.5980377197265625, 0.659332275390625, 0.7206268310546875, 0.78192138671875, 0.8432159423828125, 0.904510498046875, 0.9658050537109375, 1.027099609375, 1.0883941650390625, 1.149688720703125, 1.2109832763671875, 1.27227783203125, 1.3335723876953125, 1.394866943359375, 1.4561614990234375, 1.5174560546875, 1.5787506103515625, 1.640045166015625, 1.7013397216796875, 1.76263427734375, 1.8239288330078125, 1.885223388671875, 1.9465179443359375, 2.0078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 10.0, 28.0, 20.0, 33.0, 53.0, 94.0, 118.0, 195.0, 381.0, 649.0, 1245.0, 2625.0, 6101.0, 17951.0, 83124.0, 487298.0, 366973.0, 57904.0, 14021.0, 4973.0, 2207.0, 1049.0, 604.0, 338.0, 172.0, 101.0, 74.0, 57.0, 35.0, 23.0, 21.0, 14.0, 11.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.912109375, -0.8859710693359375, -0.859832763671875, -0.8336944580078125, -0.80755615234375, -0.7814178466796875, -0.755279541015625, -0.7291412353515625, -0.7030029296875, -0.6768646240234375, -0.650726318359375, -0.6245880126953125, -0.59844970703125, -0.5723114013671875, -0.546173095703125, -0.5200347900390625, -0.493896484375, -0.4677581787109375, -0.441619873046875, -0.4154815673828125, -0.38934326171875, -0.3632049560546875, -0.337066650390625, -0.3109283447265625, -0.2847900390625, -0.2586517333984375, -0.232513427734375, -0.2063751220703125, -0.18023681640625, -0.1540985107421875, -0.127960205078125, -0.1018218994140625, -0.07568359375, -0.0495452880859375, -0.023406982421875, 0.0027313232421875, 0.02886962890625, 0.0550079345703125, 0.081146240234375, 0.1072845458984375, 0.1334228515625, 0.1595611572265625, 0.185699462890625, 0.2118377685546875, 0.23797607421875, 0.2641143798828125, 0.290252685546875, 0.3163909912109375, 0.342529296875, 0.3686676025390625, 0.394805908203125, 0.4209442138671875, 0.44708251953125, 0.4732208251953125, 0.499359130859375, 0.5254974365234375, 0.5516357421875, 0.5777740478515625, 0.603912353515625, 0.6300506591796875, 0.65618896484375, 0.6823272705078125, 0.708465576171875, 0.7346038818359375, 0.7607421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 5.0, 14.0, 12.0, 16.0, 25.0, 25.0, 29.0, 49.0, 56.0, 84.0, 121.0, 128.0, 95.0, 81.0, 41.0, 44.0, 37.0, 32.0, 25.0, 17.0, 13.0, 11.0, 13.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00016689300537109375, -0.00016153976321220398, -0.0001561865210533142, -0.00015083327889442444, -0.00014548003673553467, -0.0001401267945766449, -0.00013477355241775513, -0.00012942031025886536, -0.00012406706809997559, -0.00011871382594108582, -0.00011336058378219604, -0.00010800734162330627, -0.0001026540994644165, -9.730085730552673e-05, -9.194761514663696e-05, -8.659437298774719e-05, -8.124113082885742e-05, -7.588788866996765e-05, -7.053464651107788e-05, -6.518140435218811e-05, -5.982816219329834e-05, -5.447492003440857e-05, -4.91216778755188e-05, -4.376843571662903e-05, -3.841519355773926e-05, -3.306195139884949e-05, -2.7708709239959717e-05, -2.2355467081069946e-05, -1.7002224922180176e-05, -1.1648982763290405e-05, -6.295740604400635e-06, -9.424984455108643e-07, 4.410743713378906e-06, 9.763985872268677e-06, 1.5117228031158447e-05, 2.0470470190048218e-05, 2.5823712348937988e-05, 3.117695450782776e-05, 3.653019666671753e-05, 4.18834388256073e-05, 4.723668098449707e-05, 5.258992314338684e-05, 5.794316530227661e-05, 6.329640746116638e-05, 6.864964962005615e-05, 7.400289177894592e-05, 7.93561339378357e-05, 8.470937609672546e-05, 9.006261825561523e-05, 9.5415860414505e-05, 0.00010076910257339478, 0.00010612234473228455, 0.00011147558689117432, 0.00011682882905006409, 0.00012218207120895386, 0.00012753531336784363, 0.0001328885555267334, 0.00013824179768562317, 0.00014359503984451294, 0.0001489482820034027, 0.00015430152416229248, 0.00015965476632118225, 0.00016500800848007202, 0.0001703612506389618, 0.00017571449279785156]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 11.0, 16.0, 26.0, 38.0, 48.0, 68.0, 132.0, 211.0, 470.0, 1056.0, 2340.0, 6723.0, 28111.0, 214657.0, 673707.0, 96485.0, 16500.0, 4654.0, 1685.0, 747.0, 336.0, 191.0, 92.0, 82.0, 61.0, 26.0, 25.0, 8.0, 9.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97900390625, -0.9467239379882812, -0.9144439697265625, -0.8821640014648438, -0.849884033203125, -0.8176040649414062, -0.7853240966796875, -0.7530441284179688, -0.72076416015625, -0.6884841918945312, -0.6562042236328125, -0.6239242553710938, -0.591644287109375, -0.5593643188476562, -0.5270843505859375, -0.49480438232421875, -0.4625244140625, -0.43024444580078125, -0.3979644775390625, -0.36568450927734375, -0.333404541015625, -0.30112457275390625, -0.2688446044921875, -0.23656463623046875, -0.20428466796875, -0.17200469970703125, -0.1397247314453125, -0.10744476318359375, -0.075164794921875, -0.04288482666015625, -0.0106048583984375, 0.02167510986328125, 0.053955078125, 0.08623504638671875, 0.1185150146484375, 0.15079498291015625, 0.183074951171875, 0.21535491943359375, 0.2476348876953125, 0.27991485595703125, 0.31219482421875, 0.34447479248046875, 0.3767547607421875, 0.40903472900390625, 0.441314697265625, 0.47359466552734375, 0.5058746337890625, 0.5381546020507812, 0.5704345703125, 0.6027145385742188, 0.6349945068359375, 0.6672744750976562, 0.699554443359375, 0.7318344116210938, 0.7641143798828125, 0.7963943481445312, 0.82867431640625, 0.8609542846679688, 0.8932342529296875, 0.9255142211914062, 0.957794189453125, 0.9900741577148438, 1.0223541259765625, 1.0546340942382812, 1.0869140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 8.0, 14.0, 16.0, 23.0, 28.0, 60.0, 68.0, 82.0, 141.0, 133.0, 119.0, 97.0, 64.0, 38.0, 28.0, 24.0, 12.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9091644287109375, -0.875946044921875, -0.8427276611328125, -0.80950927734375, -0.7762908935546875, -0.743072509765625, -0.7098541259765625, -0.6766357421875, -0.6434173583984375, -0.610198974609375, -0.5769805908203125, -0.54376220703125, -0.5105438232421875, -0.477325439453125, -0.4441070556640625, -0.410888671875, -0.3776702880859375, -0.344451904296875, -0.3112335205078125, -0.27801513671875, -0.2447967529296875, -0.211578369140625, -0.1783599853515625, -0.1451416015625, -0.1119232177734375, -0.078704833984375, -0.0454864501953125, -0.01226806640625, 0.0209503173828125, 0.054168701171875, 0.0873870849609375, 0.12060546875, 0.1538238525390625, 0.187042236328125, 0.2202606201171875, 0.25347900390625, 0.2866973876953125, 0.319915771484375, 0.3531341552734375, 0.3863525390625, 0.4195709228515625, 0.452789306640625, 0.4860076904296875, 0.51922607421875, 0.5524444580078125, 0.585662841796875, 0.6188812255859375, 0.652099609375, 0.6853179931640625, 0.718536376953125, 0.7517547607421875, 0.78497314453125, 0.8181915283203125, 0.851409912109375, 0.8846282958984375, 0.9178466796875, 0.9510650634765625, 0.984283447265625, 1.0175018310546875, 1.05072021484375, 1.0839385986328125, 1.117156982421875, 1.1503753662109375, 1.18359375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 10.0, 11.0, 21.0, 28.0, 50.0, 57.0, 98.0, 135.0, 127.0, 142.0, 105.0, 84.0, 41.0, 29.0, 21.0, 13.0, 5.0, 10.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.689489364624023, -14.266870498657227, -13.84425163269043, -13.421632766723633, -12.999013900756836, -12.576395034790039, -12.153776168823242, -11.731157302856445, -11.308538436889648, -10.885919570922852, -10.463300704956055, -10.040681838989258, -9.618062973022461, -9.195444107055664, -8.772825241088867, -8.35020637512207, -7.927587509155273, -7.504968643188477, -7.08234977722168, -6.659730911254883, -6.237112045288086, -5.814493179321289, -5.391874313354492, -4.969255447387695, -4.546636581420898, -4.124017715454102, -3.7013988494873047, -3.278779983520508, -2.856161117553711, -2.433542251586914, -2.010923385620117, -1.5883045196533203, -1.1656856536865234, -0.7430667877197266, -0.3204479217529297, 0.10217094421386719, 0.5247898101806641, 0.9474086761474609, 1.3700275421142578, 1.7926464080810547, 2.2152652740478516, 2.6378841400146484, 3.0605030059814453, 3.483121871948242, 3.905740737915039, 4.328359603881836, 4.750978469848633, 5.17359733581543, 5.596216201782227, 6.018835067749023, 6.44145393371582, 6.864072799682617, 7.286691665649414, 7.709310531616211, 8.131929397583008, 8.554548263549805, 8.977167129516602, 9.399785995483398, 9.822404861450195, 10.245023727416992, 10.667642593383789, 11.090261459350586, 11.512880325317383, 11.93549919128418, 12.358118057250977]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 6.0, 8.0, 6.0, 8.0, 12.0, 14.0, 12.0, 16.0, 17.0, 20.0, 21.0, 26.0, 31.0, 38.0, 33.0, 55.0, 42.0, 30.0, 38.0, 42.0, 40.0, 44.0, 44.0, 38.0, 45.0, 37.0, 32.0, 23.0, 34.0, 32.0, 21.0, 18.0, 24.0, 14.0, 15.0, 11.0, 13.0, 10.0, 5.0, 3.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.59252643585205, -10.253106117248535, -9.91368579864502, -9.574264526367188, -9.234844207763672, -8.895423889160156, -8.55600357055664, -8.216583251953125, -7.877161979675293, -7.537741661071777, -7.1983208656311035, -6.858900547027588, -6.519479751586914, -6.180059432983398, -5.840639114379883, -5.501218318939209, -5.161798000335693, -4.822377681732178, -4.482956886291504, -4.143536567687988, -3.8041157722473145, -3.464695453643799, -3.125274896621704, -2.7858543395996094, -2.4464337825775146, -2.10701322555542, -1.7675926685333252, -1.42817223072052, -1.0887516736984253, -0.7493311166763306, -0.4099106788635254, -0.07049012184143066, 0.26893043518066406, 0.6083509922027588, 0.9477714896202087, 1.2871919870376587, 1.6266125440597534, 1.9660331010818481, 2.3054535388946533, 2.644874095916748, 2.9842946529388428, 3.3237152099609375, 3.6631357669830322, 4.002556324005127, 4.341976642608643, 4.681397438049316, 5.020817756652832, 5.360238075256348, 5.6996588706970215, 6.039079189300537, 6.378499984741211, 6.717920303344727, 7.0573410987854, 7.396761417388916, 7.73618221282959, 8.075602531433105, 8.415022850036621, 8.754443168640137, 9.093863487243652, 9.433284759521484, 9.772705078125, 10.112125396728516, 10.451545715332031, 10.790966033935547, 11.130387306213379]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 11.0, 9.0, 12.0, 16.0, 23.0, 33.0, 36.0, 55.0, 113.0, 215.0, 329.0, 663.0, 1501.0, 4366.0, 19693.0, 301367.0, 3789704.0, 63177.0, 8729.0, 2373.0, 925.0, 439.0, 209.0, 117.0, 62.0, 41.0, 23.0, 11.0, 8.0, 4.0, 7.0, 0.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.279296875, -3.197845458984375, -3.11639404296875, -3.034942626953125, -2.9534912109375, -2.872039794921875, -2.79058837890625, -2.709136962890625, -2.627685546875, -2.546234130859375, -2.46478271484375, -2.383331298828125, -2.3018798828125, -2.220428466796875, -2.13897705078125, -2.057525634765625, -1.97607421875, -1.894622802734375, -1.81317138671875, -1.731719970703125, -1.6502685546875, -1.568817138671875, -1.48736572265625, -1.405914306640625, -1.324462890625, -1.243011474609375, -1.16156005859375, -1.080108642578125, -0.9986572265625, -0.917205810546875, -0.83575439453125, -0.754302978515625, -0.6728515625, -0.591400146484375, -0.50994873046875, -0.428497314453125, -0.3470458984375, -0.265594482421875, -0.18414306640625, -0.102691650390625, -0.021240234375, 0.060211181640625, 0.14166259765625, 0.223114013671875, 0.3045654296875, 0.386016845703125, 0.46746826171875, 0.548919677734375, 0.63037109375, 0.711822509765625, 0.79327392578125, 0.874725341796875, 0.9561767578125, 1.037628173828125, 1.11907958984375, 1.200531005859375, 1.281982421875, 1.363433837890625, 1.44488525390625, 1.526336669921875, 1.6077880859375, 1.689239501953125, 1.77069091796875, 1.852142333984375, 1.93359375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 25.0, 29.0, 39.0, 54.0, 70.0, 93.0, 102.0, 81.0, 90.0, 90.0, 86.0, 65.0, 61.0, 30.0, 21.0, 21.0, 16.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.330078125, -1.2982406616210938, -1.2664031982421875, -1.2345657348632812, -1.202728271484375, -1.1708908081054688, -1.1390533447265625, -1.1072158813476562, -1.07537841796875, -1.0435409545898438, -1.0117034912109375, -0.9798660278320312, -0.948028564453125, -0.9161911010742188, -0.8843536376953125, -0.8525161743164062, -0.8206787109375, -0.7888412475585938, -0.7570037841796875, -0.7251663208007812, -0.693328857421875, -0.6614913940429688, -0.6296539306640625, -0.5978164672851562, -0.56597900390625, -0.5341415405273438, -0.5023040771484375, -0.47046661376953125, -0.438629150390625, -0.40679168701171875, -0.3749542236328125, -0.34311676025390625, -0.311279296875, -0.27944183349609375, -0.2476043701171875, -0.21576690673828125, -0.183929443359375, -0.15209197998046875, -0.1202545166015625, -0.08841705322265625, -0.05657958984375, -0.02474212646484375, 0.0070953369140625, 0.03893280029296875, 0.070770263671875, 0.10260772705078125, 0.1344451904296875, 0.16628265380859375, 0.1981201171875, 0.22995758056640625, 0.2617950439453125, 0.29363250732421875, 0.325469970703125, 0.35730743408203125, 0.3891448974609375, 0.42098236083984375, 0.45281982421875, 0.48465728759765625, 0.5164947509765625, 0.5483322143554688, 0.580169677734375, 0.6120071411132812, 0.6438446044921875, 0.6756820678710938, 0.70751953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 21.0, 21.0, 33.0, 64.0, 117.0, 208.0, 382.0, 894.0, 2464.0, 8486.0, 44516.0, 832912.0, 3196353.0, 88364.0, 13483.0, 3597.0, 1282.0, 496.0, 247.0, 139.0, 73.0, 45.0, 32.0, 20.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.986328125, -1.9281768798828125, -1.870025634765625, -1.8118743896484375, -1.75372314453125, -1.6955718994140625, -1.637420654296875, -1.5792694091796875, -1.5211181640625, -1.4629669189453125, -1.404815673828125, -1.3466644287109375, -1.28851318359375, -1.2303619384765625, -1.172210693359375, -1.1140594482421875, -1.055908203125, -0.9977569580078125, -0.939605712890625, -0.8814544677734375, -0.82330322265625, -0.7651519775390625, -0.707000732421875, -0.6488494873046875, -0.5906982421875, -0.5325469970703125, -0.474395751953125, -0.4162445068359375, -0.35809326171875, -0.2999420166015625, -0.241790771484375, -0.1836395263671875, -0.12548828125, -0.0673370361328125, -0.009185791015625, 0.0489654541015625, 0.10711669921875, 0.1652679443359375, 0.223419189453125, 0.2815704345703125, 0.3397216796875, 0.3978729248046875, 0.456024169921875, 0.5141754150390625, 0.57232666015625, 0.6304779052734375, 0.688629150390625, 0.7467803955078125, 0.804931640625, 0.8630828857421875, 0.921234130859375, 0.9793853759765625, 1.03753662109375, 1.0956878662109375, 1.153839111328125, 1.2119903564453125, 1.2701416015625, 1.3282928466796875, 1.386444091796875, 1.4445953369140625, 1.50274658203125, 1.5608978271484375, 1.619049072265625, 1.6772003173828125, 1.7353515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 12.0, 7.0, 14.0, 17.0, 47.0, 47.0, 123.0, 215.0, 523.0, 1587.0, 872.0, 293.0, 136.0, 51.0, 35.0, 27.0, 16.0, 6.0, 13.0, 6.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7998046875, -0.7728958129882812, -0.7459869384765625, -0.7190780639648438, -0.692169189453125, -0.6652603149414062, -0.6383514404296875, -0.6114425659179688, -0.58453369140625, -0.5576248168945312, -0.5307159423828125, -0.5038070678710938, -0.476898193359375, -0.44998931884765625, -0.4230804443359375, -0.39617156982421875, -0.3692626953125, -0.34235382080078125, -0.3154449462890625, -0.28853607177734375, -0.261627197265625, -0.23471832275390625, -0.2078094482421875, -0.18090057373046875, -0.15399169921875, -0.12708282470703125, -0.1001739501953125, -0.07326507568359375, -0.046356201171875, -0.01944732666015625, 0.0074615478515625, 0.03437042236328125, 0.061279296875, 0.08818817138671875, 0.1150970458984375, 0.14200592041015625, 0.168914794921875, 0.19582366943359375, 0.2227325439453125, 0.24964141845703125, 0.27655029296875, 0.30345916748046875, 0.3303680419921875, 0.35727691650390625, 0.384185791015625, 0.41109466552734375, 0.4380035400390625, 0.46491241455078125, 0.4918212890625, 0.5187301635742188, 0.5456390380859375, 0.5725479125976562, 0.599456787109375, 0.6263656616210938, 0.6532745361328125, 0.6801834106445312, 0.70709228515625, 0.7340011596679688, 0.7609100341796875, 0.7878189086914062, 0.814727783203125, 0.8416366577148438, 0.8685455322265625, 0.8954544067382812, 0.92236328125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 6.0, 26.0, 163.0, 345.0, 321.0, 123.0, 14.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.086357116699219, -4.748605251312256, -4.410853385925293, -4.073101043701172, -3.735349416732788, -3.397597551345825, -3.059845447540283, -2.7220935821533203, -2.3843417167663574, -2.0465898513793945, -1.708837866783142, -1.3710858821868896, -1.0333340167999268, -0.6955821514129639, -0.3578300476074219, -0.020078182220458984, 0.3176736831665039, 0.6554256081581116, 0.9931775331497192, 1.3309295177459717, 1.6686813831329346, 2.0064332485198975, 2.3441853523254395, 2.6819372177124023, 3.0196890830993652, 3.357440948486328, 3.695192813873291, 4.032944679260254, 4.370697021484375, 4.70844841003418, 5.046200752258301, 5.383952617645264, 5.721704483032227, 6.0594563484191895, 6.397208213806152, 6.734960556030273, 7.072711944580078, 7.410464286804199, 7.748216152191162, 8.085968017578125, 8.42371940612793, 8.76147174835205, 9.099223136901855, 9.436975479125977, 9.774726867675781, 10.112479209899902, 10.450231552124023, 10.787982940673828, 11.12573528289795, 11.46348762512207, 11.801239013671875, 12.138991355895996, 12.4767427444458, 12.814495086669922, 13.152246475219727, 13.489998817443848, 13.827751159667969, 14.16550350189209, 14.503254890441895, 14.841007232666016, 15.17875862121582, 15.516510963439941, 15.854263305664062, 16.192014694213867, 16.529766082763672]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 11.0, 9.0, 10.0, 14.0, 18.0, 23.0, 30.0, 38.0, 47.0, 51.0, 50.0, 42.0, 38.0, 47.0, 57.0, 66.0, 70.0, 49.0, 54.0, 48.0, 37.0, 48.0, 29.0, 26.0, 23.0, 16.0, 11.0, 9.0, 7.0, 8.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5575668811798096, -3.4646031856536865, -3.3716394901275635, -3.2786757946014404, -3.1857123374938965, -3.0927486419677734, -2.9997849464416504, -2.9068212509155273, -2.8138575553894043, -2.7208938598632812, -2.627930164337158, -2.534966468811035, -2.442002773284912, -2.349039316177368, -2.256075620651245, -2.163111925125122, -2.070148229598999, -1.977184534072876, -1.884220838546753, -1.7912572622299194, -1.6982935667037964, -1.6053298711776733, -1.5123662948608398, -1.4194025993347168, -1.3264389038085938, -1.2334752082824707, -1.1405115127563477, -1.0475479364395142, -0.9545842409133911, -0.8616205453872681, -0.7686569094657898, -0.6756932735443115, -0.5827293395996094, -0.4897656738758087, -0.39680200815200806, -0.3038383424282074, -0.21087467670440674, -0.11791101098060608, -0.02494734525680542, 0.06801629066467285, 0.1609799861907959, 0.25394365191459656, 0.3469073176383972, 0.4398709833621979, 0.5328346490859985, 0.6257983446121216, 0.7187619805335999, 0.8117256164550781, 0.9046893119812012, 0.9976530075073242, 1.0906167030334473, 1.1835802793502808, 1.2765439748764038, 1.3695076704025269, 1.4624712467193604, 1.5554349422454834, 1.6483986377716064, 1.7413623332977295, 1.8343260288238525, 1.927289605140686, 2.0202531814575195, 2.1132168769836426, 2.2061805725097656, 2.2991442680358887, 2.3921079635620117]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 11.0, 19.0, 26.0, 48.0, 67.0, 137.0, 232.0, 353.0, 736.0, 1496.0, 3424.0, 9445.0, 32783.0, 141205.0, 480386.0, 286695.0, 64764.0, 16736.0, 5486.0, 2186.0, 1076.0, 509.0, 269.0, 150.0, 115.0, 53.0, 31.0, 30.0, 14.0, 15.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.45269775390625, -2.3800048828125, -2.30731201171875, -2.234619140625, -2.16192626953125, -2.0892333984375, -2.01654052734375, -1.94384765625, -1.87115478515625, -1.7984619140625, -1.72576904296875, -1.653076171875, -1.58038330078125, -1.5076904296875, -1.43499755859375, -1.3623046875, -1.28961181640625, -1.2169189453125, -1.14422607421875, -1.071533203125, -0.99884033203125, -0.9261474609375, -0.85345458984375, -0.78076171875, -0.70806884765625, -0.6353759765625, -0.56268310546875, -0.489990234375, -0.41729736328125, -0.3446044921875, -0.27191162109375, -0.19921875, -0.12652587890625, -0.0538330078125, 0.01885986328125, 0.091552734375, 0.16424560546875, 0.2369384765625, 0.30963134765625, 0.38232421875, 0.45501708984375, 0.5277099609375, 0.60040283203125, 0.673095703125, 0.74578857421875, 0.8184814453125, 0.89117431640625, 0.9638671875, 1.03656005859375, 1.1092529296875, 1.18194580078125, 1.254638671875, 1.32733154296875, 1.4000244140625, 1.47271728515625, 1.54541015625, 1.61810302734375, 1.6907958984375, 1.76348876953125, 1.836181640625, 1.90887451171875, 1.9815673828125, 2.05426025390625, 2.126953125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 16.0, 22.0, 34.0, 40.0, 54.0, 86.0, 81.0, 106.0, 81.0, 88.0, 84.0, 84.0, 66.0, 42.0, 34.0, 30.0, 16.0, 12.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.310546875, -1.2797470092773438, -1.2489471435546875, -1.2181472778320312, -1.187347412109375, -1.1565475463867188, -1.1257476806640625, -1.0949478149414062, -1.06414794921875, -1.0333480834960938, -1.0025482177734375, -0.9717483520507812, -0.940948486328125, -0.9101486206054688, -0.8793487548828125, -0.8485488891601562, -0.8177490234375, -0.7869491577148438, -0.7561492919921875, -0.7253494262695312, -0.694549560546875, -0.6637496948242188, -0.6329498291015625, -0.6021499633789062, -0.57135009765625, -0.5405502319335938, -0.5097503662109375, -0.47895050048828125, -0.448150634765625, -0.41735076904296875, -0.3865509033203125, -0.35575103759765625, -0.324951171875, -0.29415130615234375, -0.2633514404296875, -0.23255157470703125, -0.201751708984375, -0.17095184326171875, -0.1401519775390625, -0.10935211181640625, -0.07855224609375, -0.04775238037109375, -0.0169525146484375, 0.01384735107421875, 0.044647216796875, 0.07544708251953125, 0.1062469482421875, 0.13704681396484375, 0.1678466796875, 0.19864654541015625, 0.2294464111328125, 0.26024627685546875, 0.291046142578125, 0.32184600830078125, 0.3526458740234375, 0.38344573974609375, 0.41424560546875, 0.44504547119140625, 0.4758453369140625, 0.5066452026367188, 0.537445068359375, 0.5682449340820312, 0.5990447998046875, 0.6298446655273438, 0.66064453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 12.0, 11.0, 16.0, 21.0, 21.0, 45.0, 53.0, 58.0, 78.0, 120.0, 183.0, 254.0, 395.0, 684.0, 1294.0, 3232.0, 10277.0, 39088.0, 164715.0, 449872.0, 280483.0, 70899.0, 17507.0, 4995.0, 1817.0, 839.0, 506.0, 319.0, 206.0, 132.0, 93.0, 73.0, 53.0, 41.0, 41.0, 30.0, 20.0, 9.0, 12.0, 14.0, 5.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.017578125, -1.9577178955078125, -1.897857666015625, -1.8379974365234375, -1.77813720703125, -1.7182769775390625, -1.658416748046875, -1.5985565185546875, -1.5386962890625, -1.4788360595703125, -1.418975830078125, -1.3591156005859375, -1.29925537109375, -1.2393951416015625, -1.179534912109375, -1.1196746826171875, -1.059814453125, -0.9999542236328125, -0.940093994140625, -0.8802337646484375, -0.82037353515625, -0.7605133056640625, -0.700653076171875, -0.6407928466796875, -0.5809326171875, -0.5210723876953125, -0.461212158203125, -0.4013519287109375, -0.34149169921875, -0.2816314697265625, -0.221771240234375, -0.1619110107421875, -0.10205078125, -0.0421905517578125, 0.017669677734375, 0.0775299072265625, 0.13739013671875, 0.1972503662109375, 0.257110595703125, 0.3169708251953125, 0.3768310546875, 0.4366912841796875, 0.496551513671875, 0.5564117431640625, 0.61627197265625, 0.6761322021484375, 0.735992431640625, 0.7958526611328125, 0.855712890625, 0.9155731201171875, 0.975433349609375, 1.0352935791015625, 1.09515380859375, 1.1550140380859375, 1.214874267578125, 1.2747344970703125, 1.3345947265625, 1.3944549560546875, 1.454315185546875, 1.5141754150390625, 1.57403564453125, 1.6338958740234375, 1.693756103515625, 1.7536163330078125, 1.8134765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 9.0, 4.0, 11.0, 10.0, 10.0, 18.0, 21.0, 21.0, 22.0, 23.0, 21.0, 31.0, 32.0, 29.0, 53.0, 37.0, 40.0, 39.0, 47.0, 46.0, 43.0, 39.0, 43.0, 43.0, 27.0, 43.0, 23.0, 38.0, 22.0, 26.0, 17.0, 16.0, 13.0, 13.0, 14.0, 10.0, 5.0, 8.0, 5.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.04296875, -1.97918701171875, -1.9154052734375, -1.85162353515625, -1.787841796875, -1.72406005859375, -1.6602783203125, -1.59649658203125, -1.53271484375, -1.46893310546875, -1.4051513671875, -1.34136962890625, -1.277587890625, -1.21380615234375, -1.1500244140625, -1.08624267578125, -1.0224609375, -0.95867919921875, -0.8948974609375, -0.83111572265625, -0.767333984375, -0.70355224609375, -0.6397705078125, -0.57598876953125, -0.51220703125, -0.44842529296875, -0.3846435546875, -0.32086181640625, -0.257080078125, -0.19329833984375, -0.1295166015625, -0.06573486328125, -0.001953125, 0.06182861328125, 0.1256103515625, 0.18939208984375, 0.253173828125, 0.31695556640625, 0.3807373046875, 0.44451904296875, 0.50830078125, 0.57208251953125, 0.6358642578125, 0.69964599609375, 0.763427734375, 0.82720947265625, 0.8909912109375, 0.95477294921875, 1.0185546875, 1.08233642578125, 1.1461181640625, 1.20989990234375, 1.273681640625, 1.33746337890625, 1.4012451171875, 1.46502685546875, 1.52880859375, 1.59259033203125, 1.6563720703125, 1.72015380859375, 1.783935546875, 1.84771728515625, 1.9114990234375, 1.97528076171875, 2.0390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 9.0, 7.0, 12.0, 15.0, 21.0, 26.0, 60.0, 110.0, 192.0, 338.0, 731.0, 2425.0, 9659.0, 53566.0, 680062.0, 266767.0, 26532.0, 5339.0, 1472.0, 559.0, 279.0, 143.0, 81.0, 42.0, 31.0, 27.0, 17.0, 9.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.18359375, -1.150543212890625, -1.11749267578125, -1.084442138671875, -1.0513916015625, -1.018341064453125, -0.98529052734375, -0.952239990234375, -0.919189453125, -0.886138916015625, -0.85308837890625, -0.820037841796875, -0.7869873046875, -0.753936767578125, -0.72088623046875, -0.687835693359375, -0.65478515625, -0.621734619140625, -0.58868408203125, -0.555633544921875, -0.5225830078125, -0.489532470703125, -0.45648193359375, -0.423431396484375, -0.390380859375, -0.357330322265625, -0.32427978515625, -0.291229248046875, -0.2581787109375, -0.225128173828125, -0.19207763671875, -0.159027099609375, -0.1259765625, -0.092926025390625, -0.05987548828125, -0.026824951171875, 0.0062255859375, 0.039276123046875, 0.07232666015625, 0.105377197265625, 0.138427734375, 0.171478271484375, 0.20452880859375, 0.237579345703125, 0.2706298828125, 0.303680419921875, 0.33673095703125, 0.369781494140625, 0.40283203125, 0.435882568359375, 0.46893310546875, 0.501983642578125, 0.5350341796875, 0.568084716796875, 0.60113525390625, 0.634185791015625, 0.667236328125, 0.700286865234375, 0.73333740234375, 0.766387939453125, 0.7994384765625, 0.832489013671875, 0.86553955078125, 0.898590087890625, 0.931640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 10.0, 4.0, 5.0, 10.0, 5.0, 11.0, 6.0, 8.0, 15.0, 14.0, 18.0, 22.0, 21.0, 21.0, 47.0, 92.0, 115.0, 144.0, 120.0, 72.0, 48.0, 34.0, 24.0, 22.0, 14.0, 15.0, 10.0, 6.0, 8.0, 6.0, 5.0, 6.0, 4.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00012421607971191406, -0.0001200065016746521, -0.00011579692363739014, -0.00011158734560012817, -0.00010737776756286621, -0.00010316818952560425, -9.895861148834229e-05, -9.474903345108032e-05, -9.053945541381836e-05, -8.63298773765564e-05, -8.212029933929443e-05, -7.791072130203247e-05, -7.370114326477051e-05, -6.949156522750854e-05, -6.528198719024658e-05, -6.107240915298462e-05, -5.6862831115722656e-05, -5.265325307846069e-05, -4.844367504119873e-05, -4.423409700393677e-05, -4.0024518966674805e-05, -3.581494092941284e-05, -3.160536289215088e-05, -2.7395784854888916e-05, -2.3186206817626953e-05, -1.897662878036499e-05, -1.4767050743103027e-05, -1.0557472705841064e-05, -6.3478946685791016e-06, -2.1383166313171387e-06, 2.0712614059448242e-06, 6.280839443206787e-06, 1.049041748046875e-05, 1.4699995517730713e-05, 1.8909573554992676e-05, 2.311915159225464e-05, 2.73287296295166e-05, 3.1538307666778564e-05, 3.574788570404053e-05, 3.995746374130249e-05, 4.416704177856445e-05, 4.8376619815826416e-05, 5.258619785308838e-05, 5.679577589035034e-05, 6.1005353927612305e-05, 6.521493196487427e-05, 6.942451000213623e-05, 7.36340880393982e-05, 7.784366607666016e-05, 8.205324411392212e-05, 8.626282215118408e-05, 9.047240018844604e-05, 9.468197822570801e-05, 9.889155626296997e-05, 0.00010310113430023193, 0.0001073107123374939, 0.00011152029037475586, 0.00011572986841201782, 0.00011993944644927979, 0.00012414902448654175, 0.0001283586025238037, 0.00013256818056106567, 0.00013677775859832764, 0.0001409873366355896, 0.00014519691467285156]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 9.0, 13.0, 15.0, 24.0, 45.0, 62.0, 93.0, 175.0, 251.0, 451.0, 1140.0, 3828.0, 21030.0, 217796.0, 742674.0, 49840.0, 7711.0, 1820.0, 703.0, 320.0, 198.0, 131.0, 80.0, 35.0, 35.0, 22.0, 9.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.162109375, -1.12603759765625, -1.0899658203125, -1.05389404296875, -1.017822265625, -0.98175048828125, -0.9456787109375, -0.90960693359375, -0.87353515625, -0.83746337890625, -0.8013916015625, -0.76531982421875, -0.729248046875, -0.69317626953125, -0.6571044921875, -0.62103271484375, -0.5849609375, -0.54888916015625, -0.5128173828125, -0.47674560546875, -0.440673828125, -0.40460205078125, -0.3685302734375, -0.33245849609375, -0.29638671875, -0.26031494140625, -0.2242431640625, -0.18817138671875, -0.152099609375, -0.11602783203125, -0.0799560546875, -0.04388427734375, -0.0078125, 0.02825927734375, 0.0643310546875, 0.10040283203125, 0.136474609375, 0.17254638671875, 0.2086181640625, 0.24468994140625, 0.28076171875, 0.31683349609375, 0.3529052734375, 0.38897705078125, 0.425048828125, 0.46112060546875, 0.4971923828125, 0.53326416015625, 0.5693359375, 0.60540771484375, 0.6414794921875, 0.67755126953125, 0.713623046875, 0.74969482421875, 0.7857666015625, 0.82183837890625, 0.85791015625, 0.89398193359375, 0.9300537109375, 0.96612548828125, 1.002197265625, 1.03826904296875, 1.0743408203125, 1.11041259765625, 1.146484375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 11.0, 17.0, 26.0, 38.0, 65.0, 103.0, 157.0, 205.0, 142.0, 98.0, 54.0, 35.0, 23.0, 5.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.07861328125, -1.0390625, -0.99951171875, -0.9599609375, -0.92041015625, -0.880859375, -0.84130859375, -0.8017578125, -0.76220703125, -0.72265625, -0.68310546875, -0.6435546875, -0.60400390625, -0.564453125, -0.52490234375, -0.4853515625, -0.44580078125, -0.40625, -0.36669921875, -0.3271484375, -0.28759765625, -0.248046875, -0.20849609375, -0.1689453125, -0.12939453125, -0.08984375, -0.05029296875, -0.0107421875, 0.02880859375, 0.068359375, 0.10791015625, 0.1474609375, 0.18701171875, 0.2265625, 0.26611328125, 0.3056640625, 0.34521484375, 0.384765625, 0.42431640625, 0.4638671875, 0.50341796875, 0.54296875, 0.58251953125, 0.6220703125, 0.66162109375, 0.701171875, 0.74072265625, 0.7802734375, 0.81982421875, 0.859375, 0.89892578125, 0.9384765625, 0.97802734375, 1.017578125, 1.05712890625, 1.0966796875, 1.13623046875, 1.17578125, 1.21533203125, 1.2548828125, 1.29443359375, 1.333984375, 1.37353515625, 1.4130859375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 13.0, 24.0, 40.0, 55.0, 113.0, 113.0, 137.0, 157.0, 114.0, 77.0, 54.0, 39.0, 23.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.566740989685059, -11.143534660339355, -10.720328330993652, -10.29712200164795, -9.873915672302246, -9.450709342956543, -9.027502059936523, -8.60429573059082, -8.181089401245117, -7.757883071899414, -7.334676742553711, -6.911470413208008, -6.488264083862305, -6.065057754516602, -5.64185094833374, -5.218644618988037, -4.795438766479492, -4.372232437133789, -3.949026107788086, -3.5258195400238037, -3.1026132106781006, -2.6794068813323975, -2.2562003135681152, -1.832993984222412, -1.409787654876709, -0.9865812659263611, -0.5633748769760132, -0.1401684284210205, 0.2830379009246826, 0.7062442302703857, 1.129450798034668, 1.552657127380371, 1.9758644104003906, 2.3990707397460938, 2.822277069091797, 3.245483636856079, 3.6686899662017822, 4.091896057128906, 4.515102863311768, 4.938309192657471, 5.361515522003174, 5.784721851348877, 6.20792818069458, 6.631134986877441, 7.0543413162231445, 7.477547645568848, 7.900753974914551, 8.323960304260254, 8.747166633605957, 9.17037296295166, 9.593579292297363, 10.016785621643066, 10.43999195098877, 10.863198280334473, 11.286405563354492, 11.709611892700195, 12.132818222045898, 12.556024551391602, 12.979230880737305, 13.402437210083008, 13.825643539428711, 14.248849868774414, 14.672056198120117, 15.09526252746582, 15.518468856811523]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 4.0, 8.0, 11.0, 10.0, 13.0, 20.0, 21.0, 20.0, 37.0, 29.0, 32.0, 35.0, 46.0, 39.0, 54.0, 51.0, 44.0, 51.0, 23.0, 38.0, 53.0, 46.0, 45.0, 38.0, 39.0, 20.0, 30.0, 31.0, 12.0, 21.0, 14.0, 18.0, 11.0, 5.0, 4.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.500724792480469, -13.100916862487793, -12.701108932495117, -12.301300048828125, -11.90149211883545, -11.501684188842773, -11.101876258850098, -10.702068328857422, -10.30225944519043, -9.902451515197754, -9.502643585205078, -9.102834701538086, -8.70302677154541, -8.303218841552734, -7.903410911560059, -7.503602981567383, -7.103795051574707, -6.703987121582031, -6.304178714752197, -5.9043707847595215, -5.5045623779296875, -5.104754447937012, -4.704946517944336, -4.30513858795166, -3.905330181121826, -3.5055220127105713, -3.1057138442993164, -2.7059059143066406, -2.3060977458953857, -1.9062895774841309, -1.506481647491455, -1.1066734790802002, -0.7068662643432617, -0.3070581555366516, 0.0927499532699585, 0.49255800247192383, 0.8923661708831787, 1.2921743392944336, 1.6919822692871094, 2.0917904376983643, 2.491598606109619, 2.891406774520874, 3.291214942932129, 3.6910228729248047, 4.0908308029174805, 4.4906392097473145, 4.89044713973999, 5.290255546569824, 5.6900634765625, 6.089871406555176, 6.48967981338501, 6.8894877433776855, 7.2892961502075195, 7.689104080200195, 8.088912010192871, 8.488719940185547, 8.888528823852539, 9.288336753845215, 9.68814468383789, 10.087953567504883, 10.487761497497559, 10.887569427490234, 11.28737735748291, 11.687185287475586, 12.086993217468262]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 12.0, 7.0, 6.0, 14.0, 20.0, 25.0, 46.0, 43.0, 82.0, 123.0, 193.0, 352.0, 625.0, 1375.0, 3125.0, 8758.0, 32365.0, 279884.0, 3713699.0, 121497.0, 20980.0, 6386.0, 2476.0, 1022.0, 490.0, 245.0, 160.0, 95.0, 65.0, 35.0, 17.0, 18.0, 11.0, 10.0, 6.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.138671875, -2.0781707763671875, -2.017669677734375, -1.9571685791015625, -1.89666748046875, -1.8361663818359375, -1.775665283203125, -1.7151641845703125, -1.6546630859375, -1.5941619873046875, -1.533660888671875, -1.4731597900390625, -1.41265869140625, -1.3521575927734375, -1.291656494140625, -1.2311553955078125, -1.170654296875, -1.1101531982421875, -1.049652099609375, -0.9891510009765625, -0.92864990234375, -0.8681488037109375, -0.807647705078125, -0.7471466064453125, -0.6866455078125, -0.6261444091796875, -0.565643310546875, -0.5051422119140625, -0.44464111328125, -0.3841400146484375, -0.323638916015625, -0.2631378173828125, -0.20263671875, -0.1421356201171875, -0.081634521484375, -0.0211334228515625, 0.03936767578125, 0.0998687744140625, 0.160369873046875, 0.2208709716796875, 0.2813720703125, 0.3418731689453125, 0.402374267578125, 0.4628753662109375, 0.52337646484375, 0.5838775634765625, 0.644378662109375, 0.7048797607421875, 0.765380859375, 0.8258819580078125, 0.886383056640625, 0.9468841552734375, 1.00738525390625, 1.0678863525390625, 1.128387451171875, 1.1888885498046875, 1.2493896484375, 1.3098907470703125, 1.370391845703125, 1.4308929443359375, 1.49139404296875, 1.5518951416015625, 1.612396240234375, 1.6728973388671875, 1.7333984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 11.0, 15.0, 36.0, 37.0, 45.0, 59.0, 72.0, 78.0, 86.0, 79.0, 95.0, 74.0, 69.0, 45.0, 60.0, 43.0, 30.0, 27.0, 10.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.314453125, -1.28277587890625, -1.2510986328125, -1.21942138671875, -1.187744140625, -1.15606689453125, -1.1243896484375, -1.09271240234375, -1.06103515625, -1.02935791015625, -0.9976806640625, -0.96600341796875, -0.934326171875, -0.90264892578125, -0.8709716796875, -0.83929443359375, -0.8076171875, -0.77593994140625, -0.7442626953125, -0.71258544921875, -0.680908203125, -0.64923095703125, -0.6175537109375, -0.58587646484375, -0.55419921875, -0.52252197265625, -0.4908447265625, -0.45916748046875, -0.427490234375, -0.39581298828125, -0.3641357421875, -0.33245849609375, -0.30078125, -0.26910400390625, -0.2374267578125, -0.20574951171875, -0.174072265625, -0.14239501953125, -0.1107177734375, -0.07904052734375, -0.04736328125, -0.01568603515625, 0.0159912109375, 0.04766845703125, 0.079345703125, 0.11102294921875, 0.1427001953125, 0.17437744140625, 0.2060546875, 0.23773193359375, 0.2694091796875, 0.30108642578125, 0.332763671875, 0.36444091796875, 0.3961181640625, 0.42779541015625, 0.45947265625, 0.49114990234375, 0.5228271484375, 0.55450439453125, 0.586181640625, 0.61785888671875, 0.6495361328125, 0.68121337890625, 0.712890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 7.0, 18.0, 25.0, 51.0, 82.0, 178.0, 380.0, 823.0, 1733.0, 4237.0, 11522.0, 40664.0, 262114.0, 3470461.0, 333491.0, 46429.0, 13449.0, 4868.0, 2008.0, 876.0, 401.0, 217.0, 90.0, 62.0, 28.0, 17.0, 8.0, 11.0, 7.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.29296875, -1.250640869140625, -1.20831298828125, -1.165985107421875, -1.1236572265625, -1.081329345703125, -1.03900146484375, -0.996673583984375, -0.954345703125, -0.912017822265625, -0.86968994140625, -0.827362060546875, -0.7850341796875, -0.742706298828125, -0.70037841796875, -0.658050537109375, -0.61572265625, -0.573394775390625, -0.53106689453125, -0.488739013671875, -0.4464111328125, -0.404083251953125, -0.36175537109375, -0.319427490234375, -0.277099609375, -0.234771728515625, -0.19244384765625, -0.150115966796875, -0.1077880859375, -0.065460205078125, -0.02313232421875, 0.019195556640625, 0.0615234375, 0.103851318359375, 0.14617919921875, 0.188507080078125, 0.2308349609375, 0.273162841796875, 0.31549072265625, 0.357818603515625, 0.400146484375, 0.442474365234375, 0.48480224609375, 0.527130126953125, 0.5694580078125, 0.611785888671875, 0.65411376953125, 0.696441650390625, 0.73876953125, 0.781097412109375, 0.82342529296875, 0.865753173828125, 0.9080810546875, 0.950408935546875, 0.99273681640625, 1.035064697265625, 1.077392578125, 1.119720458984375, 1.16204833984375, 1.204376220703125, 1.2467041015625, 1.289031982421875, 1.33135986328125, 1.373687744140625, 1.416015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 5.0, 11.0, 8.0, 16.0, 16.0, 43.0, 58.0, 132.0, 233.0, 640.0, 1704.0, 630.0, 263.0, 94.0, 59.0, 33.0, 26.0, 24.0, 16.0, 8.0, 10.0, 6.0, 13.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63037109375, -0.6097412109375, -0.589111328125, -0.5684814453125, -0.5478515625, -0.5272216796875, -0.506591796875, -0.4859619140625, -0.46533203125, -0.4447021484375, -0.424072265625, -0.4034423828125, -0.3828125, -0.3621826171875, -0.341552734375, -0.3209228515625, -0.30029296875, -0.2796630859375, -0.259033203125, -0.2384033203125, -0.2177734375, -0.1971435546875, -0.176513671875, -0.1558837890625, -0.13525390625, -0.1146240234375, -0.093994140625, -0.0733642578125, -0.052734375, -0.0321044921875, -0.011474609375, 0.0091552734375, 0.02978515625, 0.0504150390625, 0.071044921875, 0.0916748046875, 0.1123046875, 0.1329345703125, 0.153564453125, 0.1741943359375, 0.19482421875, 0.2154541015625, 0.236083984375, 0.2567138671875, 0.27734375, 0.2979736328125, 0.318603515625, 0.3392333984375, 0.35986328125, 0.3804931640625, 0.401123046875, 0.4217529296875, 0.4423828125, 0.4630126953125, 0.483642578125, 0.5042724609375, 0.52490234375, 0.5455322265625, 0.566162109375, 0.5867919921875, 0.607421875, 0.6280517578125, 0.648681640625, 0.6693115234375, 0.68994140625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 14.0, 58.0, 183.0, 307.0, 243.0, 127.0, 49.0, 16.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7384209632873535, -1.523756504058838, -1.3090921640396118, -1.0944278240203857, -0.8797633647918701, -0.6650989055633545, -0.4504345655441284, -0.23577022552490234, -0.02110576629638672, 0.19355863332748413, 0.408223032951355, 0.6228874325752258, 0.8375518321990967, 1.0522162914276123, 1.2668806314468384, 1.4815449714660645, 1.69620943069458, 1.9108738899230957, 2.1255383491516113, 2.340202569961548, 2.5548670291900635, 2.769531488418579, 2.9841957092285156, 3.1988601684570312, 3.413524627685547, 3.6281890869140625, 3.842853546142578, 4.057518005371094, 4.272182464599609, 4.486846923828125, 4.701510906219482, 4.916175365447998, 5.1308393478393555, 5.345503807067871, 5.560168266296387, 5.774832725524902, 5.989497184753418, 6.204161643981934, 6.418825626373291, 6.633490085601807, 6.848154544830322, 7.062819004058838, 7.2774834632873535, 7.492147922515869, 7.706811904907227, 7.921476364135742, 8.136140823364258, 8.350805282592773, 8.565469741821289, 8.780134201049805, 8.99479866027832, 9.209463119506836, 9.424127578735352, 9.638792037963867, 9.853456497192383, 10.068120956420898, 10.282785415649414, 10.49744987487793, 10.712114334106445, 10.926778793334961, 11.141443252563477, 11.356107711791992, 11.570772171020508, 11.785436630249023, 12.000100135803223]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 9.0, 19.0, 18.0, 20.0, 23.0, 27.0, 29.0, 29.0, 38.0, 49.0, 35.0, 59.0, 51.0, 66.0, 46.0, 52.0, 55.0, 52.0, 38.0, 42.0, 41.0, 22.0, 29.0, 21.0, 25.0, 26.0, 13.0, 12.0, 8.0, 9.0, 6.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.5775716304779053, -2.509949207305908, -2.442326545715332, -2.374704122543335, -2.307081699371338, -2.2394590377807617, -2.1718366146087646, -2.1042141914367676, -2.0365915298461914, -1.9689689874649048, -1.9013465642929077, -1.833724021911621, -1.766101598739624, -1.6984790563583374, -1.6308565139770508, -1.5632340908050537, -1.4956116676330566, -1.42798912525177, -1.360366702079773, -1.2927441596984863, -1.2251217365264893, -1.1574991941452026, -1.089876651763916, -1.022254228591919, -0.9546316862106323, -0.8870092034339905, -0.8193867206573486, -0.751764178276062, -0.6841416954994202, -0.6165192127227783, -0.5488966703414917, -0.48127418756484985, -0.413651704788208, -0.34602922201156616, -0.27840670943260193, -0.2107842117547989, -0.14316171407699585, -0.075539231300354, -0.00791671872138977, 0.05970579385757446, 0.1273282766342163, 0.19495077431201935, 0.2625732719898224, 0.3301957845687866, 0.39781826734542847, 0.4654407501220703, 0.5330632925033569, 0.6006857752799988, 0.6683082580566406, 0.7359307408332825, 0.8035532236099243, 0.8711757659912109, 0.9387982487678528, 1.0064207315444946, 1.0740432739257812, 1.1416656970977783, 1.209288239479065, 1.2769107818603516, 1.3445332050323486, 1.4121557474136353, 1.4797782897949219, 1.547400712966919, 1.6150232553482056, 1.6826457977294922, 1.7502682209014893]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 10.0, 11.0, 25.0, 35.0, 53.0, 126.0, 195.0, 323.0, 744.0, 1620.0, 4702.0, 18186.0, 90910.0, 395518.0, 411959.0, 96600.0, 19325.0, 4890.0, 1746.0, 727.0, 345.0, 219.0, 115.0, 67.0, 39.0, 20.0, 13.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.2734375, -3.193634033203125, -3.11383056640625, -3.034027099609375, -2.9542236328125, -2.874420166015625, -2.79461669921875, -2.714813232421875, -2.635009765625, -2.555206298828125, -2.47540283203125, -2.395599365234375, -2.3157958984375, -2.235992431640625, -2.15618896484375, -2.076385498046875, -1.99658203125, -1.916778564453125, -1.83697509765625, -1.757171630859375, -1.6773681640625, -1.597564697265625, -1.51776123046875, -1.437957763671875, -1.358154296875, -1.278350830078125, -1.19854736328125, -1.118743896484375, -1.0389404296875, -0.959136962890625, -0.87933349609375, -0.799530029296875, -0.7197265625, -0.639923095703125, -0.56011962890625, -0.480316162109375, -0.4005126953125, -0.320709228515625, -0.24090576171875, -0.161102294921875, -0.081298828125, -0.001495361328125, 0.07830810546875, 0.158111572265625, 0.2379150390625, 0.317718505859375, 0.39752197265625, 0.477325439453125, 0.55712890625, 0.636932373046875, 0.71673583984375, 0.796539306640625, 0.8763427734375, 0.956146240234375, 1.03594970703125, 1.115753173828125, 1.195556640625, 1.275360107421875, 1.35516357421875, 1.434967041015625, 1.5147705078125, 1.594573974609375, 1.67437744140625, 1.754180908203125, 1.833984375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 12.0, 20.0, 27.0, 41.0, 44.0, 66.0, 67.0, 89.0, 82.0, 88.0, 93.0, 77.0, 60.0, 53.0, 55.0, 37.0, 31.0, 21.0, 15.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3271484375, -1.2950515747070312, -1.2629547119140625, -1.2308578491210938, -1.198760986328125, -1.1666641235351562, -1.1345672607421875, -1.1024703979492188, -1.07037353515625, -1.0382766723632812, -1.0061798095703125, -0.9740829467773438, -0.941986083984375, -0.9098892211914062, -0.8777923583984375, -0.8456954956054688, -0.8135986328125, -0.7815017700195312, -0.7494049072265625, -0.7173080444335938, -0.685211181640625, -0.6531143188476562, -0.6210174560546875, -0.5889205932617188, -0.55682373046875, -0.5247268676757812, -0.4926300048828125, -0.46053314208984375, -0.428436279296875, -0.39633941650390625, -0.3642425537109375, -0.33214569091796875, -0.300048828125, -0.26795196533203125, -0.2358551025390625, -0.20375823974609375, -0.171661376953125, -0.13956451416015625, -0.1074676513671875, -0.07537078857421875, -0.04327392578125, -0.01117706298828125, 0.0209197998046875, 0.05301666259765625, 0.085113525390625, 0.11721038818359375, 0.1493072509765625, 0.18140411376953125, 0.2135009765625, 0.24559783935546875, 0.2776947021484375, 0.30979156494140625, 0.341888427734375, 0.37398529052734375, 0.4060821533203125, 0.43817901611328125, 0.47027587890625, 0.5023727416992188, 0.5344696044921875, 0.5665664672851562, 0.598663330078125, 0.6307601928710938, 0.6628570556640625, 0.6949539184570312, 0.72705078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 13.0, 17.0, 11.0, 25.0, 31.0, 54.0, 82.0, 73.0, 151.0, 245.0, 475.0, 1090.0, 3125.0, 10737.0, 42411.0, 173156.0, 454740.0, 267878.0, 69453.0, 16979.0, 4731.0, 1553.0, 632.0, 322.0, 190.0, 106.0, 67.0, 46.0, 40.0, 24.0, 23.0, 18.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.103515625, -2.041046142578125, -1.97857666015625, -1.916107177734375, -1.8536376953125, -1.791168212890625, -1.72869873046875, -1.666229248046875, -1.603759765625, -1.541290283203125, -1.47882080078125, -1.416351318359375, -1.3538818359375, -1.291412353515625, -1.22894287109375, -1.166473388671875, -1.10400390625, -1.041534423828125, -0.97906494140625, -0.916595458984375, -0.8541259765625, -0.791656494140625, -0.72918701171875, -0.666717529296875, -0.604248046875, -0.541778564453125, -0.47930908203125, -0.416839599609375, -0.3543701171875, -0.291900634765625, -0.22943115234375, -0.166961669921875, -0.1044921875, -0.042022705078125, 0.02044677734375, 0.082916259765625, 0.1453857421875, 0.207855224609375, 0.27032470703125, 0.332794189453125, 0.395263671875, 0.457733154296875, 0.52020263671875, 0.582672119140625, 0.6451416015625, 0.707611083984375, 0.77008056640625, 0.832550048828125, 0.89501953125, 0.957489013671875, 1.01995849609375, 1.082427978515625, 1.1448974609375, 1.207366943359375, 1.26983642578125, 1.332305908203125, 1.394775390625, 1.457244873046875, 1.51971435546875, 1.582183837890625, 1.6446533203125, 1.707122802734375, 1.76959228515625, 1.832061767578125, 1.89453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 5.0, 10.0, 10.0, 16.0, 16.0, 20.0, 22.0, 38.0, 34.0, 36.0, 48.0, 47.0, 38.0, 41.0, 44.0, 44.0, 63.0, 44.0, 47.0, 41.0, 40.0, 44.0, 36.0, 25.0, 32.0, 17.0, 21.0, 17.0, 20.0, 9.0, 10.0, 6.0, 7.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.36328125, -2.28955078125, -2.2158203125, -2.14208984375, -2.068359375, -1.99462890625, -1.9208984375, -1.84716796875, -1.7734375, -1.69970703125, -1.6259765625, -1.55224609375, -1.478515625, -1.40478515625, -1.3310546875, -1.25732421875, -1.18359375, -1.10986328125, -1.0361328125, -0.96240234375, -0.888671875, -0.81494140625, -0.7412109375, -0.66748046875, -0.59375, -0.52001953125, -0.4462890625, -0.37255859375, -0.298828125, -0.22509765625, -0.1513671875, -0.07763671875, -0.00390625, 0.06982421875, 0.1435546875, 0.21728515625, 0.291015625, 0.36474609375, 0.4384765625, 0.51220703125, 0.5859375, 0.65966796875, 0.7333984375, 0.80712890625, 0.880859375, 0.95458984375, 1.0283203125, 1.10205078125, 1.17578125, 1.24951171875, 1.3232421875, 1.39697265625, 1.470703125, 1.54443359375, 1.6181640625, 1.69189453125, 1.765625, 1.83935546875, 1.9130859375, 1.98681640625, 2.060546875, 2.13427734375, 2.2080078125, 2.28173828125, 2.35546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 12.0, 11.0, 18.0, 25.0, 41.0, 51.0, 92.0, 152.0, 292.0, 750.0, 1919.0, 6198.0, 27094.0, 171415.0, 682188.0, 128414.0, 21781.0, 5203.0, 1593.0, 608.0, 261.0, 151.0, 91.0, 57.0, 41.0, 30.0, 19.0, 14.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.8330078125, -0.8080902099609375, -0.783172607421875, -0.7582550048828125, -0.73333740234375, -0.7084197998046875, -0.683502197265625, -0.6585845947265625, -0.6336669921875, -0.6087493896484375, -0.583831787109375, -0.5589141845703125, -0.53399658203125, -0.5090789794921875, -0.484161376953125, -0.4592437744140625, -0.434326171875, -0.4094085693359375, -0.384490966796875, -0.3595733642578125, -0.33465576171875, -0.3097381591796875, -0.284820556640625, -0.2599029541015625, -0.2349853515625, -0.2100677490234375, -0.185150146484375, -0.1602325439453125, -0.13531494140625, -0.1103973388671875, -0.085479736328125, -0.0605621337890625, -0.03564453125, -0.0107269287109375, 0.014190673828125, 0.0391082763671875, 0.06402587890625, 0.0889434814453125, 0.113861083984375, 0.1387786865234375, 0.1636962890625, 0.1886138916015625, 0.213531494140625, 0.2384490966796875, 0.26336669921875, 0.2882843017578125, 0.313201904296875, 0.3381195068359375, 0.363037109375, 0.3879547119140625, 0.412872314453125, 0.4377899169921875, 0.46270751953125, 0.4876251220703125, 0.512542724609375, 0.5374603271484375, 0.5623779296875, 0.5872955322265625, 0.612213134765625, 0.6371307373046875, 0.66204833984375, 0.6869659423828125, 0.711883544921875, 0.7368011474609375, 0.76171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 4.0, 3.0, 7.0, 6.0, 12.0, 9.0, 6.0, 10.0, 14.0, 18.0, 23.0, 44.0, 49.0, 96.0, 172.0, 177.0, 107.0, 55.0, 35.0, 27.0, 25.0, 22.0, 14.0, 10.0, 6.0, 4.0, 6.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016570091247558594, -0.00016067177057266235, -0.00015564262866973877, -0.00015061348676681519, -0.0001455843448638916, -0.00014055520296096802, -0.00013552606105804443, -0.00013049691915512085, -0.00012546777725219727, -0.00012043863534927368, -0.0001154094934463501, -0.00011038035154342651, -0.00010535120964050293, -0.00010032206773757935, -9.529292583465576e-05, -9.026378393173218e-05, -8.52346420288086e-05, -8.020550012588501e-05, -7.517635822296143e-05, -7.014721632003784e-05, -6.511807441711426e-05, -6.0088932514190674e-05, -5.505979061126709e-05, -5.0030648708343506e-05, -4.500150680541992e-05, -3.997236490249634e-05, -3.4943222999572754e-05, -2.991408109664917e-05, -2.4884939193725586e-05, -1.9855797290802002e-05, -1.4826655387878418e-05, -9.797513484954834e-06, -4.76837158203125e-06, 2.60770320892334e-07, 5.289912223815918e-06, 1.0319054126739502e-05, 1.5348196029663086e-05, 2.037733793258667e-05, 2.5406479835510254e-05, 3.0435621738433838e-05, 3.546476364135742e-05, 4.0493905544281006e-05, 4.552304744720459e-05, 5.0552189350128174e-05, 5.558133125305176e-05, 6.061047315597534e-05, 6.563961505889893e-05, 7.066875696182251e-05, 7.56978988647461e-05, 8.072704076766968e-05, 8.575618267059326e-05, 9.078532457351685e-05, 9.581446647644043e-05, 0.00010084360837936401, 0.0001058727502822876, 0.00011090189218521118, 0.00011593103408813477, 0.00012096017599105835, 0.00012598931789398193, 0.00013101845979690552, 0.0001360476016998291, 0.00014107674360275269, 0.00014610588550567627, 0.00015113502740859985, 0.00015616416931152344]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 22.0, 23.0, 43.0, 102.0, 246.0, 694.0, 3241.0, 43631.0, 895813.0, 97888.0, 5402.0, 899.0, 278.0, 117.0, 74.0, 30.0, 20.0, 9.0, 13.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -0.9912567138671875, -0.945404052734375, -0.8995513916015625, -0.85369873046875, -0.8078460693359375, -0.761993408203125, -0.7161407470703125, -0.6702880859375, -0.6244354248046875, -0.578582763671875, -0.5327301025390625, -0.48687744140625, -0.4410247802734375, -0.395172119140625, -0.3493194580078125, -0.303466796875, -0.2576141357421875, -0.211761474609375, -0.1659088134765625, -0.12005615234375, -0.0742034912109375, -0.028350830078125, 0.0175018310546875, 0.0633544921875, 0.1092071533203125, 0.155059814453125, 0.2009124755859375, 0.24676513671875, 0.2926177978515625, 0.338470458984375, 0.3843231201171875, 0.43017578125, 0.4760284423828125, 0.521881103515625, 0.5677337646484375, 0.61358642578125, 0.6594390869140625, 0.705291748046875, 0.7511444091796875, 0.7969970703125, 0.8428497314453125, 0.888702392578125, 0.9345550537109375, 0.98040771484375, 1.0262603759765625, 1.072113037109375, 1.1179656982421875, 1.163818359375, 1.2096710205078125, 1.255523681640625, 1.3013763427734375, 1.34722900390625, 1.3930816650390625, 1.438934326171875, 1.4847869873046875, 1.5306396484375, 1.5764923095703125, 1.622344970703125, 1.6681976318359375, 1.71405029296875, 1.7599029541015625, 1.805755615234375, 1.8516082763671875, 1.8974609375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 7.0, 11.0, 15.0, 29.0, 48.0, 94.0, 150.0, 201.0, 193.0, 124.0, 55.0, 25.0, 18.0, 9.0, 14.0, 10.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.020599365234375, -0.97772216796875, -0.934844970703125, -0.8919677734375, -0.849090576171875, -0.80621337890625, -0.763336181640625, -0.720458984375, -0.677581787109375, -0.63470458984375, -0.591827392578125, -0.5489501953125, -0.506072998046875, -0.46319580078125, -0.420318603515625, -0.37744140625, -0.334564208984375, -0.29168701171875, -0.248809814453125, -0.2059326171875, -0.163055419921875, -0.12017822265625, -0.077301025390625, -0.034423828125, 0.008453369140625, 0.05133056640625, 0.094207763671875, 0.1370849609375, 0.179962158203125, 0.22283935546875, 0.265716552734375, 0.30859375, 0.351470947265625, 0.39434814453125, 0.437225341796875, 0.4801025390625, 0.522979736328125, 0.56585693359375, 0.608734130859375, 0.651611328125, 0.694488525390625, 0.73736572265625, 0.780242919921875, 0.8231201171875, 0.865997314453125, 0.90887451171875, 0.951751708984375, 0.99462890625, 1.037506103515625, 1.08038330078125, 1.123260498046875, 1.1661376953125, 1.209014892578125, 1.25189208984375, 1.294769287109375, 1.337646484375, 1.380523681640625, 1.42340087890625, 1.466278076171875, 1.5091552734375, 1.552032470703125, 1.59490966796875, 1.637786865234375, 1.6806640625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 11.0, 22.0, 73.0, 157.0, 251.0, 229.0, 153.0, 65.0, 24.0, 11.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65030288696289, -12.89504337310791, -12.139782905578613, -11.384523391723633, -10.629262924194336, -9.874003410339355, -9.118743896484375, -8.363483428955078, -7.608223915100098, -6.852963924407959, -6.09770393371582, -5.34244441986084, -4.587184429168701, -3.8319244384765625, -3.076664924621582, -2.3214049339294434, -1.5661449432373047, -0.8108850717544556, -0.055625200271606445, 0.6996345520019531, 1.4548945426940918, 2.2101545333862305, 2.965414047241211, 3.7206740379333496, 4.475934028625488, 5.231194019317627, 5.986454010009766, 6.741713523864746, 7.496973514556885, 8.252233505249023, 9.007493019104004, 9.762752532958984, 10.518013000488281, 11.273272514343262, 12.028532981872559, 12.783792495727539, 13.539052963256836, 14.294312477111816, 15.049571990966797, 15.804832458496094, 16.56009292602539, 17.315353393554688, 18.07061195373535, 18.82587242126465, 19.581132888793945, 20.33639144897461, 21.091651916503906, 21.846912384033203, 22.602170944213867, 23.357431411743164, 24.112689971923828, 24.867950439453125, 25.623210906982422, 26.37847137451172, 27.133729934692383, 27.88899040222168, 28.644248962402344, 29.39950942993164, 30.154767990112305, 30.9100284576416, 31.6652889251709, 32.42054748535156, 33.17580795288086, 33.931068420410156, 34.68632888793945]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 5.0, 9.0, 11.0, 10.0, 12.0, 19.0, 21.0, 20.0, 25.0, 27.0, 29.0, 24.0, 31.0, 35.0, 44.0, 46.0, 22.0, 42.0, 45.0, 39.0, 36.0, 38.0, 39.0, 36.0, 28.0, 33.0, 30.0, 36.0, 18.0, 23.0, 20.0, 14.0, 18.0, 15.0, 13.0, 10.0, 10.0, 8.0, 6.0, 7.0, 4.0, 4.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-9.470109939575195, -9.18471622467041, -8.899321556091309, -8.613927841186523, -8.328534126281738, -8.043140411376953, -7.757745742797852, -7.472352027893066, -7.186957836151123, -6.90156364440918, -6.6161699295043945, -6.330775737762451, -6.045381546020508, -5.759987831115723, -5.474593639373779, -5.189199447631836, -4.903805732727051, -4.618411540985107, -4.333017826080322, -4.047623634338379, -3.7622296810150146, -3.4768357276916504, -3.191441535949707, -2.9060475826263428, -2.6206536293029785, -2.3352596759796143, -2.04986572265625, -1.7644715309143066, -1.4790775775909424, -1.1936836242675781, -0.9082895517349243, -0.6228954792022705, -0.33750152587890625, -0.05210751295089722, 0.23328649997711182, 0.5186805129051208, 0.8040745258331299, 1.0894684791564941, 1.374862551689148, 1.6602566242218018, 1.945650577545166, 2.2310445308685303, 2.5164384841918945, 2.801832675933838, 3.087226629257202, 3.3726205825805664, 3.6580147743225098, 3.943408727645874, 4.228802680969238, 4.514196872711182, 4.799590587615967, 5.08498477935791, 5.370378494262695, 5.655772686004639, 5.941166877746582, 6.226560592651367, 6.5119547843933105, 6.797348976135254, 7.082742691040039, 7.368136882781982, 7.653531074523926, 7.938924789428711, 8.224318504333496, 8.509713172912598, 8.795106887817383]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 5.0, 6.0, 11.0, 31.0, 33.0, 51.0, 87.0, 136.0, 203.0, 395.0, 812.0, 1926.0, 5845.0, 26053.0, 384231.0, 3697914.0, 61074.0, 10436.0, 2921.0, 1043.0, 488.0, 230.0, 133.0, 62.0, 60.0, 25.0, 22.0, 17.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.0703125, -3.96649169921875, -3.8626708984375, -3.75885009765625, -3.655029296875, -3.55120849609375, -3.4473876953125, -3.34356689453125, -3.23974609375, -3.13592529296875, -3.0321044921875, -2.92828369140625, -2.824462890625, -2.72064208984375, -2.6168212890625, -2.51300048828125, -2.4091796875, -2.30535888671875, -2.2015380859375, -2.09771728515625, -1.993896484375, -1.89007568359375, -1.7862548828125, -1.68243408203125, -1.57861328125, -1.47479248046875, -1.3709716796875, -1.26715087890625, -1.163330078125, -1.05950927734375, -0.9556884765625, -0.85186767578125, -0.748046875, -0.64422607421875, -0.5404052734375, -0.43658447265625, -0.332763671875, -0.22894287109375, -0.1251220703125, -0.02130126953125, 0.08251953125, 0.18634033203125, 0.2901611328125, 0.39398193359375, 0.497802734375, 0.60162353515625, 0.7054443359375, 0.80926513671875, 0.9130859375, 1.01690673828125, 1.1207275390625, 1.22454833984375, 1.328369140625, 1.43218994140625, 1.5360107421875, 1.63983154296875, 1.74365234375, 1.84747314453125, 1.9512939453125, 2.05511474609375, 2.158935546875, 2.26275634765625, 2.3665771484375, 2.47039794921875, 2.57421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 8.0, 14.0, 22.0, 23.0, 35.0, 42.0, 60.0, 57.0, 76.0, 88.0, 82.0, 69.0, 72.0, 69.0, 71.0, 51.0, 43.0, 34.0, 28.0, 17.0, 16.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3125, -1.28033447265625, -1.2481689453125, -1.21600341796875, -1.183837890625, -1.15167236328125, -1.1195068359375, -1.08734130859375, -1.05517578125, -1.02301025390625, -0.9908447265625, -0.95867919921875, -0.926513671875, -0.89434814453125, -0.8621826171875, -0.83001708984375, -0.7978515625, -0.76568603515625, -0.7335205078125, -0.70135498046875, -0.669189453125, -0.63702392578125, -0.6048583984375, -0.57269287109375, -0.54052734375, -0.50836181640625, -0.4761962890625, -0.44403076171875, -0.411865234375, -0.37969970703125, -0.3475341796875, -0.31536865234375, -0.283203125, -0.25103759765625, -0.2188720703125, -0.18670654296875, -0.154541015625, -0.12237548828125, -0.0902099609375, -0.05804443359375, -0.02587890625, 0.00628662109375, 0.0384521484375, 0.07061767578125, 0.102783203125, 0.13494873046875, 0.1671142578125, 0.19927978515625, 0.2314453125, 0.26361083984375, 0.2957763671875, 0.32794189453125, 0.360107421875, 0.39227294921875, 0.4244384765625, 0.45660400390625, 0.48876953125, 0.52093505859375, 0.5531005859375, 0.58526611328125, 0.617431640625, 0.64959716796875, 0.6817626953125, 0.71392822265625, 0.74609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 18.0, 16.0, 25.0, 48.0, 62.0, 106.0, 177.0, 303.0, 580.0, 1184.0, 2394.0, 5960.0, 18069.0, 83917.0, 2138012.0, 1830247.0, 83217.0, 18580.0, 6195.0, 2570.0, 1208.0, 575.0, 311.0, 175.0, 131.0, 63.0, 40.0, 35.0, 23.0, 10.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.4609375, -2.3978271484375, -2.334716796875, -2.2716064453125, -2.20849609375, -2.1453857421875, -2.082275390625, -2.0191650390625, -1.9560546875, -1.8929443359375, -1.829833984375, -1.7667236328125, -1.70361328125, -1.6405029296875, -1.577392578125, -1.5142822265625, -1.451171875, -1.3880615234375, -1.324951171875, -1.2618408203125, -1.19873046875, -1.1356201171875, -1.072509765625, -1.0093994140625, -0.9462890625, -0.8831787109375, -0.820068359375, -0.7569580078125, -0.69384765625, -0.6307373046875, -0.567626953125, -0.5045166015625, -0.44140625, -0.3782958984375, -0.315185546875, -0.2520751953125, -0.18896484375, -0.1258544921875, -0.062744140625, 0.0003662109375, 0.0634765625, 0.1265869140625, 0.189697265625, 0.2528076171875, 0.31591796875, 0.3790283203125, 0.442138671875, 0.5052490234375, 0.568359375, 0.6314697265625, 0.694580078125, 0.7576904296875, 0.82080078125, 0.8839111328125, 0.947021484375, 1.0101318359375, 1.0732421875, 1.1363525390625, 1.199462890625, 1.2625732421875, 1.32568359375, 1.3887939453125, 1.451904296875, 1.5150146484375, 1.578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 6.0, 13.0, 17.0, 38.0, 61.0, 164.0, 547.0, 2459.0, 439.0, 146.0, 63.0, 41.0, 24.0, 17.0, 12.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3424072265625, -1.301025390625, -1.2596435546875, -1.21826171875, -1.1768798828125, -1.135498046875, -1.0941162109375, -1.052734375, -1.0113525390625, -0.969970703125, -0.9285888671875, -0.88720703125, -0.8458251953125, -0.804443359375, -0.7630615234375, -0.7216796875, -0.6802978515625, -0.638916015625, -0.5975341796875, -0.55615234375, -0.5147705078125, -0.473388671875, -0.4320068359375, -0.390625, -0.3492431640625, -0.307861328125, -0.2664794921875, -0.22509765625, -0.1837158203125, -0.142333984375, -0.1009521484375, -0.0595703125, -0.0181884765625, 0.023193359375, 0.0645751953125, 0.10595703125, 0.1473388671875, 0.188720703125, 0.2301025390625, 0.271484375, 0.3128662109375, 0.354248046875, 0.3956298828125, 0.43701171875, 0.4783935546875, 0.519775390625, 0.5611572265625, 0.6025390625, 0.6439208984375, 0.685302734375, 0.7266845703125, 0.76806640625, 0.8094482421875, 0.850830078125, 0.8922119140625, 0.93359375, 0.9749755859375, 1.016357421875, 1.0577392578125, 1.09912109375, 1.1405029296875, 1.181884765625, 1.2232666015625, 1.2646484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 31.0, 43.0, 103.0, 169.0, 211.0, 203.0, 126.0, 62.0, 20.0, 6.0, 10.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34738826751709, -3.153942346572876, -2.960496425628662, -2.7670507431030273, -2.5736048221588135, -2.3801589012145996, -2.1867129802703857, -1.9932671785354614, -1.7998212575912476, -1.6063753366470337, -1.4129295349121094, -1.2194836139678955, -1.0260376930236816, -0.8325918912887573, -0.6391459703445435, -0.44570016860961914, -0.2522542476654053, -0.05880837142467499, 0.1346375048160553, 0.3280833959579468, 0.5215292572975159, 0.714975118637085, 0.9084210395812988, 1.1018668413162231, 1.295312762260437, 1.4887586832046509, 1.6822044849395752, 1.875650405883789, 2.069096326828003, 2.262542247772217, 2.4559879302978516, 2.6494338512420654, 2.8428797721862793, 3.036325693130493, 3.229771614074707, 3.423217296600342, 3.6166632175445557, 3.8101091384887695, 4.0035552978515625, 4.197000980377197, 4.390446662902832, 4.583892345428467, 4.77733850479126, 4.9707841873168945, 5.1642303466796875, 5.357676029205322, 5.551121711730957, 5.74456787109375, 5.938014030456543, 6.131459712982178, 6.324905872344971, 6.5183515548706055, 6.711797714233398, 6.905243396759033, 7.098689079284668, 7.292135238647461, 7.485580921173096, 7.6790266036987305, 7.872472763061523, 8.065918922424316, 8.259364128112793, 8.452810287475586, 8.646256446838379, 8.839701652526855, 9.033147811889648]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 13.0, 10.0, 16.0, 23.0, 39.0, 36.0, 60.0, 58.0, 65.0, 82.0, 80.0, 78.0, 61.0, 87.0, 66.0, 51.0, 47.0, 41.0, 13.0, 27.0, 13.0, 7.0, 7.0, 8.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.24365234375, -5.119315147399902, -4.9949774742126465, -4.870640277862549, -4.746302604675293, -4.621965408325195, -4.4976277351379395, -4.373290538787842, -4.248952865600586, -4.124615669250488, -4.000277996063232, -3.8759405612945557, -3.751603126525879, -3.6272659301757812, -3.5029282569885254, -3.3785910606384277, -3.25425386428833, -3.1299164295196533, -3.0055789947509766, -2.8812415599823, -2.756904125213623, -2.6325669288635254, -2.5082292556762695, -2.383892059326172, -2.259554386138916, -2.1352169513702393, -2.0108795166015625, -1.8865420818328857, -1.7622047662734985, -1.6378673315048218, -1.513529896736145, -1.3891925811767578, -1.264855146408081, -1.1405177116394043, -1.0161802768707275, -0.8918429017066956, -0.7675055265426636, -0.6431680917739868, -0.5188306570053101, -0.3944932818412781, -0.2701558470726013, -0.14581844210624695, -0.021481022238731384, 0.10285639762878418, 0.22719380259513855, 0.3515312075614929, 0.4758686423301697, 0.6002060174942017, 0.7245434522628784, 0.8488808870315552, 0.9732182621955872, 1.0975556373596191, 1.221893072128296, 1.3462305068969727, 1.4705679416656494, 1.5949053764343262, 1.719242811203003, 1.8435802459716797, 1.9679176807403564, 2.092255115509033, 2.21659255027771, 2.3409299850463867, 2.4652671813964844, 2.589604616165161, 2.713942050933838]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 9.0, 23.0, 34.0, 63.0, 79.0, 126.0, 187.0, 312.0, 603.0, 1214.0, 2463.0, 5771.0, 16040.0, 50753.0, 166556.0, 390072.0, 278105.0, 91419.0, 27890.0, 9456.0, 3705.0, 1714.0, 800.0, 441.0, 252.0, 159.0, 108.0, 68.0, 26.0, 27.0, 16.0, 17.0, 12.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.7982940673828125, -1.722564697265625, -1.6468353271484375, -1.57110595703125, -1.4953765869140625, -1.419647216796875, -1.3439178466796875, -1.2681884765625, -1.1924591064453125, -1.116729736328125, -1.0410003662109375, -0.96527099609375, -0.8895416259765625, -0.813812255859375, -0.7380828857421875, -0.662353515625, -0.5866241455078125, -0.510894775390625, -0.4351654052734375, -0.35943603515625, -0.2837066650390625, -0.207977294921875, -0.1322479248046875, -0.0565185546875, 0.0192108154296875, 0.094940185546875, 0.1706695556640625, 0.24639892578125, 0.3221282958984375, 0.397857666015625, 0.4735870361328125, 0.54931640625, 0.6250457763671875, 0.700775146484375, 0.7765045166015625, 0.85223388671875, 0.9279632568359375, 1.003692626953125, 1.0794219970703125, 1.1551513671875, 1.2308807373046875, 1.306610107421875, 1.3823394775390625, 1.45806884765625, 1.5337982177734375, 1.609527587890625, 1.6852569580078125, 1.760986328125, 1.8367156982421875, 1.912445068359375, 1.9881744384765625, 2.06390380859375, 2.1396331787109375, 2.215362548828125, 2.2910919189453125, 2.3668212890625, 2.4425506591796875, 2.518280029296875, 2.5940093994140625, 2.66973876953125, 2.7454681396484375, 2.821197509765625, 2.8969268798828125, 2.97265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 11.0, 21.0, 23.0, 27.0, 35.0, 52.0, 63.0, 63.0, 91.0, 84.0, 77.0, 68.0, 79.0, 67.0, 55.0, 47.0, 39.0, 28.0, 17.0, 22.0, 3.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3193359375, -1.28729248046875, -1.2552490234375, -1.22320556640625, -1.191162109375, -1.15911865234375, -1.1270751953125, -1.09503173828125, -1.06298828125, -1.03094482421875, -0.9989013671875, -0.96685791015625, -0.934814453125, -0.90277099609375, -0.8707275390625, -0.83868408203125, -0.806640625, -0.77459716796875, -0.7425537109375, -0.71051025390625, -0.678466796875, -0.64642333984375, -0.6143798828125, -0.58233642578125, -0.55029296875, -0.51824951171875, -0.4862060546875, -0.45416259765625, -0.422119140625, -0.39007568359375, -0.3580322265625, -0.32598876953125, -0.2939453125, -0.26190185546875, -0.2298583984375, -0.19781494140625, -0.165771484375, -0.13372802734375, -0.1016845703125, -0.06964111328125, -0.03759765625, -0.00555419921875, 0.0264892578125, 0.05853271484375, 0.090576171875, 0.12261962890625, 0.1546630859375, 0.18670654296875, 0.21875, 0.25079345703125, 0.2828369140625, 0.31488037109375, 0.346923828125, 0.37896728515625, 0.4110107421875, 0.44305419921875, 0.47509765625, 0.50714111328125, 0.5391845703125, 0.57122802734375, 0.603271484375, 0.63531494140625, 0.6673583984375, 0.69940185546875, 0.7314453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 7.0, 14.0, 15.0, 25.0, 25.0, 34.0, 50.0, 69.0, 115.0, 172.0, 246.0, 396.0, 746.0, 1461.0, 3367.0, 8543.0, 26272.0, 92905.0, 301090.0, 399787.0, 149236.0, 41866.0, 12984.0, 4688.0, 2018.0, 988.0, 512.0, 287.0, 203.0, 121.0, 92.0, 54.0, 38.0, 29.0, 22.0, 19.0, 19.0, 7.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.380859375, -2.31121826171875, -2.2415771484375, -2.17193603515625, -2.102294921875, -2.03265380859375, -1.9630126953125, -1.89337158203125, -1.82373046875, -1.75408935546875, -1.6844482421875, -1.61480712890625, -1.545166015625, -1.47552490234375, -1.4058837890625, -1.33624267578125, -1.2666015625, -1.19696044921875, -1.1273193359375, -1.05767822265625, -0.988037109375, -0.91839599609375, -0.8487548828125, -0.77911376953125, -0.70947265625, -0.63983154296875, -0.5701904296875, -0.50054931640625, -0.430908203125, -0.36126708984375, -0.2916259765625, -0.22198486328125, -0.15234375, -0.08270263671875, -0.0130615234375, 0.05657958984375, 0.126220703125, 0.19586181640625, 0.2655029296875, 0.33514404296875, 0.40478515625, 0.47442626953125, 0.5440673828125, 0.61370849609375, 0.683349609375, 0.75299072265625, 0.8226318359375, 0.89227294921875, 0.9619140625, 1.03155517578125, 1.1011962890625, 1.17083740234375, 1.240478515625, 1.31011962890625, 1.3797607421875, 1.44940185546875, 1.51904296875, 1.58868408203125, 1.6583251953125, 1.72796630859375, 1.797607421875, 1.86724853515625, 1.9368896484375, 2.00653076171875, 2.076171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 5.0, 8.0, 10.0, 8.0, 9.0, 14.0, 21.0, 14.0, 17.0, 24.0, 24.0, 41.0, 38.0, 48.0, 43.0, 58.0, 44.0, 57.0, 50.0, 63.0, 43.0, 38.0, 45.0, 50.0, 33.0, 39.0, 36.0, 28.0, 18.0, 16.0, 8.0, 11.0, 10.0, 4.0, 4.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.623046875, -3.515869140625, -3.40869140625, -3.301513671875, -3.1943359375, -3.087158203125, -2.97998046875, -2.872802734375, -2.765625, -2.658447265625, -2.55126953125, -2.444091796875, -2.3369140625, -2.229736328125, -2.12255859375, -2.015380859375, -1.908203125, -1.801025390625, -1.69384765625, -1.586669921875, -1.4794921875, -1.372314453125, -1.26513671875, -1.157958984375, -1.05078125, -0.943603515625, -0.83642578125, -0.729248046875, -0.6220703125, -0.514892578125, -0.40771484375, -0.300537109375, -0.193359375, -0.086181640625, 0.02099609375, 0.128173828125, 0.2353515625, 0.342529296875, 0.44970703125, 0.556884765625, 0.6640625, 0.771240234375, 0.87841796875, 0.985595703125, 1.0927734375, 1.199951171875, 1.30712890625, 1.414306640625, 1.521484375, 1.628662109375, 1.73583984375, 1.843017578125, 1.9501953125, 2.057373046875, 2.16455078125, 2.271728515625, 2.37890625, 2.486083984375, 2.59326171875, 2.700439453125, 2.8076171875, 2.914794921875, 3.02197265625, 3.129150390625, 3.236328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 12.0, 29.0, 24.0, 41.0, 67.0, 138.0, 224.0, 504.0, 1212.0, 4601.0, 41180.0, 932033.0, 60395.0, 5543.0, 1374.0, 540.0, 275.0, 137.0, 80.0, 54.0, 36.0, 18.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.578125, -4.470550537109375, -4.36297607421875, -4.255401611328125, -4.1478271484375, -4.040252685546875, -3.93267822265625, -3.825103759765625, -3.717529296875, -3.609954833984375, -3.50238037109375, -3.394805908203125, -3.2872314453125, -3.179656982421875, -3.07208251953125, -2.964508056640625, -2.85693359375, -2.749359130859375, -2.64178466796875, -2.534210205078125, -2.4266357421875, -2.319061279296875, -2.21148681640625, -2.103912353515625, -1.996337890625, -1.888763427734375, -1.78118896484375, -1.673614501953125, -1.5660400390625, -1.458465576171875, -1.35089111328125, -1.243316650390625, -1.1357421875, -1.028167724609375, -0.92059326171875, -0.813018798828125, -0.7054443359375, -0.597869873046875, -0.49029541015625, -0.382720947265625, -0.275146484375, -0.167572021484375, -0.05999755859375, 0.047576904296875, 0.1551513671875, 0.262725830078125, 0.37030029296875, 0.477874755859375, 0.58544921875, 0.693023681640625, 0.80059814453125, 0.908172607421875, 1.0157470703125, 1.123321533203125, 1.23089599609375, 1.338470458984375, 1.446044921875, 1.553619384765625, 1.66119384765625, 1.768768310546875, 1.8763427734375, 1.983917236328125, 2.09149169921875, 2.199066162109375, 2.306640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 16.0, 13.0, 26.0, 41.0, 56.0, 60.0, 90.0, 196.0, 164.0, 99.0, 59.0, 46.0, 33.0, 26.0, 17.0, 14.0, 8.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001800060272216797, -0.00017097964882850647, -0.00016195327043533325, -0.00015292689204216003, -0.00014390051364898682, -0.0001348741352558136, -0.00012584775686264038, -0.00011682137846946716, -0.00010779500007629395, -9.876862168312073e-05, -8.974224328994751e-05, -8.071586489677429e-05, -7.168948650360107e-05, -6.266310811042786e-05, -5.363672971725464e-05, -4.461035132408142e-05, -3.55839729309082e-05, -2.6557594537734985e-05, -1.7531216144561768e-05, -8.50483775138855e-06, 5.21540641784668e-07, 9.547919034957886e-06, 1.8574297428131104e-05, 2.760067582130432e-05, 3.662705421447754e-05, 4.565343260765076e-05, 5.4679811000823975e-05, 6.370618939399719e-05, 7.273256778717041e-05, 8.175894618034363e-05, 9.078532457351685e-05, 9.981170296669006e-05, 0.00010883808135986328, 0.0001178644597530365, 0.00012689083814620972, 0.00013591721653938293, 0.00014494359493255615, 0.00015396997332572937, 0.0001629963517189026, 0.0001720227301120758, 0.00018104910850524902, 0.00019007548689842224, 0.00019910186529159546, 0.00020812824368476868, 0.0002171546220779419, 0.0002261810004711151, 0.00023520737886428833, 0.00024423375725746155, 0.00025326013565063477, 0.000262286514043808, 0.0002713128924369812, 0.0002803392708301544, 0.00028936564922332764, 0.00029839202761650085, 0.00030741840600967407, 0.0003164447844028473, 0.0003254711627960205, 0.0003344975411891937, 0.00034352391958236694, 0.00035255029797554016, 0.0003615766763687134, 0.0003706030547618866, 0.0003796294331550598, 0.00038865581154823303, 0.00039768218994140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 20.0, 24.0, 35.0, 60.0, 94.0, 187.0, 450.0, 1048.0, 4133.0, 37615.0, 826881.0, 164707.0, 10180.0, 1836.0, 651.0, 268.0, 145.0, 87.0, 42.0, 29.0, 12.0, 14.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.337890625, -2.25653076171875, -2.1751708984375, -2.09381103515625, -2.012451171875, -1.93109130859375, -1.8497314453125, -1.76837158203125, -1.68701171875, -1.60565185546875, -1.5242919921875, -1.44293212890625, -1.361572265625, -1.28021240234375, -1.1988525390625, -1.11749267578125, -1.0361328125, -0.95477294921875, -0.8734130859375, -0.79205322265625, -0.710693359375, -0.62933349609375, -0.5479736328125, -0.46661376953125, -0.38525390625, -0.30389404296875, -0.2225341796875, -0.14117431640625, -0.059814453125, 0.02154541015625, 0.1029052734375, 0.18426513671875, 0.265625, 0.34698486328125, 0.4283447265625, 0.50970458984375, 0.591064453125, 0.67242431640625, 0.7537841796875, 0.83514404296875, 0.91650390625, 0.99786376953125, 1.0792236328125, 1.16058349609375, 1.241943359375, 1.32330322265625, 1.4046630859375, 1.48602294921875, 1.5673828125, 1.64874267578125, 1.7301025390625, 1.81146240234375, 1.892822265625, 1.97418212890625, 2.0555419921875, 2.13690185546875, 2.21826171875, 2.29962158203125, 2.3809814453125, 2.46234130859375, 2.543701171875, 2.62506103515625, 2.7064208984375, 2.78778076171875, 2.869140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 12.0, 13.0, 27.0, 34.0, 63.0, 121.0, 236.0, 195.0, 128.0, 52.0, 37.0, 28.0, 13.0, 13.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6640625, -1.580902099609375, -1.49774169921875, -1.414581298828125, -1.3314208984375, -1.248260498046875, -1.16510009765625, -1.081939697265625, -0.998779296875, -0.915618896484375, -0.83245849609375, -0.749298095703125, -0.6661376953125, -0.582977294921875, -0.49981689453125, -0.416656494140625, -0.33349609375, -0.250335693359375, -0.16717529296875, -0.084014892578125, -0.0008544921875, 0.082305908203125, 0.16546630859375, 0.248626708984375, 0.331787109375, 0.414947509765625, 0.49810791015625, 0.581268310546875, 0.6644287109375, 0.747589111328125, 0.83074951171875, 0.913909912109375, 0.9970703125, 1.080230712890625, 1.16339111328125, 1.246551513671875, 1.3297119140625, 1.412872314453125, 1.49603271484375, 1.579193115234375, 1.662353515625, 1.745513916015625, 1.82867431640625, 1.911834716796875, 1.9949951171875, 2.078155517578125, 2.16131591796875, 2.244476318359375, 2.32763671875, 2.410797119140625, 2.49395751953125, 2.577117919921875, 2.6602783203125, 2.743438720703125, 2.82659912109375, 2.909759521484375, 2.992919921875, 3.076080322265625, 3.15924072265625, 3.242401123046875, 3.3255615234375, 3.408721923828125, 3.49188232421875, 3.575042724609375, 3.658203125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 23.0, 46.0, 110.0, 203.0, 257.0, 202.0, 89.0, 45.0, 23.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.88633728027344, -32.5527458190918, -31.21915626525879, -29.88556671142578, -28.55197525024414, -27.2183837890625, -25.884794235229492, -24.551204681396484, -23.217613220214844, -21.884021759033203, -20.550432205200195, -19.216842651367188, -17.883251190185547, -16.549659729003906, -15.216070175170898, -13.882479667663574, -12.54888916015625, -11.215298652648926, -9.881708145141602, -8.548117637634277, -7.214527130126953, -5.880936622619629, -4.547346115112305, -3.2137556076049805, -1.8801651000976562, -0.546574592590332, 0.7870159149169922, 2.1206064224243164, 3.4541969299316406, 4.787787437438965, 6.121377944946289, 7.454968452453613, 8.788562774658203, 10.122153282165527, 11.455743789672852, 12.789334297180176, 14.1229248046875, 15.456515312194824, 16.79010581970215, 18.123695373535156, 19.457286834716797, 20.790878295898438, 22.124467849731445, 23.458057403564453, 24.791648864746094, 26.125240325927734, 27.458829879760742, 28.79241943359375, 30.12601089477539, 31.45960235595703, 32.793190002441406, 34.12678146362305, 35.46037292480469, 36.79396438598633, 38.12755584716797, 39.461143493652344, 40.794734954833984, 42.128326416015625, 43.4619140625, 44.79550552368164, 46.12909698486328, 47.46268844604492, 48.79627990722656, 50.12986755371094, 51.46345901489258]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 12.0, 10.0, 16.0, 22.0, 22.0, 22.0, 35.0, 26.0, 30.0, 28.0, 45.0, 39.0, 51.0, 53.0, 38.0, 43.0, 41.0, 45.0, 49.0, 39.0, 40.0, 53.0, 29.0, 28.0, 23.0, 20.0, 17.0, 18.0, 17.0, 14.0, 5.0, 15.0, 11.0, 4.0, 8.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.802505493164062, -18.204437255859375, -17.606367111206055, -17.008298873901367, -16.410228729248047, -15.81216049194336, -15.214092254638672, -14.616023063659668, -14.017953872680664, -13.41988468170166, -12.821815490722656, -12.223747253417969, -11.625678062438965, -11.027608871459961, -10.429540634155273, -9.83147144317627, -9.233402252197266, -8.635333061218262, -8.037263870239258, -7.43919563293457, -6.841126441955566, -6.2430572509765625, -5.644988536834717, -5.046919822692871, -4.448850631713867, -3.8507816791534424, -3.2527127265930176, -2.6546437740325928, -2.056574821472168, -1.4585058689117432, -0.8604369163513184, -0.26236820220947266, 0.33570098876953125, 0.933769941329956, 1.5318388938903809, 2.1299078464508057, 2.7279767990112305, 3.3260457515716553, 3.92411470413208, 4.522183418273926, 5.12025260925293, 5.718321800231934, 6.316390514373779, 6.914459228515625, 7.512528419494629, 8.110597610473633, 8.70866584777832, 9.306735038757324, 9.904804229736328, 10.502873420715332, 11.100942611694336, 11.699010848999023, 12.297080039978027, 12.895149230957031, 13.493217468261719, 14.091286659240723, 14.689355850219727, 15.28742504119873, 15.885494232177734, 16.483562469482422, 17.08163070678711, 17.67970085144043, 18.277769088745117, 18.875839233398438, 19.473907470703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 12.0, 12.0, 14.0, 18.0, 26.0, 31.0, 52.0, 77.0, 103.0, 220.0, 326.0, 582.0, 1071.0, 2298.0, 5978.0, 20092.0, 146455.0, 3767739.0, 212395.0, 24559.0, 6902.0, 2633.0, 1206.0, 649.0, 342.0, 182.0, 122.0, 64.0, 38.0, 26.0, 19.0, 8.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.8046875, -3.706024169921875, -3.60736083984375, -3.508697509765625, -3.4100341796875, -3.311370849609375, -3.21270751953125, -3.114044189453125, -3.015380859375, -2.916717529296875, -2.81805419921875, -2.719390869140625, -2.6207275390625, -2.522064208984375, -2.42340087890625, -2.324737548828125, -2.22607421875, -2.127410888671875, -2.02874755859375, -1.930084228515625, -1.8314208984375, -1.732757568359375, -1.63409423828125, -1.535430908203125, -1.436767578125, -1.338104248046875, -1.23944091796875, -1.140777587890625, -1.0421142578125, -0.943450927734375, -0.84478759765625, -0.746124267578125, -0.6474609375, -0.548797607421875, -0.45013427734375, -0.351470947265625, -0.2528076171875, -0.154144287109375, -0.05548095703125, 0.043182373046875, 0.141845703125, 0.240509033203125, 0.33917236328125, 0.437835693359375, 0.5364990234375, 0.635162353515625, 0.73382568359375, 0.832489013671875, 0.93115234375, 1.029815673828125, 1.12847900390625, 1.227142333984375, 1.3258056640625, 1.424468994140625, 1.52313232421875, 1.621795654296875, 1.720458984375, 1.819122314453125, 1.91778564453125, 2.016448974609375, 2.1151123046875, 2.213775634765625, 2.31243896484375, 2.411102294921875, 2.509765625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 5.0, 4.0, 13.0, 6.0, 15.0, 16.0, 24.0, 30.0, 42.0, 43.0, 50.0, 77.0, 59.0, 67.0, 63.0, 69.0, 58.0, 59.0, 52.0, 44.0, 40.0, 36.0, 31.0, 25.0, 26.0, 22.0, 12.0, 10.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.30078125, -1.2681427001953125, -1.235504150390625, -1.2028656005859375, -1.17022705078125, -1.1375885009765625, -1.104949951171875, -1.0723114013671875, -1.0396728515625, -1.0070343017578125, -0.974395751953125, -0.9417572021484375, -0.90911865234375, -0.8764801025390625, -0.843841552734375, -0.8112030029296875, -0.778564453125, -0.7459259033203125, -0.713287353515625, -0.6806488037109375, -0.64801025390625, -0.6153717041015625, -0.582733154296875, -0.5500946044921875, -0.5174560546875, -0.4848175048828125, -0.452178955078125, -0.4195404052734375, -0.38690185546875, -0.3542633056640625, -0.321624755859375, -0.2889862060546875, -0.25634765625, -0.2237091064453125, -0.191070556640625, -0.1584320068359375, -0.12579345703125, -0.0931549072265625, -0.060516357421875, -0.0278778076171875, 0.0047607421875, 0.0373992919921875, 0.070037841796875, 0.1026763916015625, 0.13531494140625, 0.1679534912109375, 0.200592041015625, 0.2332305908203125, 0.265869140625, 0.2985076904296875, 0.331146240234375, 0.3637847900390625, 0.39642333984375, 0.4290618896484375, 0.461700439453125, 0.4943389892578125, 0.5269775390625, 0.5596160888671875, 0.592254638671875, 0.6248931884765625, 0.65753173828125, 0.6901702880859375, 0.722808837890625, 0.7554473876953125, 0.7880859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 8.0, 4.0, 10.0, 12.0, 22.0, 29.0, 42.0, 54.0, 125.0, 154.0, 249.0, 328.0, 649.0, 1079.0, 1776.0, 3471.0, 7526.0, 19120.0, 67317.0, 536243.0, 3269376.0, 219740.0, 41242.0, 13341.0, 5761.0, 2751.0, 1526.0, 897.0, 529.0, 320.0, 200.0, 127.0, 80.0, 58.0, 47.0, 27.0, 20.0, 12.0, 9.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.837890625, -1.77728271484375, -1.7166748046875, -1.65606689453125, -1.595458984375, -1.53485107421875, -1.4742431640625, -1.41363525390625, -1.35302734375, -1.29241943359375, -1.2318115234375, -1.17120361328125, -1.110595703125, -1.04998779296875, -0.9893798828125, -0.92877197265625, -0.8681640625, -0.80755615234375, -0.7469482421875, -0.68634033203125, -0.625732421875, -0.56512451171875, -0.5045166015625, -0.44390869140625, -0.38330078125, -0.32269287109375, -0.2620849609375, -0.20147705078125, -0.140869140625, -0.08026123046875, -0.0196533203125, 0.04095458984375, 0.1015625, 0.16217041015625, 0.2227783203125, 0.28338623046875, 0.343994140625, 0.40460205078125, 0.4652099609375, 0.52581787109375, 0.58642578125, 0.64703369140625, 0.7076416015625, 0.76824951171875, 0.828857421875, 0.88946533203125, 0.9500732421875, 1.01068115234375, 1.0712890625, 1.13189697265625, 1.1925048828125, 1.25311279296875, 1.313720703125, 1.37432861328125, 1.4349365234375, 1.49554443359375, 1.55615234375, 1.61676025390625, 1.6773681640625, 1.73797607421875, 1.798583984375, 1.85919189453125, 1.9197998046875, 1.98040771484375, 2.041015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 3.0, 8.0, 14.0, 15.0, 22.0, 37.0, 59.0, 120.0, 288.0, 816.0, 1787.0, 458.0, 179.0, 102.0, 35.0, 31.0, 28.0, 17.0, 3.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.966796875, -0.9232940673828125, -0.879791259765625, -0.8362884521484375, -0.79278564453125, -0.7492828369140625, -0.705780029296875, -0.6622772216796875, -0.6187744140625, -0.5752716064453125, -0.531768798828125, -0.4882659912109375, -0.44476318359375, -0.4012603759765625, -0.357757568359375, -0.3142547607421875, -0.270751953125, -0.2272491455078125, -0.183746337890625, -0.1402435302734375, -0.09674072265625, -0.0532379150390625, -0.009735107421875, 0.0337677001953125, 0.0772705078125, 0.1207733154296875, 0.164276123046875, 0.2077789306640625, 0.25128173828125, 0.2947845458984375, 0.338287353515625, 0.3817901611328125, 0.42529296875, 0.4687957763671875, 0.512298583984375, 0.5558013916015625, 0.59930419921875, 0.6428070068359375, 0.686309814453125, 0.7298126220703125, 0.7733154296875, 0.8168182373046875, 0.860321044921875, 0.9038238525390625, 0.94732666015625, 0.9908294677734375, 1.034332275390625, 1.0778350830078125, 1.121337890625, 1.1648406982421875, 1.208343505859375, 1.2518463134765625, 1.29534912109375, 1.3388519287109375, 1.382354736328125, 1.4258575439453125, 1.4693603515625, 1.5128631591796875, 1.556365966796875, 1.5998687744140625, 1.64337158203125, 1.6868743896484375, 1.730377197265625, 1.7738800048828125, 1.8173828125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 26.0, 67.0, 163.0, 281.0, 214.0, 152.0, 69.0, 16.0, 9.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.900103569030762, -8.515300750732422, -8.130497932434082, -7.745695114135742, -7.360892295837402, -6.9760894775390625, -6.591286659240723, -6.206483840942383, -5.821681022644043, -5.436878204345703, -5.052075386047363, -4.667272567749023, -4.282469749450684, -3.8976669311523438, -3.512863874435425, -3.128061056137085, -2.743257999420166, -2.358455181121826, -1.9736523628234863, -1.588849425315857, -1.204046607017517, -0.8192437887191772, -0.43444085121154785, -0.04963803291320801, 0.33516478538513184, 0.7199676036834717, 1.1047704219818115, 1.489573359489441, 1.8743761777877808, 2.25917911529541, 2.64398193359375, 3.02878475189209, 3.4135875701904297, 3.7983903884887695, 4.183193206787109, 4.567996025085449, 4.952798843383789, 5.337601661682129, 5.722404479980469, 6.107207298278809, 6.492010116577148, 6.876812934875488, 7.261615753173828, 7.646418571472168, 8.031221389770508, 8.416024208068848, 8.800827026367188, 9.185629844665527, 9.570432662963867, 9.955235481262207, 10.340038299560547, 10.724841117858887, 11.109643936157227, 11.494446754455566, 11.879249572753906, 12.264052391052246, 12.648856163024902, 13.033658981323242, 13.418461799621582, 13.803264617919922, 14.188067436218262, 14.572870254516602, 14.957673072814941, 15.342475891113281, 15.727278709411621]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 10.0, 10.0, 13.0, 14.0, 18.0, 17.0, 18.0, 33.0, 37.0, 35.0, 23.0, 52.0, 36.0, 55.0, 46.0, 51.0, 43.0, 56.0, 46.0, 35.0, 52.0, 46.0, 39.0, 27.0, 28.0, 20.0, 27.0, 19.0, 20.0, 16.0, 11.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.871958255767822, -4.739504337310791, -4.60705041885376, -4.4745965003967285, -4.342142581939697, -4.209688186645508, -4.077234268188477, -3.9447805881500244, -3.812326431274414, -3.679872512817383, -3.5474185943603516, -3.4149646759033203, -3.28251051902771, -3.1500566005706787, -3.0176026821136475, -2.885148763656616, -2.752694845199585, -2.6202409267425537, -2.4877870082855225, -2.355332851409912, -2.222878932952881, -2.0904250144958496, -1.9579710960388184, -1.825517177581787, -1.6930631399154663, -1.560609221458435, -1.4281551837921143, -1.295701265335083, -1.1632473468780518, -1.030793309211731, -0.8983393907546997, -0.7658854126930237, -0.6334316730499268, -0.5009776949882507, -0.3685237467288971, -0.23606979846954346, -0.10361582040786743, 0.028838157653808594, 0.16129207611083984, 0.29374605417251587, 0.4262000322341919, 0.5586540102958679, 0.691107988357544, 0.8235619068145752, 0.9560158848762512, 1.0884698629379272, 1.2209237813949585, 1.3533778190612793, 1.4858317375183105, 1.6182856559753418, 1.7507396936416626, 1.8831936120986938, 2.0156476497650146, 2.148101568222046, 2.280555486679077, 2.4130094051361084, 2.5454635620117188, 2.67791748046875, 2.8103713989257812, 2.9428253173828125, 3.075279474258423, 3.207733392715454, 3.3401873111724854, 3.4726412296295166, 3.605095148086548]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 12.0, 13.0, 12.0, 28.0, 48.0, 64.0, 137.0, 190.0, 368.0, 774.0, 1682.0, 3898.0, 10728.0, 33113.0, 108155.0, 290064.0, 355441.0, 165803.0, 51501.0, 16400.0, 5685.0, 2247.0, 1059.0, 487.0, 281.0, 165.0, 74.0, 37.0, 34.0, 13.0, 14.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.11328125, -3.024810791015625, -2.93634033203125, -2.847869873046875, -2.7593994140625, -2.670928955078125, -2.58245849609375, -2.493988037109375, -2.405517578125, -2.317047119140625, -2.22857666015625, -2.140106201171875, -2.0516357421875, -1.963165283203125, -1.87469482421875, -1.786224365234375, -1.69775390625, -1.609283447265625, -1.52081298828125, -1.432342529296875, -1.3438720703125, -1.255401611328125, -1.16693115234375, -1.078460693359375, -0.989990234375, -0.901519775390625, -0.81304931640625, -0.724578857421875, -0.6361083984375, -0.547637939453125, -0.45916748046875, -0.370697021484375, -0.2822265625, -0.193756103515625, -0.10528564453125, -0.016815185546875, 0.0716552734375, 0.160125732421875, 0.24859619140625, 0.337066650390625, 0.425537109375, 0.514007568359375, 0.60247802734375, 0.690948486328125, 0.7794189453125, 0.867889404296875, 0.95635986328125, 1.044830322265625, 1.13330078125, 1.221771240234375, 1.31024169921875, 1.398712158203125, 1.4871826171875, 1.575653076171875, 1.66412353515625, 1.752593994140625, 1.841064453125, 1.929534912109375, 2.01800537109375, 2.106475830078125, 2.1949462890625, 2.283416748046875, 2.37188720703125, 2.460357666015625, 2.548828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 6.0, 10.0, 8.0, 22.0, 24.0, 30.0, 27.0, 38.0, 50.0, 66.0, 75.0, 92.0, 72.0, 58.0, 65.0, 64.0, 56.0, 48.0, 37.0, 36.0, 35.0, 28.0, 25.0, 15.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.470703125, -1.43560791015625, -1.4005126953125, -1.36541748046875, -1.330322265625, -1.29522705078125, -1.2601318359375, -1.22503662109375, -1.18994140625, -1.15484619140625, -1.1197509765625, -1.08465576171875, -1.049560546875, -1.01446533203125, -0.9793701171875, -0.94427490234375, -0.9091796875, -0.87408447265625, -0.8389892578125, -0.80389404296875, -0.768798828125, -0.73370361328125, -0.6986083984375, -0.66351318359375, -0.62841796875, -0.59332275390625, -0.5582275390625, -0.52313232421875, -0.488037109375, -0.45294189453125, -0.4178466796875, -0.38275146484375, -0.34765625, -0.31256103515625, -0.2774658203125, -0.24237060546875, -0.207275390625, -0.17218017578125, -0.1370849609375, -0.10198974609375, -0.06689453125, -0.03179931640625, 0.0032958984375, 0.03839111328125, 0.073486328125, 0.10858154296875, 0.1436767578125, 0.17877197265625, 0.2138671875, 0.24896240234375, 0.2840576171875, 0.31915283203125, 0.354248046875, 0.38934326171875, 0.4244384765625, 0.45953369140625, 0.49462890625, 0.52972412109375, 0.5648193359375, 0.59991455078125, 0.635009765625, 0.67010498046875, 0.7052001953125, 0.74029541015625, 0.775390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 6.0, 8.0, 10.0, 16.0, 19.0, 22.0, 35.0, 41.0, 55.0, 82.0, 113.0, 154.0, 224.0, 345.0, 561.0, 1162.0, 2580.0, 7084.0, 21492.0, 74244.0, 239469.0, 410048.0, 201497.0, 60712.0, 17873.0, 5886.0, 2249.0, 1016.0, 496.0, 323.0, 184.0, 140.0, 110.0, 84.0, 43.0, 38.0, 28.0, 21.0, 18.0, 14.0, 11.0, 9.0, 8.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.85546875, -2.76458740234375, -2.6737060546875, -2.58282470703125, -2.491943359375, -2.40106201171875, -2.3101806640625, -2.21929931640625, -2.12841796875, -2.03753662109375, -1.9466552734375, -1.85577392578125, -1.764892578125, -1.67401123046875, -1.5831298828125, -1.49224853515625, -1.4013671875, -1.31048583984375, -1.2196044921875, -1.12872314453125, -1.037841796875, -0.94696044921875, -0.8560791015625, -0.76519775390625, -0.67431640625, -0.58343505859375, -0.4925537109375, -0.40167236328125, -0.310791015625, -0.21990966796875, -0.1290283203125, -0.03814697265625, 0.052734375, 0.14361572265625, 0.2344970703125, 0.32537841796875, 0.416259765625, 0.50714111328125, 0.5980224609375, 0.68890380859375, 0.77978515625, 0.87066650390625, 0.9615478515625, 1.05242919921875, 1.143310546875, 1.23419189453125, 1.3250732421875, 1.41595458984375, 1.5068359375, 1.59771728515625, 1.6885986328125, 1.77947998046875, 1.870361328125, 1.96124267578125, 2.0521240234375, 2.14300537109375, 2.23388671875, 2.32476806640625, 2.4156494140625, 2.50653076171875, 2.597412109375, 2.68829345703125, 2.7791748046875, 2.87005615234375, 2.9609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 12.0, 8.0, 11.0, 12.0, 15.0, 24.0, 24.0, 22.0, 29.0, 32.0, 38.0, 38.0, 33.0, 40.0, 41.0, 44.0, 46.0, 70.0, 48.0, 53.0, 49.0, 41.0, 41.0, 26.0, 33.0, 23.0, 26.0, 17.0, 23.0, 15.0, 13.0, 9.0, 9.0, 3.0, 6.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.41015625, -4.26812744140625, -4.1260986328125, -3.98406982421875, -3.842041015625, -3.70001220703125, -3.5579833984375, -3.41595458984375, -3.27392578125, -3.13189697265625, -2.9898681640625, -2.84783935546875, -2.705810546875, -2.56378173828125, -2.4217529296875, -2.27972412109375, -2.1376953125, -1.99566650390625, -1.8536376953125, -1.71160888671875, -1.569580078125, -1.42755126953125, -1.2855224609375, -1.14349365234375, -1.00146484375, -0.85943603515625, -0.7174072265625, -0.57537841796875, -0.433349609375, -0.29132080078125, -0.1492919921875, -0.00726318359375, 0.134765625, 0.27679443359375, 0.4188232421875, 0.56085205078125, 0.702880859375, 0.84490966796875, 0.9869384765625, 1.12896728515625, 1.27099609375, 1.41302490234375, 1.5550537109375, 1.69708251953125, 1.839111328125, 1.98114013671875, 2.1231689453125, 2.26519775390625, 2.4072265625, 2.54925537109375, 2.6912841796875, 2.83331298828125, 2.975341796875, 3.11737060546875, 3.2593994140625, 3.40142822265625, 3.54345703125, 3.68548583984375, 3.8275146484375, 3.96954345703125, 4.111572265625, 4.25360107421875, 4.3956298828125, 4.53765869140625, 4.6796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 21.0, 22.0, 35.0, 60.0, 98.0, 180.0, 409.0, 1512.0, 8374.0, 233231.0, 777994.0, 22663.0, 2729.0, 660.0, 255.0, 123.0, 63.0, 29.0, 26.0, 23.0, 5.0, 9.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.701751708984375, -3.56561279296875, -3.429473876953125, -3.2933349609375, -3.157196044921875, -3.02105712890625, -2.884918212890625, -2.748779296875, -2.612640380859375, -2.47650146484375, -2.340362548828125, -2.2042236328125, -2.068084716796875, -1.93194580078125, -1.795806884765625, -1.65966796875, -1.523529052734375, -1.38739013671875, -1.251251220703125, -1.1151123046875, -0.978973388671875, -0.84283447265625, -0.706695556640625, -0.570556640625, -0.434417724609375, -0.29827880859375, -0.162139892578125, -0.0260009765625, 0.110137939453125, 0.24627685546875, 0.382415771484375, 0.5185546875, 0.654693603515625, 0.79083251953125, 0.926971435546875, 1.0631103515625, 1.199249267578125, 1.33538818359375, 1.471527099609375, 1.607666015625, 1.743804931640625, 1.87994384765625, 2.016082763671875, 2.1522216796875, 2.288360595703125, 2.42449951171875, 2.560638427734375, 2.69677734375, 2.832916259765625, 2.96905517578125, 3.105194091796875, 3.2413330078125, 3.377471923828125, 3.51361083984375, 3.649749755859375, 3.785888671875, 3.922027587890625, 4.05816650390625, 4.194305419921875, 4.3304443359375, 4.466583251953125, 4.60272216796875, 4.738861083984375, 4.875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 16.0, 20.0, 35.0, 67.0, 84.0, 104.0, 146.0, 150.0, 122.0, 90.0, 51.0, 44.0, 26.0, 18.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044536590576171875, -0.00043004751205444336, -0.00041472911834716797, -0.0003994107246398926, -0.0003840923309326172, -0.0003687739372253418, -0.0003534555435180664, -0.000338137149810791, -0.0003228187561035156, -0.00030750036239624023, -0.00029218196868896484, -0.00027686357498168945, -0.00026154518127441406, -0.00024622678756713867, -0.00023090839385986328, -0.0002155900001525879, -0.0002002716064453125, -0.0001849532127380371, -0.00016963481903076172, -0.00015431642532348633, -0.00013899803161621094, -0.00012367963790893555, -0.00010836124420166016, -9.304285049438477e-05, -7.772445678710938e-05, -6.240606307983398e-05, -4.7087669372558594e-05, -3.17692756652832e-05, -1.6450881958007812e-05, -1.1324882507324219e-06, 1.4185905456542969e-05, 2.950429916381836e-05, 4.482269287109375e-05, 6.014108657836914e-05, 7.545948028564453e-05, 9.077787399291992e-05, 0.00010609626770019531, 0.0001214146614074707, 0.0001367330551147461, 0.00015205144882202148, 0.00016736984252929688, 0.00018268823623657227, 0.00019800662994384766, 0.00021332502365112305, 0.00022864341735839844, 0.00024396181106567383, 0.0002592802047729492, 0.0002745985984802246, 0.0002899169921875, 0.0003052353858947754, 0.0003205537796020508, 0.00033587217330932617, 0.00035119056701660156, 0.00036650896072387695, 0.00038182735443115234, 0.00039714574813842773, 0.0004124641418457031, 0.0004277825355529785, 0.0004431009292602539, 0.0004584193229675293, 0.0004737377166748047, 0.0004890561103820801, 0.0005043745040893555, 0.0005196928977966309, 0.0005350112915039062]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 11.0, 8.0, 17.0, 21.0, 30.0, 52.0, 100.0, 160.0, 331.0, 588.0, 1377.0, 3942.0, 16422.0, 101309.0, 557419.0, 308239.0, 45260.0, 8671.0, 2499.0, 1008.0, 455.0, 252.0, 142.0, 78.0, 43.0, 37.0, 20.0, 14.0, 11.0, 9.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7314453125, -1.6713104248046875, -1.611175537109375, -1.5510406494140625, -1.49090576171875, -1.4307708740234375, -1.370635986328125, -1.3105010986328125, -1.2503662109375, -1.1902313232421875, -1.130096435546875, -1.0699615478515625, -1.00982666015625, -0.9496917724609375, -0.889556884765625, -0.8294219970703125, -0.769287109375, -0.7091522216796875, -0.649017333984375, -0.5888824462890625, -0.52874755859375, -0.4686126708984375, -0.408477783203125, -0.3483428955078125, -0.2882080078125, -0.2280731201171875, -0.167938232421875, -0.1078033447265625, -0.04766845703125, 0.0124664306640625, 0.072601318359375, 0.1327362060546875, 0.19287109375, 0.2530059814453125, 0.313140869140625, 0.3732757568359375, 0.43341064453125, 0.4935455322265625, 0.553680419921875, 0.6138153076171875, 0.6739501953125, 0.7340850830078125, 0.794219970703125, 0.8543548583984375, 0.91448974609375, 0.9746246337890625, 1.034759521484375, 1.0948944091796875, 1.155029296875, 1.2151641845703125, 1.275299072265625, 1.3354339599609375, 1.39556884765625, 1.4557037353515625, 1.515838623046875, 1.5759735107421875, 1.6361083984375, 1.6962432861328125, 1.756378173828125, 1.8165130615234375, 1.87664794921875, 1.9367828369140625, 1.996917724609375, 2.0570526123046875, 2.1171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 9.0, 10.0, 22.0, 27.0, 34.0, 37.0, 66.0, 84.0, 105.0, 150.0, 119.0, 76.0, 58.0, 62.0, 34.0, 31.0, 22.0, 15.0, 6.0, 6.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.25390625, -3.1739349365234375, -3.093963623046875, -3.0139923095703125, -2.93402099609375, -2.8540496826171875, -2.774078369140625, -2.6941070556640625, -2.6141357421875, -2.5341644287109375, -2.454193115234375, -2.3742218017578125, -2.29425048828125, -2.2142791748046875, -2.134307861328125, -2.0543365478515625, -1.974365234375, -1.8943939208984375, -1.814422607421875, -1.7344512939453125, -1.65447998046875, -1.5745086669921875, -1.494537353515625, -1.4145660400390625, -1.3345947265625, -1.2546234130859375, -1.174652099609375, -1.0946807861328125, -1.01470947265625, -0.9347381591796875, -0.854766845703125, -0.7747955322265625, -0.69482421875, -0.6148529052734375, -0.534881591796875, -0.4549102783203125, -0.37493896484375, -0.2949676513671875, -0.214996337890625, -0.1350250244140625, -0.0550537109375, 0.0249176025390625, 0.104888916015625, 0.1848602294921875, 0.26483154296875, 0.3448028564453125, 0.424774169921875, 0.5047454833984375, 0.584716796875, 0.6646881103515625, 0.744659423828125, 0.8246307373046875, 0.90460205078125, 0.9845733642578125, 1.064544677734375, 1.1445159912109375, 1.2244873046875, 1.3044586181640625, 1.384429931640625, 1.4644012451171875, 1.54437255859375, 1.6243438720703125, 1.704315185546875, 1.7842864990234375, 1.8642578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 21.0, 38.0, 75.0, 145.0, 233.0, 220.0, 140.0, 74.0, 28.0, 16.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.66496658325195, -46.12830352783203, -44.591644287109375, -43.05498123168945, -41.5183219909668, -39.981658935546875, -38.44499969482422, -36.9083366394043, -35.371673583984375, -33.83501052856445, -32.2983512878418, -30.761688232421875, -29.22502899169922, -27.688365936279297, -26.151704788208008, -24.61504364013672, -23.078384399414062, -21.541723251342773, -20.005062103271484, -18.468399047851562, -16.931739807128906, -15.3950777053833, -13.858415603637695, -12.321754455566406, -10.785093307495117, -9.248432159423828, -7.711770534515381, -6.175108909606934, -4.6384477615356445, -3.1017866134643555, -1.56512451171875, -0.028463363647460938, 1.5081939697265625, 3.0448553562164307, 4.581516742706299, 6.118178367614746, 7.654839515686035, 9.191500663757324, 10.72816276550293, 12.264823913574219, 13.801485061645508, 15.338146209716797, 16.874807357788086, 18.411468505859375, 19.948131561279297, 21.484790802001953, 23.021453857421875, 24.558115005493164, 26.094776153564453, 27.631437301635742, 29.16809844970703, 30.704761505126953, 32.24142074584961, 33.77808380126953, 35.31474304199219, 36.85140609741211, 38.38806915283203, 39.92473220825195, 41.46139144897461, 42.99805450439453, 44.53471374511719, 46.07137680053711, 47.60803985595703, 49.14469909667969, 50.681358337402344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 9.0, 6.0, 7.0, 13.0, 13.0, 21.0, 20.0, 18.0, 30.0, 29.0, 29.0, 30.0, 43.0, 31.0, 57.0, 45.0, 36.0, 43.0, 46.0, 42.0, 49.0, 46.0, 35.0, 34.0, 30.0, 28.0, 23.0, 20.0, 25.0, 24.0, 23.0, 13.0, 11.0, 12.0, 8.0, 9.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.401382446289062, -25.59588623046875, -24.79039192199707, -23.984895706176758, -23.179399490356445, -22.373905181884766, -21.568408966064453, -20.76291275024414, -19.957416534423828, -19.151920318603516, -18.346426010131836, -17.540929794311523, -16.73543357849121, -15.929938316345215, -15.124443054199219, -14.318946838378906, -13.51345157623291, -12.707956314086914, -11.902460098266602, -11.096964836120605, -10.291468620300293, -9.485973358154297, -8.680477142333984, -7.874981880187988, -7.069486141204834, -6.26399040222168, -5.458494663238525, -4.652998924255371, -3.847503423690796, -3.0420079231262207, -2.2365121841430664, -1.431016445159912, -0.6255207061767578, 0.1799749732017517, 0.9854706525802612, 1.790966272354126, 2.5964620113372803, 3.4019575119018555, 4.20745325088501, 5.012948989868164, 5.818444728851318, 6.623940467834473, 7.429436206817627, 8.234931945800781, 9.040427207946777, 9.845922470092773, 10.651418685913086, 11.456914901733398, 12.262410163879395, 13.06790542602539, 13.873401641845703, 14.6788969039917, 15.484393119812012, 16.289888381958008, 17.09538459777832, 17.90087890625, 18.706375122070312, 19.511871337890625, 20.317365646362305, 21.122861862182617, 21.92835807800293, 22.73385238647461, 23.539348602294922, 24.344844818115234, 25.150341033935547]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 7.0, 13.0, 10.0, 20.0, 24.0, 23.0, 59.0, 80.0, 120.0, 277.0, 719.0, 2532.0, 12686.0, 146946.0, 3978084.0, 43753.0, 6442.0, 1569.0, 475.0, 195.0, 79.0, 50.0, 39.0, 19.0, 17.0, 9.0, 12.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.1597900390625, -4.983642578125, -4.8074951171875, -4.63134765625, -4.4552001953125, -4.279052734375, -4.1029052734375, -3.9267578125, -3.7506103515625, -3.574462890625, -3.3983154296875, -3.22216796875, -3.0460205078125, -2.869873046875, -2.6937255859375, -2.517578125, -2.3414306640625, -2.165283203125, -1.9891357421875, -1.81298828125, -1.6368408203125, -1.460693359375, -1.2845458984375, -1.1083984375, -0.9322509765625, -0.756103515625, -0.5799560546875, -0.40380859375, -0.2276611328125, -0.051513671875, 0.1246337890625, 0.30078125, 0.4769287109375, 0.653076171875, 0.8292236328125, 1.00537109375, 1.1815185546875, 1.357666015625, 1.5338134765625, 1.7099609375, 1.8861083984375, 2.062255859375, 2.2384033203125, 2.41455078125, 2.5906982421875, 2.766845703125, 2.9429931640625, 3.119140625, 3.2952880859375, 3.471435546875, 3.6475830078125, 3.82373046875, 3.9998779296875, 4.176025390625, 4.3521728515625, 4.5283203125, 4.7044677734375, 4.880615234375, 5.0567626953125, 5.23291015625, 5.4090576171875, 5.585205078125, 5.7613525390625, 5.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 11.0, 10.0, 14.0, 18.0, 23.0, 35.0, 29.0, 46.0, 60.0, 61.0, 74.0, 67.0, 71.0, 67.0, 70.0, 62.0, 35.0, 50.0, 46.0, 30.0, 24.0, 17.0, 17.0, 18.0, 10.0, 7.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.498046875, -1.4535064697265625, -1.408966064453125, -1.3644256591796875, -1.31988525390625, -1.2753448486328125, -1.230804443359375, -1.1862640380859375, -1.1417236328125, -1.0971832275390625, -1.052642822265625, -1.0081024169921875, -0.96356201171875, -0.9190216064453125, -0.874481201171875, -0.8299407958984375, -0.785400390625, -0.7408599853515625, -0.696319580078125, -0.6517791748046875, -0.60723876953125, -0.5626983642578125, -0.518157958984375, -0.4736175537109375, -0.4290771484375, -0.3845367431640625, -0.339996337890625, -0.2954559326171875, -0.25091552734375, -0.2063751220703125, -0.161834716796875, -0.1172943115234375, -0.07275390625, -0.0282135009765625, 0.016326904296875, 0.0608673095703125, 0.10540771484375, 0.1499481201171875, 0.194488525390625, 0.2390289306640625, 0.2835693359375, 0.3281097412109375, 0.372650146484375, 0.4171905517578125, 0.46173095703125, 0.5062713623046875, 0.550811767578125, 0.5953521728515625, 0.639892578125, 0.6844329833984375, 0.728973388671875, 0.7735137939453125, 0.81805419921875, 0.8625946044921875, 0.907135009765625, 0.9516754150390625, 0.9962158203125, 1.0407562255859375, 1.085296630859375, 1.1298370361328125, 1.17437744140625, 1.2189178466796875, 1.263458251953125, 1.3079986572265625, 1.3525390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 10.0, 3.0, 5.0, 9.0, 22.0, 29.0, 27.0, 36.0, 65.0, 87.0, 102.0, 197.0, 310.0, 557.0, 988.0, 1802.0, 3366.0, 7647.0, 21099.0, 88738.0, 3635451.0, 365484.0, 43897.0, 13083.0, 5323.0, 2564.0, 1339.0, 837.0, 423.0, 270.0, 156.0, 116.0, 74.0, 42.0, 33.0, 29.0, 21.0, 14.0, 6.0, 10.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.83465576171875, -2.7454833984375, -2.65631103515625, -2.567138671875, -2.47796630859375, -2.3887939453125, -2.29962158203125, -2.21044921875, -2.12127685546875, -2.0321044921875, -1.94293212890625, -1.853759765625, -1.76458740234375, -1.6754150390625, -1.58624267578125, -1.4970703125, -1.40789794921875, -1.3187255859375, -1.22955322265625, -1.140380859375, -1.05120849609375, -0.9620361328125, -0.87286376953125, -0.78369140625, -0.69451904296875, -0.6053466796875, -0.51617431640625, -0.427001953125, -0.33782958984375, -0.2486572265625, -0.15948486328125, -0.0703125, 0.01885986328125, 0.1080322265625, 0.19720458984375, 0.286376953125, 0.37554931640625, 0.4647216796875, 0.55389404296875, 0.64306640625, 0.73223876953125, 0.8214111328125, 0.91058349609375, 0.999755859375, 1.08892822265625, 1.1781005859375, 1.26727294921875, 1.3564453125, 1.44561767578125, 1.5347900390625, 1.62396240234375, 1.713134765625, 1.80230712890625, 1.8914794921875, 1.98065185546875, 2.06982421875, 2.15899658203125, 2.2481689453125, 2.33734130859375, 2.426513671875, 2.51568603515625, 2.6048583984375, 2.69403076171875, 2.783203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 1.0, 9.0, 4.0, 11.0, 23.0, 19.0, 29.0, 59.0, 123.0, 319.0, 2833.0, 373.0, 104.0, 60.0, 21.0, 25.0, 18.0, 9.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85107421875, -0.8271560668945312, -0.8032379150390625, -0.7793197631835938, -0.755401611328125, -0.7314834594726562, -0.7075653076171875, -0.6836471557617188, -0.65972900390625, -0.6358108520507812, -0.6118927001953125, -0.5879745483398438, -0.564056396484375, -0.5401382446289062, -0.5162200927734375, -0.49230194091796875, -0.4683837890625, -0.44446563720703125, -0.4205474853515625, -0.39662933349609375, -0.372711181640625, -0.34879302978515625, -0.3248748779296875, -0.30095672607421875, -0.27703857421875, -0.25312042236328125, -0.2292022705078125, -0.20528411865234375, -0.181365966796875, -0.15744781494140625, -0.1335296630859375, -0.10961151123046875, -0.085693359375, -0.06177520751953125, -0.0378570556640625, -0.01393890380859375, 0.009979248046875, 0.03389739990234375, 0.0578155517578125, 0.08173370361328125, 0.10565185546875, 0.12957000732421875, 0.1534881591796875, 0.17740631103515625, 0.201324462890625, 0.22524261474609375, 0.2491607666015625, 0.27307891845703125, 0.2969970703125, 0.32091522216796875, 0.3448333740234375, 0.36875152587890625, 0.392669677734375, 0.41658782958984375, 0.4405059814453125, 0.46442413330078125, 0.48834228515625, 0.5122604370117188, 0.5361785888671875, 0.5600967407226562, 0.584014892578125, 0.6079330444335938, 0.6318511962890625, 0.6557693481445312, 0.6796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 13.0, 21.0, 57.0, 148.0, 281.0, 277.0, 140.0, 51.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.58993148803711, -11.360471725463867, -11.131011009216309, -10.901551246643066, -10.672090530395508, -10.442630767822266, -10.213171005249023, -9.983710289001465, -9.754250526428223, -9.52479076385498, -9.295330047607422, -9.06587028503418, -8.836410522460938, -8.606949806213379, -8.377490043640137, -8.148029327392578, -7.918569564819336, -7.6891093254089355, -7.459649085998535, -7.230189323425293, -7.000729084014893, -6.771268844604492, -6.54180908203125, -6.31234884262085, -6.082888603210449, -5.853428363800049, -5.623968124389648, -5.394508361816406, -5.165048122406006, -4.9355878829956055, -4.706128120422363, -4.476667881011963, -4.247207164764404, -4.017746925354004, -3.7882869243621826, -3.5588269233703613, -3.329366683959961, -3.0999064445495605, -2.8704464435577393, -2.640986442565918, -2.4115262031555176, -2.182065963745117, -1.952605962753296, -1.723145842552185, -1.4936857223510742, -1.2642256021499634, -1.0347654819488525, -0.8053053617477417, -0.5758452415466309, -0.34638512134552, -0.11692500114440918, 0.11253511905670166, 0.3419952392578125, 0.5714553594589233, 0.8009154796600342, 1.030375599861145, 1.2598357200622559, 1.4892958402633667, 1.7187559604644775, 1.9482160806655884, 2.177676200866699, 2.4071364402770996, 2.636596441268921, 2.866056442260742, 3.0955166816711426]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 9.0, 6.0, 13.0, 14.0, 9.0, 15.0, 16.0, 19.0, 14.0, 29.0, 35.0, 36.0, 35.0, 28.0, 33.0, 38.0, 41.0, 41.0, 41.0, 45.0, 46.0, 32.0, 42.0, 48.0, 31.0, 35.0, 30.0, 27.0, 29.0, 18.0, 28.0, 19.0, 10.0, 13.0, 17.0, 8.0, 12.0, 15.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9324939250946045, -1.8687617778778076, -1.8050297498703003, -1.7412976026535034, -1.677565574645996, -1.6138334274291992, -1.5501012802124023, -1.4863691329956055, -1.4226371049880981, -1.3589049577713013, -1.295172929763794, -1.231440782546997, -1.1677086353302002, -1.1039766073226929, -1.040244460105896, -0.9765123724937439, -0.9127802848815918, -0.8490481972694397, -0.7853161096572876, -0.7215839624404907, -0.6578518748283386, -0.5941197872161865, -0.5303876399993896, -0.46665555238723755, -0.40292346477508545, -0.33919137716293335, -0.27545925974845886, -0.21172715723514557, -0.14799505472183228, -0.08426296710968018, -0.02053084969520569, 0.0432012677192688, 0.10693359375, 0.1706656962633133, 0.2343977987766266, 0.2981299161911011, 0.3618620038032532, 0.4255940914154053, 0.48932620882987976, 0.5530583262443542, 0.6167904138565063, 0.6805225014686584, 0.7442545890808105, 0.8079867362976074, 0.8717188239097595, 0.9354509115219116, 0.9991830587387085, 1.0629150867462158, 1.1266472339630127, 1.1903793811798096, 1.254111409187317, 1.3178435564041138, 1.381575584411621, 1.445307731628418, 1.5090398788452148, 1.5727720260620117, 1.636504054069519, 1.700236201286316, 1.7639682292938232, 1.8277003765106201, 1.891432523727417, 1.9551645517349243, 2.0188965797424316, 2.0826287269592285, 2.1463608741760254]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 13.0, 17.0, 24.0, 37.0, 57.0, 91.0, 162.0, 306.0, 700.0, 1732.0, 4718.0, 14387.0, 51946.0, 197220.0, 433528.0, 248748.0, 67391.0, 17931.0, 5772.0, 2131.0, 870.0, 334.0, 189.0, 82.0, 46.0, 29.0, 29.0, 12.0, 13.0, 13.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.09765625, -3.985687255859375, -3.87371826171875, -3.761749267578125, -3.6497802734375, -3.537811279296875, -3.42584228515625, -3.313873291015625, -3.201904296875, -3.089935302734375, -2.97796630859375, -2.865997314453125, -2.7540283203125, -2.642059326171875, -2.53009033203125, -2.418121337890625, -2.30615234375, -2.194183349609375, -2.08221435546875, -1.970245361328125, -1.8582763671875, -1.746307373046875, -1.63433837890625, -1.522369384765625, -1.410400390625, -1.298431396484375, -1.18646240234375, -1.074493408203125, -0.9625244140625, -0.850555419921875, -0.73858642578125, -0.626617431640625, -0.5146484375, -0.402679443359375, -0.29071044921875, -0.178741455078125, -0.0667724609375, 0.045196533203125, 0.15716552734375, 0.269134521484375, 0.381103515625, 0.493072509765625, 0.60504150390625, 0.717010498046875, 0.8289794921875, 0.940948486328125, 1.05291748046875, 1.164886474609375, 1.27685546875, 1.388824462890625, 1.50079345703125, 1.612762451171875, 1.7247314453125, 1.836700439453125, 1.94866943359375, 2.060638427734375, 2.172607421875, 2.284576416015625, 2.39654541015625, 2.508514404296875, 2.6204833984375, 2.732452392578125, 2.84442138671875, 2.956390380859375, 3.068359375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 12.0, 5.0, 7.0, 9.0, 14.0, 12.0, 15.0, 19.0, 25.0, 45.0, 43.0, 43.0, 46.0, 59.0, 65.0, 64.0, 48.0, 58.0, 48.0, 51.0, 64.0, 43.0, 38.0, 35.0, 30.0, 24.0, 19.0, 11.0, 8.0, 12.0, 9.0, 3.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.494140625, -1.4532470703125, -1.412353515625, -1.3714599609375, -1.33056640625, -1.2896728515625, -1.248779296875, -1.2078857421875, -1.1669921875, -1.1260986328125, -1.085205078125, -1.0443115234375, -1.00341796875, -0.9625244140625, -0.921630859375, -0.8807373046875, -0.83984375, -0.7989501953125, -0.758056640625, -0.7171630859375, -0.67626953125, -0.6353759765625, -0.594482421875, -0.5535888671875, -0.5126953125, -0.4718017578125, -0.430908203125, -0.3900146484375, -0.34912109375, -0.3082275390625, -0.267333984375, -0.2264404296875, -0.185546875, -0.1446533203125, -0.103759765625, -0.0628662109375, -0.02197265625, 0.0189208984375, 0.059814453125, 0.1007080078125, 0.1416015625, 0.1824951171875, 0.223388671875, 0.2642822265625, 0.30517578125, 0.3460693359375, 0.386962890625, 0.4278564453125, 0.46875, 0.5096435546875, 0.550537109375, 0.5914306640625, 0.63232421875, 0.6732177734375, 0.714111328125, 0.7550048828125, 0.7958984375, 0.8367919921875, 0.877685546875, 0.9185791015625, 0.95947265625, 1.0003662109375, 1.041259765625, 1.0821533203125, 1.123046875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 10.0, 14.0, 21.0, 27.0, 40.0, 59.0, 91.0, 192.0, 260.0, 560.0, 1411.0, 3824.0, 15501.0, 105096.0, 648670.0, 233968.0, 29228.0, 6031.0, 1901.0, 770.0, 336.0, 193.0, 102.0, 83.0, 47.0, 28.0, 21.0, 12.0, 13.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.875, -6.68231201171875, -6.4896240234375, -6.29693603515625, -6.104248046875, -5.91156005859375, -5.7188720703125, -5.52618408203125, -5.33349609375, -5.14080810546875, -4.9481201171875, -4.75543212890625, -4.562744140625, -4.37005615234375, -4.1773681640625, -3.98468017578125, -3.7919921875, -3.59930419921875, -3.4066162109375, -3.21392822265625, -3.021240234375, -2.82855224609375, -2.6358642578125, -2.44317626953125, -2.25048828125, -2.05780029296875, -1.8651123046875, -1.67242431640625, -1.479736328125, -1.28704833984375, -1.0943603515625, -0.90167236328125, -0.708984375, -0.51629638671875, -0.3236083984375, -0.13092041015625, 0.061767578125, 0.25445556640625, 0.4471435546875, 0.63983154296875, 0.83251953125, 1.02520751953125, 1.2178955078125, 1.41058349609375, 1.603271484375, 1.79595947265625, 1.9886474609375, 2.18133544921875, 2.3740234375, 2.56671142578125, 2.7593994140625, 2.95208740234375, 3.144775390625, 3.33746337890625, 3.5301513671875, 3.72283935546875, 3.91552734375, 4.10821533203125, 4.3009033203125, 4.49359130859375, 4.686279296875, 4.87896728515625, 5.0716552734375, 5.26434326171875, 5.45703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 8.0, 13.0, 18.0, 16.0, 36.0, 33.0, 27.0, 31.0, 43.0, 42.0, 59.0, 55.0, 45.0, 62.0, 45.0, 48.0, 57.0, 53.0, 52.0, 43.0, 42.0, 29.0, 26.0, 17.0, 15.0, 12.0, 9.0, 14.0, 6.0, 6.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.93115234375, -8.6748046875, -8.41845703125, -8.162109375, -7.90576171875, -7.6494140625, -7.39306640625, -7.13671875, -6.88037109375, -6.6240234375, -6.36767578125, -6.111328125, -5.85498046875, -5.5986328125, -5.34228515625, -5.0859375, -4.82958984375, -4.5732421875, -4.31689453125, -4.060546875, -3.80419921875, -3.5478515625, -3.29150390625, -3.03515625, -2.77880859375, -2.5224609375, -2.26611328125, -2.009765625, -1.75341796875, -1.4970703125, -1.24072265625, -0.984375, -0.72802734375, -0.4716796875, -0.21533203125, 0.041015625, 0.29736328125, 0.5537109375, 0.81005859375, 1.06640625, 1.32275390625, 1.5791015625, 1.83544921875, 2.091796875, 2.34814453125, 2.6044921875, 2.86083984375, 3.1171875, 3.37353515625, 3.6298828125, 3.88623046875, 4.142578125, 4.39892578125, 4.6552734375, 4.91162109375, 5.16796875, 5.42431640625, 5.6806640625, 5.93701171875, 6.193359375, 6.44970703125, 6.7060546875, 6.96240234375, 7.21875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 10.0, 10.0, 16.0, 34.0, 44.0, 87.0, 157.0, 329.0, 899.0, 4437.0, 105875.0, 916142.0, 17491.0, 1974.0, 564.0, 181.0, 121.0, 62.0, 36.0, 34.0, 16.0, 11.0, 4.0, 5.0, 0.0, 2.0, 4.0, 2.0, 3.0], "bins": [-9.671875, -9.462860107421875, -9.25384521484375, -9.044830322265625, -8.8358154296875, -8.626800537109375, -8.41778564453125, -8.208770751953125, -7.999755859375, -7.790740966796875, -7.58172607421875, -7.372711181640625, -7.1636962890625, -6.954681396484375, -6.74566650390625, -6.536651611328125, -6.32763671875, -6.118621826171875, -5.90960693359375, -5.700592041015625, -5.4915771484375, -5.282562255859375, -5.07354736328125, -4.864532470703125, -4.655517578125, -4.446502685546875, -4.23748779296875, -4.028472900390625, -3.8194580078125, -3.610443115234375, -3.40142822265625, -3.192413330078125, -2.9833984375, -2.774383544921875, -2.56536865234375, -2.356353759765625, -2.1473388671875, -1.938323974609375, -1.72930908203125, -1.520294189453125, -1.311279296875, -1.102264404296875, -0.89324951171875, -0.684234619140625, -0.4752197265625, -0.266204833984375, -0.05718994140625, 0.151824951171875, 0.36083984375, 0.569854736328125, 0.77886962890625, 0.987884521484375, 1.1968994140625, 1.405914306640625, 1.61492919921875, 1.823944091796875, 2.032958984375, 2.241973876953125, 2.45098876953125, 2.660003662109375, 2.8690185546875, 3.078033447265625, 3.28704833984375, 3.496063232421875, 3.705078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 8.0, 12.0, 18.0, 34.0, 73.0, 128.0, 171.0, 187.0, 161.0, 102.0, 58.0, 24.0, 23.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045299530029296875, -0.00043076276779174805, -0.00040853023529052734, -0.00038629770278930664, -0.00036406517028808594, -0.00034183263778686523, -0.00031960010528564453, -0.00029736757278442383, -0.0002751350402832031, -0.0002529025077819824, -0.00023066997528076172, -0.00020843744277954102, -0.0001862049102783203, -0.0001639723777770996, -0.0001417398452758789, -0.0001195073127746582, -9.72747802734375e-05, -7.50422477722168e-05, -5.2809715270996094e-05, -3.057718276977539e-05, -8.344650268554688e-06, 1.3887882232666016e-05, 3.612041473388672e-05, 5.835294723510742e-05, 8.058547973632812e-05, 0.00010281801223754883, 0.00012505054473876953, 0.00014728307723999023, 0.00016951560974121094, 0.00019174814224243164, 0.00021398067474365234, 0.00023621320724487305, 0.00025844573974609375, 0.00028067827224731445, 0.00030291080474853516, 0.00032514333724975586, 0.00034737586975097656, 0.00036960840225219727, 0.00039184093475341797, 0.00041407346725463867, 0.0004363059997558594, 0.0004585385322570801, 0.0004807710647583008, 0.0005030035972595215, 0.0005252361297607422, 0.0005474686622619629, 0.0005697011947631836, 0.0005919337272644043, 0.000614166259765625, 0.0006363987922668457, 0.0006586313247680664, 0.0006808638572692871, 0.0007030963897705078, 0.0007253289222717285, 0.0007475614547729492, 0.0007697939872741699, 0.0007920265197753906, 0.0008142590522766113, 0.000836491584777832, 0.0008587241172790527, 0.0008809566497802734, 0.0009031891822814941, 0.0009254217147827148, 0.0009476542472839355, 0.0009698867797851562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 5.0, 9.0, 9.0, 10.0, 24.0, 27.0, 36.0, 55.0, 81.0, 121.0, 176.0, 360.0, 708.0, 1480.0, 4290.0, 17877.0, 161795.0, 742196.0, 99940.0, 13146.0, 3491.0, 1239.0, 572.0, 331.0, 170.0, 119.0, 63.0, 62.0, 36.0, 23.0, 16.0, 9.0, 11.0, 10.0, 11.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.58984375, -2.50738525390625, -2.4249267578125, -2.34246826171875, -2.260009765625, -2.17755126953125, -2.0950927734375, -2.01263427734375, -1.93017578125, -1.84771728515625, -1.7652587890625, -1.68280029296875, -1.600341796875, -1.51788330078125, -1.4354248046875, -1.35296630859375, -1.2705078125, -1.18804931640625, -1.1055908203125, -1.02313232421875, -0.940673828125, -0.85821533203125, -0.7757568359375, -0.69329833984375, -0.61083984375, -0.52838134765625, -0.4459228515625, -0.36346435546875, -0.281005859375, -0.19854736328125, -0.1160888671875, -0.03363037109375, 0.048828125, 0.13128662109375, 0.2137451171875, 0.29620361328125, 0.378662109375, 0.46112060546875, 0.5435791015625, 0.62603759765625, 0.70849609375, 0.79095458984375, 0.8734130859375, 0.95587158203125, 1.038330078125, 1.12078857421875, 1.2032470703125, 1.28570556640625, 1.3681640625, 1.45062255859375, 1.5330810546875, 1.61553955078125, 1.697998046875, 1.78045654296875, 1.8629150390625, 1.94537353515625, 2.02783203125, 2.11029052734375, 2.1927490234375, 2.27520751953125, 2.357666015625, 2.44012451171875, 2.5225830078125, 2.60504150390625, 2.6875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 10.0, 18.0, 16.0, 28.0, 50.0, 53.0, 76.0, 98.0, 162.0, 123.0, 108.0, 59.0, 39.0, 27.0, 16.0, 14.0, 13.0, 12.0, 8.0, 12.0, 8.0, 4.0, 9.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.828125, -3.7147216796875, -3.601318359375, -3.4879150390625, -3.37451171875, -3.2611083984375, -3.147705078125, -3.0343017578125, -2.9208984375, -2.8074951171875, -2.694091796875, -2.5806884765625, -2.46728515625, -2.3538818359375, -2.240478515625, -2.1270751953125, -2.013671875, -1.9002685546875, -1.786865234375, -1.6734619140625, -1.56005859375, -1.4466552734375, -1.333251953125, -1.2198486328125, -1.1064453125, -0.9930419921875, -0.879638671875, -0.7662353515625, -0.65283203125, -0.5394287109375, -0.426025390625, -0.3126220703125, -0.19921875, -0.0858154296875, 0.027587890625, 0.1409912109375, 0.25439453125, 0.3677978515625, 0.481201171875, 0.5946044921875, 0.7080078125, 0.8214111328125, 0.934814453125, 1.0482177734375, 1.16162109375, 1.2750244140625, 1.388427734375, 1.5018310546875, 1.615234375, 1.7286376953125, 1.842041015625, 1.9554443359375, 2.06884765625, 2.1822509765625, 2.295654296875, 2.4090576171875, 2.5224609375, 2.6358642578125, 2.749267578125, 2.8626708984375, 2.97607421875, 3.0894775390625, 3.202880859375, 3.3162841796875, 3.4296875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 9.0, 11.0, 18.0, 36.0, 69.0, 164.0, 195.0, 234.0, 136.0, 85.0, 29.0, 19.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-110.6727294921875, -108.36756896972656, -106.0624008178711, -103.75724029541016, -101.45207214355469, -99.14691162109375, -96.84175109863281, -94.53659057617188, -92.2314224243164, -89.92626190185547, -87.62109375, -85.31593322753906, -83.01077270507812, -80.70560455322266, -78.40044403076172, -76.09527587890625, -73.79011535644531, -71.48495483398438, -69.1797866821289, -66.87462615966797, -64.5694580078125, -62.26429748535156, -59.959136962890625, -57.65397262573242, -55.34880828857422, -53.043643951416016, -50.73847961425781, -48.433319091796875, -46.12815475463867, -43.82299041748047, -41.51782989501953, -39.21266555786133, -36.907493591308594, -34.60232925415039, -32.29716491699219, -29.99200439453125, -27.686840057373047, -25.381675720214844, -23.076513290405273, -20.771350860595703, -18.4661865234375, -16.161022186279297, -13.855859756469727, -11.55069637298584, -9.245532989501953, -6.940369606018066, -4.63520622253418, -2.3300437927246094, -0.02487945556640625, 2.2802839279174805, 4.585447311401367, 6.890610694885254, 9.19577407836914, 11.500937461853027, 13.806100845336914, 16.111263275146484, 18.416427612304688, 20.72159194946289, 23.02675437927246, 25.33191680908203, 27.637081146240234, 29.942245483398438, 32.247406005859375, 34.55257034301758, 36.85773468017578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 1.0, 4.0, 9.0, 3.0, 6.0, 6.0, 10.0, 14.0, 17.0, 15.0, 25.0, 30.0, 32.0, 30.0, 32.0, 41.0, 49.0, 47.0, 57.0, 53.0, 52.0, 50.0, 49.0, 46.0, 39.0, 39.0, 20.0, 30.0, 21.0, 29.0, 27.0, 18.0, 14.0, 21.0, 10.0, 9.0, 13.0, 6.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-36.22459411621094, -35.073638916015625, -33.92268753051758, -32.771732330322266, -31.620779037475586, -30.469825744628906, -29.318872451782227, -28.167919158935547, -27.016963958740234, -25.866010665893555, -24.715057373046875, -23.564102172851562, -22.413148880004883, -21.262195587158203, -20.111242294311523, -18.960289001464844, -17.809335708618164, -16.658382415771484, -15.507428169250488, -14.356474876403809, -13.205520629882812, -12.054567337036133, -10.903614044189453, -9.752659797668457, -8.601706504821777, -7.4507527351379395, -6.299798965454102, -5.148845672607422, -3.997891902923584, -2.846938133239746, -1.6959848403930664, -0.5450305938720703, 0.6059226989746094, 1.7568763494491577, 2.907829999923706, 4.058783531188965, 5.209737300872803, 6.360691070556641, 7.51164436340332, 8.662598609924316, 9.813551902770996, 10.964505195617676, 12.115459442138672, 13.266412734985352, 14.417366027832031, 15.568320274353027, 16.71927261352539, 17.870227813720703, 19.021181106567383, 20.172134399414062, 21.323087692260742, 22.474040985107422, 23.624996185302734, 24.775949478149414, 25.926902770996094, 27.077857971191406, 28.228809356689453, 29.379762649536133, 30.530715942382812, 31.681671142578125, 32.83262252807617, 33.983577728271484, 35.13452911376953, 36.285484313964844, 37.436439514160156]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 11.0, 10.0, 10.0, 13.0, 19.0, 35.0, 31.0, 69.0, 96.0, 143.0, 239.0, 405.0, 717.0, 1496.0, 3381.0, 8745.0, 28986.0, 170189.0, 3806233.0, 133026.0, 25365.0, 7966.0, 3380.0, 1605.0, 826.0, 473.0, 287.0, 185.0, 110.0, 60.0, 52.0, 41.0, 16.0, 18.0, 16.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.572265625, -3.45867919921875, -3.3450927734375, -3.23150634765625, -3.117919921875, -3.00433349609375, -2.8907470703125, -2.77716064453125, -2.66357421875, -2.54998779296875, -2.4364013671875, -2.32281494140625, -2.209228515625, -2.09564208984375, -1.9820556640625, -1.86846923828125, -1.7548828125, -1.64129638671875, -1.5277099609375, -1.41412353515625, -1.300537109375, -1.18695068359375, -1.0733642578125, -0.95977783203125, -0.84619140625, -0.73260498046875, -0.6190185546875, -0.50543212890625, -0.391845703125, -0.27825927734375, -0.1646728515625, -0.05108642578125, 0.0625, 0.17608642578125, 0.2896728515625, 0.40325927734375, 0.516845703125, 0.63043212890625, 0.7440185546875, 0.85760498046875, 0.97119140625, 1.08477783203125, 1.1983642578125, 1.31195068359375, 1.425537109375, 1.53912353515625, 1.6527099609375, 1.76629638671875, 1.8798828125, 1.99346923828125, 2.1070556640625, 2.22064208984375, 2.334228515625, 2.44781494140625, 2.5614013671875, 2.67498779296875, 2.78857421875, 2.90216064453125, 3.0157470703125, 3.12933349609375, 3.242919921875, 3.35650634765625, 3.4700927734375, 3.58367919921875, 3.697265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 4.0, 9.0, 13.0, 20.0, 21.0, 17.0, 30.0, 38.0, 36.0, 80.0, 82.0, 91.0, 84.0, 63.0, 82.0, 69.0, 55.0, 44.0, 31.0, 23.0, 20.0, 21.0, 13.0, 8.0, 11.0, 3.0, 5.0, 3.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.443206787109375, -1.38250732421875, -1.321807861328125, -1.2611083984375, -1.200408935546875, -1.13970947265625, -1.079010009765625, -1.018310546875, -0.957611083984375, -0.89691162109375, -0.836212158203125, -0.7755126953125, -0.714813232421875, -0.65411376953125, -0.593414306640625, -0.53271484375, -0.472015380859375, -0.41131591796875, -0.350616455078125, -0.2899169921875, -0.229217529296875, -0.16851806640625, -0.107818603515625, -0.047119140625, 0.013580322265625, 0.07427978515625, 0.134979248046875, 0.1956787109375, 0.256378173828125, 0.31707763671875, 0.377777099609375, 0.4384765625, 0.499176025390625, 0.55987548828125, 0.620574951171875, 0.6812744140625, 0.741973876953125, 0.80267333984375, 0.863372802734375, 0.924072265625, 0.984771728515625, 1.04547119140625, 1.106170654296875, 1.1668701171875, 1.227569580078125, 1.28826904296875, 1.348968505859375, 1.40966796875, 1.470367431640625, 1.53106689453125, 1.591766357421875, 1.6524658203125, 1.713165283203125, 1.77386474609375, 1.834564208984375, 1.895263671875, 1.955963134765625, 2.01666259765625, 2.077362060546875, 2.1380615234375, 2.198760986328125, 2.25946044921875, 2.320159912109375, 2.380859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 9.0, 15.0, 15.0, 19.0, 34.0, 46.0, 57.0, 93.0, 131.0, 184.0, 326.0, 427.0, 758.0, 1275.0, 2300.0, 4397.0, 9969.0, 26834.0, 101550.0, 3097057.0, 822614.0, 84293.0, 23659.0, 8854.0, 4033.0, 2118.0, 1187.0, 702.0, 421.0, 294.0, 171.0, 129.0, 92.0, 52.0, 34.0, 31.0, 27.0, 17.0, 14.0, 10.0, 12.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.12109375, -3.016845703125, -2.91259765625, -2.808349609375, -2.7041015625, -2.599853515625, -2.49560546875, -2.391357421875, -2.287109375, -2.182861328125, -2.07861328125, -1.974365234375, -1.8701171875, -1.765869140625, -1.66162109375, -1.557373046875, -1.453125, -1.348876953125, -1.24462890625, -1.140380859375, -1.0361328125, -0.931884765625, -0.82763671875, -0.723388671875, -0.619140625, -0.514892578125, -0.41064453125, -0.306396484375, -0.2021484375, -0.097900390625, 0.00634765625, 0.110595703125, 0.21484375, 0.319091796875, 0.42333984375, 0.527587890625, 0.6318359375, 0.736083984375, 0.84033203125, 0.944580078125, 1.048828125, 1.153076171875, 1.25732421875, 1.361572265625, 1.4658203125, 1.570068359375, 1.67431640625, 1.778564453125, 1.8828125, 1.987060546875, 2.09130859375, 2.195556640625, 2.2998046875, 2.404052734375, 2.50830078125, 2.612548828125, 2.716796875, 2.821044921875, 2.92529296875, 3.029541015625, 3.1337890625, 3.238037109375, 3.34228515625, 3.446533203125, 3.55078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 10.0, 8.0, 22.0, 24.0, 44.0, 92.0, 145.0, 337.0, 2584.0, 361.0, 174.0, 85.0, 51.0, 40.0, 27.0, 12.0, 6.0, 11.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.983184814453125, -0.94879150390625, -0.914398193359375, -0.8800048828125, -0.845611572265625, -0.81121826171875, -0.776824951171875, -0.742431640625, -0.708038330078125, -0.67364501953125, -0.639251708984375, -0.6048583984375, -0.570465087890625, -0.53607177734375, -0.501678466796875, -0.46728515625, -0.432891845703125, -0.39849853515625, -0.364105224609375, -0.3297119140625, -0.295318603515625, -0.26092529296875, -0.226531982421875, -0.192138671875, -0.157745361328125, -0.12335205078125, -0.088958740234375, -0.0545654296875, -0.020172119140625, 0.01422119140625, 0.048614501953125, 0.0830078125, 0.117401123046875, 0.15179443359375, 0.186187744140625, 0.2205810546875, 0.254974365234375, 0.28936767578125, 0.323760986328125, 0.358154296875, 0.392547607421875, 0.42694091796875, 0.461334228515625, 0.4957275390625, 0.530120849609375, 0.56451416015625, 0.598907470703125, 0.63330078125, 0.667694091796875, 0.70208740234375, 0.736480712890625, 0.7708740234375, 0.805267333984375, 0.83966064453125, 0.874053955078125, 0.908447265625, 0.942840576171875, 0.97723388671875, 1.011627197265625, 1.0460205078125, 1.080413818359375, 1.11480712890625, 1.149200439453125, 1.18359375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 16.0, 20.0, 34.0, 36.0, 80.0, 74.0, 110.0, 129.0, 119.0, 112.0, 101.0, 54.0, 40.0, 29.0, 15.0, 14.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6553447246551514, -3.4925971031188965, -3.3298494815826416, -3.1671018600463867, -3.004354476928711, -2.841606616973877, -2.678859233856201, -2.5161116123199463, -2.3533639907836914, -2.1906163692474365, -2.0278687477111816, -1.8651212453842163, -1.7023736238479614, -1.5396260023117065, -1.3768784999847412, -1.2141308784484863, -1.0513832569122314, -0.8886356353759766, -0.7258880734443665, -0.5631405115127563, -0.40039288997650146, -0.23764526844024658, -0.07489770650863647, 0.08784985542297363, 0.2505974769592285, 0.413345068693161, 0.5760926604270935, 0.7388402223587036, 0.9015878438949585, 1.0643354654312134, 1.2270829677581787, 1.3898305892944336, 1.5525779724121094, 1.7153255939483643, 1.8780732154846191, 2.040820837020874, 2.203568458557129, 2.3663158416748047, 2.5290634632110596, 2.6918110847473145, 2.8545587062835693, 3.017306327819824, 3.180053949356079, 3.342801570892334, 3.5055489540100098, 3.6682968139648438, 3.8310441970825195, 3.9937918186187744, 4.156539440155029, 4.319286823272705, 4.482034683227539, 4.644782066345215, 4.807529926300049, 4.970277309417725, 5.133025169372559, 5.295772552490234, 5.45851993560791, 5.621267318725586, 5.78401517868042, 5.946762561798096, 6.10951042175293, 6.2722578048706055, 6.4350056648254395, 6.597753047943115, 6.760500907897949]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 9.0, 14.0, 17.0, 18.0, 19.0, 20.0, 20.0, 26.0, 30.0, 32.0, 34.0, 39.0, 40.0, 37.0, 32.0, 43.0, 33.0, 50.0, 49.0, 35.0, 44.0, 47.0, 35.0, 41.0, 28.0, 22.0, 35.0, 23.0, 22.0, 17.0, 16.0, 10.0, 8.0, 7.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.909581184387207, -2.8189187049865723, -2.7282564640045166, -2.637593984603882, -2.546931505203247, -2.4562692642211914, -2.3656067848205566, -2.274944305419922, -2.184282064437866, -2.0936195850372314, -2.002957344055176, -1.912294864654541, -1.8216325044631958, -1.7309701442718506, -1.6403076648712158, -1.5496453046798706, -1.4589828252792358, -1.3683204650878906, -1.2776579856872559, -1.1869956254959106, -1.0963332653045654, -1.0056707859039307, -0.9150084257125854, -0.8243460655212402, -0.7336836457252502, -0.6430212259292603, -0.552358865737915, -0.46169644594192505, -0.37103405594825745, -0.28037166595458984, -0.18970924615859985, -0.09904688596725464, -0.008384466171264648, 0.08227793127298355, 0.17294032871723175, 0.26360273361206055, 0.35426512360572815, 0.44492751359939575, 0.5355899333953857, 0.626252293586731, 0.716914713382721, 0.8075771331787109, 0.8982394933700562, 0.9889019131660461, 1.0795643329620361, 1.1702266931533813, 1.2608890533447266, 1.3515515327453613, 1.4422138929367065, 1.5328762531280518, 1.6235387325286865, 1.7142010927200317, 1.804863452911377, 1.8955259323120117, 1.986188292503357, 2.076850652694702, 2.167513132095337, 2.2581756114959717, 2.3488378524780273, 2.439500331878662, 2.530162811279297, 2.6208250522613525, 2.7114875316619873, 2.802149772644043, 2.8928122520446777]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 3.0, 9.0, 11.0, 20.0, 43.0, 55.0, 72.0, 149.0, 237.0, 445.0, 895.0, 2155.0, 5516.0, 16982.0, 63501.0, 256305.0, 454180.0, 183616.0, 44197.0, 12504.0, 4327.0, 1662.0, 779.0, 383.0, 193.0, 116.0, 67.0, 37.0, 28.0, 19.0, 21.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.934783935546875, -3.82659912109375, -3.718414306640625, -3.6102294921875, -3.502044677734375, -3.39385986328125, -3.285675048828125, -3.177490234375, -3.069305419921875, -2.96112060546875, -2.852935791015625, -2.7447509765625, -2.636566162109375, -2.52838134765625, -2.420196533203125, -2.31201171875, -2.203826904296875, -2.09564208984375, -1.987457275390625, -1.8792724609375, -1.771087646484375, -1.66290283203125, -1.554718017578125, -1.446533203125, -1.338348388671875, -1.23016357421875, -1.121978759765625, -1.0137939453125, -0.905609130859375, -0.79742431640625, -0.689239501953125, -0.5810546875, -0.472869873046875, -0.36468505859375, -0.256500244140625, -0.1483154296875, -0.040130615234375, 0.06805419921875, 0.176239013671875, 0.284423828125, 0.392608642578125, 0.50079345703125, 0.608978271484375, 0.7171630859375, 0.825347900390625, 0.93353271484375, 1.041717529296875, 1.14990234375, 1.258087158203125, 1.36627197265625, 1.474456787109375, 1.5826416015625, 1.690826416015625, 1.79901123046875, 1.907196044921875, 2.015380859375, 2.123565673828125, 2.23175048828125, 2.339935302734375, 2.4481201171875, 2.556304931640625, 2.66448974609375, 2.772674560546875, 2.880859375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 10.0, 18.0, 10.0, 17.0, 20.0, 27.0, 35.0, 54.0, 55.0, 89.0, 87.0, 70.0, 93.0, 66.0, 66.0, 49.0, 54.0, 38.0, 24.0, 27.0, 18.0, 8.0, 16.0, 10.0, 6.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.373199462890625, -1.31085205078125, -1.248504638671875, -1.1861572265625, -1.123809814453125, -1.06146240234375, -0.999114990234375, -0.936767578125, -0.874420166015625, -0.81207275390625, -0.749725341796875, -0.6873779296875, -0.625030517578125, -0.56268310546875, -0.500335693359375, -0.43798828125, -0.375640869140625, -0.31329345703125, -0.250946044921875, -0.1885986328125, -0.126251220703125, -0.06390380859375, -0.001556396484375, 0.060791015625, 0.123138427734375, 0.18548583984375, 0.247833251953125, 0.3101806640625, 0.372528076171875, 0.43487548828125, 0.497222900390625, 0.5595703125, 0.621917724609375, 0.68426513671875, 0.746612548828125, 0.8089599609375, 0.871307373046875, 0.93365478515625, 0.996002197265625, 1.058349609375, 1.120697021484375, 1.18304443359375, 1.245391845703125, 1.3077392578125, 1.370086669921875, 1.43243408203125, 1.494781494140625, 1.55712890625, 1.619476318359375, 1.68182373046875, 1.744171142578125, 1.8065185546875, 1.868865966796875, 1.93121337890625, 1.993560791015625, 2.055908203125, 2.118255615234375, 2.18060302734375, 2.242950439453125, 2.3052978515625, 2.367645263671875, 2.42999267578125, 2.492340087890625, 2.5546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 6.0, 7.0, 6.0, 10.0, 16.0, 27.0, 20.0, 31.0, 84.0, 98.0, 186.0, 317.0, 706.0, 1906.0, 7892.0, 108199.0, 844149.0, 75193.0, 6605.0, 1650.0, 678.0, 306.0, 166.0, 109.0, 71.0, 34.0, 21.0, 16.0, 10.0, 11.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12109375, -6.84124755859375, -6.5614013671875, -6.28155517578125, -6.001708984375, -5.72186279296875, -5.4420166015625, -5.16217041015625, -4.88232421875, -4.60247802734375, -4.3226318359375, -4.04278564453125, -3.762939453125, -3.48309326171875, -3.2032470703125, -2.92340087890625, -2.6435546875, -2.36370849609375, -2.0838623046875, -1.80401611328125, -1.524169921875, -1.24432373046875, -0.9644775390625, -0.68463134765625, -0.40478515625, -0.12493896484375, 0.1549072265625, 0.43475341796875, 0.714599609375, 0.99444580078125, 1.2742919921875, 1.55413818359375, 1.833984375, 2.11383056640625, 2.3936767578125, 2.67352294921875, 2.953369140625, 3.23321533203125, 3.5130615234375, 3.79290771484375, 4.07275390625, 4.35260009765625, 4.6324462890625, 4.91229248046875, 5.192138671875, 5.47198486328125, 5.7518310546875, 6.03167724609375, 6.3115234375, 6.59136962890625, 6.8712158203125, 7.15106201171875, 7.430908203125, 7.71075439453125, 7.9906005859375, 8.27044677734375, 8.55029296875, 8.83013916015625, 9.1099853515625, 9.38983154296875, 9.669677734375, 9.94952392578125, 10.2293701171875, 10.50921630859375, 10.7890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 4.0, 5.0, 2.0, 16.0, 10.0, 14.0, 10.0, 18.0, 20.0, 30.0, 29.0, 28.0, 32.0, 52.0, 43.0, 53.0, 55.0, 59.0, 51.0, 51.0, 56.0, 50.0, 46.0, 41.0, 36.0, 29.0, 30.0, 17.0, 23.0, 12.0, 13.0, 12.0, 2.0, 6.0, 5.0, 12.0, 3.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.850341796875, -7.58349609375, -7.316650390625, -7.0498046875, -6.782958984375, -6.51611328125, -6.249267578125, -5.982421875, -5.715576171875, -5.44873046875, -5.181884765625, -4.9150390625, -4.648193359375, -4.38134765625, -4.114501953125, -3.84765625, -3.580810546875, -3.31396484375, -3.047119140625, -2.7802734375, -2.513427734375, -2.24658203125, -1.979736328125, -1.712890625, -1.446044921875, -1.17919921875, -0.912353515625, -0.6455078125, -0.378662109375, -0.11181640625, 0.155029296875, 0.421875, 0.688720703125, 0.95556640625, 1.222412109375, 1.4892578125, 1.756103515625, 2.02294921875, 2.289794921875, 2.556640625, 2.823486328125, 3.09033203125, 3.357177734375, 3.6240234375, 3.890869140625, 4.15771484375, 4.424560546875, 4.69140625, 4.958251953125, 5.22509765625, 5.491943359375, 5.7587890625, 6.025634765625, 6.29248046875, 6.559326171875, 6.826171875, 7.093017578125, 7.35986328125, 7.626708984375, 7.8935546875, 8.160400390625, 8.42724609375, 8.694091796875, 8.9609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 11.0, 19.0, 13.0, 21.0, 40.0, 76.0, 128.0, 225.0, 532.0, 2032.0, 21149.0, 943297.0, 76102.0, 3434.0, 782.0, 319.0, 134.0, 76.0, 44.0, 43.0, 22.0, 11.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.1788330078125, -7.935791015625, -7.6927490234375, -7.44970703125, -7.2066650390625, -6.963623046875, -6.7205810546875, -6.4775390625, -6.2344970703125, -5.991455078125, -5.7484130859375, -5.50537109375, -5.2623291015625, -5.019287109375, -4.7762451171875, -4.533203125, -4.2901611328125, -4.047119140625, -3.8040771484375, -3.56103515625, -3.3179931640625, -3.074951171875, -2.8319091796875, -2.5888671875, -2.3458251953125, -2.102783203125, -1.8597412109375, -1.61669921875, -1.3736572265625, -1.130615234375, -0.8875732421875, -0.64453125, -0.4014892578125, -0.158447265625, 0.0845947265625, 0.32763671875, 0.5706787109375, 0.813720703125, 1.0567626953125, 1.2998046875, 1.5428466796875, 1.785888671875, 2.0289306640625, 2.27197265625, 2.5150146484375, 2.758056640625, 3.0010986328125, 3.244140625, 3.4871826171875, 3.730224609375, 3.9732666015625, 4.21630859375, 4.4593505859375, 4.702392578125, 4.9454345703125, 5.1884765625, 5.4315185546875, 5.674560546875, 5.9176025390625, 6.16064453125, 6.4036865234375, 6.646728515625, 6.8897705078125, 7.1328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 0.0, 4.0, 4.0, 13.0, 10.0, 9.0, 17.0, 30.0, 18.0, 53.0, 52.0, 59.0, 60.0, 75.0, 95.0, 88.0, 90.0, 63.0, 66.0, 39.0, 31.0, 24.0, 20.0, 13.0, 18.0, 8.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00039005279541015625, -0.0003789253532886505, -0.0003677979111671448, -0.00035667046904563904, -0.0003455430269241333, -0.00033441558480262756, -0.0003232881426811218, -0.0003121607005596161, -0.00030103325843811035, -0.0002899058163166046, -0.0002787783741950989, -0.00026765093207359314, -0.0002565234899520874, -0.00024539604783058167, -0.00023426860570907593, -0.0002231411635875702, -0.00021201372146606445, -0.00020088627934455872, -0.00018975883722305298, -0.00017863139510154724, -0.0001675039529800415, -0.00015637651085853577, -0.00014524906873703003, -0.0001341216266155243, -0.00012299418449401855, -0.00011186674237251282, -0.00010073930025100708, -8.961185812950134e-05, -7.84844160079956e-05, -6.735697388648987e-05, -5.622953176498413e-05, -4.5102089643478394e-05, -3.3974647521972656e-05, -2.284720540046692e-05, -1.1719763278961182e-05, -5.923211574554443e-07, 1.0535120964050293e-05, 2.166256308555603e-05, 3.279000520706177e-05, 4.3917447328567505e-05, 5.504488945007324e-05, 6.617233157157898e-05, 7.729977369308472e-05, 8.842721581459045e-05, 9.955465793609619e-05, 0.00011068210005760193, 0.00012180954217910767, 0.0001329369843006134, 0.00014406442642211914, 0.00015519186854362488, 0.00016631931066513062, 0.00017744675278663635, 0.0001885741949081421, 0.00019970163702964783, 0.00021082907915115356, 0.0002219565212726593, 0.00023308396339416504, 0.0002442114055156708, 0.0002553388476371765, 0.00026646628975868225, 0.000277593731880188, 0.0002887211740016937, 0.00029984861612319946, 0.0003109760582447052, 0.00032210350036621094]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 15.0, 20.0, 36.0, 77.0, 216.0, 465.0, 1481.0, 8209.0, 384275.0, 639827.0, 11236.0, 1780.0, 517.0, 216.0, 92.0, 37.0, 15.0, 7.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.211669921875, -7.01708984375, -6.822509765625, -6.6279296875, -6.433349609375, -6.23876953125, -6.044189453125, -5.849609375, -5.655029296875, -5.46044921875, -5.265869140625, -5.0712890625, -4.876708984375, -4.68212890625, -4.487548828125, -4.29296875, -4.098388671875, -3.90380859375, -3.709228515625, -3.5146484375, -3.320068359375, -3.12548828125, -2.930908203125, -2.736328125, -2.541748046875, -2.34716796875, -2.152587890625, -1.9580078125, -1.763427734375, -1.56884765625, -1.374267578125, -1.1796875, -0.985107421875, -0.79052734375, -0.595947265625, -0.4013671875, -0.206787109375, -0.01220703125, 0.182373046875, 0.376953125, 0.571533203125, 0.76611328125, 0.960693359375, 1.1552734375, 1.349853515625, 1.54443359375, 1.739013671875, 1.93359375, 2.128173828125, 2.32275390625, 2.517333984375, 2.7119140625, 2.906494140625, 3.10107421875, 3.295654296875, 3.490234375, 3.684814453125, 3.87939453125, 4.073974609375, 4.2685546875, 4.463134765625, 4.65771484375, 4.852294921875, 5.046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 10.0, 18.0, 24.0, 50.0, 100.0, 221.0, 269.0, 168.0, 85.0, 31.0, 15.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4296875, -11.1524658203125, -10.875244140625, -10.5980224609375, -10.32080078125, -10.0435791015625, -9.766357421875, -9.4891357421875, -9.2119140625, -8.9346923828125, -8.657470703125, -8.3802490234375, -8.10302734375, -7.8258056640625, -7.548583984375, -7.2713623046875, -6.994140625, -6.7169189453125, -6.439697265625, -6.1624755859375, -5.88525390625, -5.6080322265625, -5.330810546875, -5.0535888671875, -4.7763671875, -4.4991455078125, -4.221923828125, -3.9447021484375, -3.66748046875, -3.3902587890625, -3.113037109375, -2.8358154296875, -2.55859375, -2.2813720703125, -2.004150390625, -1.7269287109375, -1.44970703125, -1.1724853515625, -0.895263671875, -0.6180419921875, -0.3408203125, -0.0635986328125, 0.213623046875, 0.4908447265625, 0.76806640625, 1.0452880859375, 1.322509765625, 1.5997314453125, 1.876953125, 2.1541748046875, 2.431396484375, 2.7086181640625, 2.98583984375, 3.2630615234375, 3.540283203125, 3.8175048828125, 4.0947265625, 4.3719482421875, 4.649169921875, 4.9263916015625, 5.20361328125, 5.4808349609375, 5.758056640625, 6.0352783203125, 6.3125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 22.0, 49.0, 109.0, 247.0, 250.0, 194.0, 89.0, 23.0, 11.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.743690490722656, -41.84067916870117, -38.93766784667969, -36.03466033935547, -33.131649017333984, -30.2286376953125, -27.32562828063965, -24.422618865966797, -21.519607543945312, -18.616596221923828, -15.713586807250977, -12.810576438903809, -9.90756607055664, -7.004555702209473, -4.101545333862305, -1.1985359191894531, 1.7044754028320312, 4.607485771179199, 7.510496139526367, 10.413506507873535, 13.316516876220703, 16.219528198242188, 19.12253761291504, 22.02554702758789, 24.928558349609375, 27.83156967163086, 30.73457908630371, 33.63758850097656, 36.54059982299805, 39.44361114501953, 42.34661865234375, 45.249629974365234, 48.15264892578125, 51.055660247802734, 53.95867156982422, 56.86167907714844, 59.76469039916992, 62.667701721191406, 65.57070922851562, 68.47372436523438, 71.3767318725586, 74.27973937988281, 77.18275451660156, 80.08576202392578, 82.98876953125, 85.89178466796875, 88.79479217529297, 91.69779968261719, 94.60081481933594, 97.50382232666016, 100.4068374633789, 103.30984497070312, 106.21286010742188, 109.1158676147461, 112.01887512207031, 114.92189025878906, 117.82489776611328, 120.7279052734375, 123.63092041015625, 126.53392791748047, 129.4369354248047, 132.33995056152344, 135.2429656982422, 138.14596557617188, 141.04898071289062]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 5.0, 8.0, 6.0, 20.0, 12.0, 17.0, 14.0, 23.0, 30.0, 32.0, 37.0, 39.0, 44.0, 40.0, 54.0, 45.0, 71.0, 47.0, 53.0, 27.0, 42.0, 51.0, 48.0, 37.0, 38.0, 21.0, 26.0, 20.0, 13.0, 16.0, 10.0, 15.0, 10.0, 12.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.98225402832031, -36.763214111328125, -35.5441780090332, -34.325138092041016, -33.106101989746094, -31.887062072753906, -30.66802406311035, -29.448986053466797, -28.229948043823242, -27.010910034179688, -25.791872024536133, -24.572834014892578, -23.35379409790039, -22.13475799560547, -20.91571807861328, -19.696680068969727, -18.477642059326172, -17.258604049682617, -16.039566040039062, -14.820527076721191, -13.601489067077637, -12.382451057434082, -11.163412094116211, -9.944374084472656, -8.725336074829102, -7.506298065185547, -6.287259578704834, -5.068221092224121, -3.8491830825805664, -2.6301450729370117, -1.4111065864562988, -0.19206809997558594, 1.0269660949707031, 2.246004343032837, 3.4650425910949707, 4.684081077575684, 5.903119087219238, 7.122157096862793, 8.341196060180664, 9.560234069824219, 10.779272079467773, 11.998310089111328, 13.217348098754883, 14.436387062072754, 15.655425071716309, 16.874462127685547, 18.093502044677734, 19.31254005432129, 20.531578063964844, 21.7506160736084, 22.969654083251953, 24.188692092895508, 25.407730102539062, 26.62677001953125, 27.845808029174805, 29.06484603881836, 30.283884048461914, 31.50292205810547, 32.721961975097656, 33.94099807739258, 35.160037994384766, 36.37907409667969, 37.598114013671875, 38.81715393066406, 40.036190032958984]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 9.0, 9.0, 23.0, 29.0, 44.0, 65.0, 103.0, 193.0, 372.0, 759.0, 1815.0, 5654.0, 31160.0, 4000748.0, 134583.0, 12913.0, 3291.0, 1242.0, 586.0, 268.0, 144.0, 96.0, 60.0, 34.0, 19.0, 15.0, 12.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.81640625, -6.57940673828125, -6.3424072265625, -6.10540771484375, -5.868408203125, -5.63140869140625, -5.3944091796875, -5.15740966796875, -4.92041015625, -4.68341064453125, -4.4464111328125, -4.20941162109375, -3.972412109375, -3.73541259765625, -3.4984130859375, -3.26141357421875, -3.0244140625, -2.78741455078125, -2.5504150390625, -2.31341552734375, -2.076416015625, -1.83941650390625, -1.6024169921875, -1.36541748046875, -1.12841796875, -0.89141845703125, -0.6544189453125, -0.41741943359375, -0.180419921875, 0.05657958984375, 0.2935791015625, 0.53057861328125, 0.767578125, 1.00457763671875, 1.2415771484375, 1.47857666015625, 1.715576171875, 1.95257568359375, 2.1895751953125, 2.42657470703125, 2.66357421875, 2.90057373046875, 3.1375732421875, 3.37457275390625, 3.611572265625, 3.84857177734375, 4.0855712890625, 4.32257080078125, 4.5595703125, 4.79656982421875, 5.0335693359375, 5.27056884765625, 5.507568359375, 5.74456787109375, 5.9815673828125, 6.21856689453125, 6.45556640625, 6.69256591796875, 6.9295654296875, 7.16656494140625, 7.403564453125, 7.64056396484375, 7.8775634765625, 8.11456298828125, 8.3515625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 10.0, 8.0, 8.0, 12.0, 16.0, 19.0, 23.0, 42.0, 54.0, 57.0, 53.0, 93.0, 94.0, 73.0, 77.0, 71.0, 62.0, 57.0, 30.0, 30.0, 28.0, 15.0, 11.0, 9.0, 13.0, 7.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.771484375, -1.701324462890625, -1.63116455078125, -1.561004638671875, -1.4908447265625, -1.420684814453125, -1.35052490234375, -1.280364990234375, -1.210205078125, -1.140045166015625, -1.06988525390625, -0.999725341796875, -0.9295654296875, -0.859405517578125, -0.78924560546875, -0.719085693359375, -0.64892578125, -0.578765869140625, -0.50860595703125, -0.438446044921875, -0.3682861328125, -0.298126220703125, -0.22796630859375, -0.157806396484375, -0.087646484375, -0.017486572265625, 0.05267333984375, 0.122833251953125, 0.1929931640625, 0.263153076171875, 0.33331298828125, 0.403472900390625, 0.4736328125, 0.543792724609375, 0.61395263671875, 0.684112548828125, 0.7542724609375, 0.824432373046875, 0.89459228515625, 0.964752197265625, 1.034912109375, 1.105072021484375, 1.17523193359375, 1.245391845703125, 1.3155517578125, 1.385711669921875, 1.45587158203125, 1.526031494140625, 1.59619140625, 1.666351318359375, 1.73651123046875, 1.806671142578125, 1.8768310546875, 1.946990966796875, 2.01715087890625, 2.087310791015625, 2.157470703125, 2.227630615234375, 2.29779052734375, 2.367950439453125, 2.4381103515625, 2.508270263671875, 2.57843017578125, 2.648590087890625, 2.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 10.0, 7.0, 20.0, 15.0, 37.0, 45.0, 55.0, 76.0, 114.0, 206.0, 303.0, 623.0, 1031.0, 2230.0, 5400.0, 16240.0, 76045.0, 3770703.0, 272031.0, 32970.0, 9197.0, 3462.0, 1587.0, 757.0, 401.0, 262.0, 161.0, 106.0, 58.0, 43.0, 24.0, 19.0, 17.0, 14.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.53277587890625, -5.3780517578125, -5.22332763671875, -5.068603515625, -4.91387939453125, -4.7591552734375, -4.60443115234375, -4.44970703125, -4.29498291015625, -4.1402587890625, -3.98553466796875, -3.830810546875, -3.67608642578125, -3.5213623046875, -3.36663818359375, -3.2119140625, -3.05718994140625, -2.9024658203125, -2.74774169921875, -2.593017578125, -2.43829345703125, -2.2835693359375, -2.12884521484375, -1.97412109375, -1.81939697265625, -1.6646728515625, -1.50994873046875, -1.355224609375, -1.20050048828125, -1.0457763671875, -0.89105224609375, -0.736328125, -0.58160400390625, -0.4268798828125, -0.27215576171875, -0.117431640625, 0.03729248046875, 0.1920166015625, 0.34674072265625, 0.50146484375, 0.65618896484375, 0.8109130859375, 0.96563720703125, 1.120361328125, 1.27508544921875, 1.4298095703125, 1.58453369140625, 1.7392578125, 1.89398193359375, 2.0487060546875, 2.20343017578125, 2.358154296875, 2.51287841796875, 2.6676025390625, 2.82232666015625, 2.97705078125, 3.13177490234375, 3.2864990234375, 3.44122314453125, 3.595947265625, 3.75067138671875, 3.9053955078125, 4.06011962890625, 4.21484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 12.0, 24.0, 31.0, 49.0, 61.0, 140.0, 359.0, 2900.0, 220.0, 95.0, 60.0, 22.0, 22.0, 19.0, 12.0, 6.0, 5.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.4423828125, -1.4048004150390625, -1.367218017578125, -1.3296356201171875, -1.29205322265625, -1.2544708251953125, -1.216888427734375, -1.1793060302734375, -1.1417236328125, -1.1041412353515625, -1.066558837890625, -1.0289764404296875, -0.99139404296875, -0.9538116455078125, -0.916229248046875, -0.8786468505859375, -0.841064453125, -0.8034820556640625, -0.765899658203125, -0.7283172607421875, -0.69073486328125, -0.6531524658203125, -0.615570068359375, -0.5779876708984375, -0.5404052734375, -0.5028228759765625, -0.465240478515625, -0.4276580810546875, -0.39007568359375, -0.3524932861328125, -0.314910888671875, -0.2773284912109375, -0.23974609375, -0.2021636962890625, -0.164581298828125, -0.1269989013671875, -0.08941650390625, -0.0518341064453125, -0.014251708984375, 0.0233306884765625, 0.0609130859375, 0.0984954833984375, 0.136077880859375, 0.1736602783203125, 0.21124267578125, 0.2488250732421875, 0.286407470703125, 0.3239898681640625, 0.361572265625, 0.3991546630859375, 0.436737060546875, 0.4743194580078125, 0.51190185546875, 0.5494842529296875, 0.587066650390625, 0.6246490478515625, 0.6622314453125, 0.6998138427734375, 0.737396240234375, 0.7749786376953125, 0.81256103515625, 0.8501434326171875, 0.887725830078125, 0.9253082275390625, 0.962890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 30.0, 74.0, 155.0, 305.0, 275.0, 108.0, 33.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.323867797851562, -12.884834289550781, -12.44580078125, -12.006767272949219, -11.567733764648438, -11.128700256347656, -10.689666748046875, -10.250633239746094, -9.811599731445312, -9.372566223144531, -8.93353271484375, -8.494499206542969, -8.055465698242188, -7.616432189941406, -7.177398681640625, -6.738365173339844, -6.2993316650390625, -5.860298156738281, -5.4212646484375, -4.982231140136719, -4.5431976318359375, -4.104164123535156, -3.665130615234375, -3.2260971069335938, -2.7870635986328125, -2.3480300903320312, -1.90899658203125, -1.4699630737304688, -1.0309295654296875, -0.5918960571289062, -0.152862548828125, 0.28617095947265625, 0.7252035140991211, 1.1642370223999023, 1.6032705307006836, 2.042304039001465, 2.481337547302246, 2.9203710556030273, 3.3594045639038086, 3.79843807220459, 4.237471580505371, 4.676505088806152, 5.115538597106934, 5.554572105407715, 5.993605613708496, 6.432639122009277, 6.871672630310059, 7.31070613861084, 7.749739646911621, 8.188773155212402, 8.627806663513184, 9.066840171813965, 9.505873680114746, 9.944907188415527, 10.383940696716309, 10.82297420501709, 11.262007713317871, 11.701041221618652, 12.140074729919434, 12.579108238220215, 13.018141746520996, 13.457175254821777, 13.896208763122559, 14.33524227142334, 14.774275779724121]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 13.0, 8.0, 3.0, 6.0, 13.0, 12.0, 13.0, 15.0, 18.0, 30.0, 32.0, 29.0, 27.0, 33.0, 39.0, 38.0, 30.0, 32.0, 36.0, 41.0, 37.0, 36.0, 32.0, 43.0, 37.0, 33.0, 27.0, 37.0, 26.0, 29.0, 22.0, 20.0, 28.0, 28.0, 14.0, 19.0, 15.0, 8.0, 12.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.726691722869873, -3.6079018115997314, -3.48911190032959, -3.3703219890594482, -3.2515320777893066, -3.132742166519165, -3.0139522552490234, -2.8951621055603027, -2.7763724327087402, -2.6575825214385986, -2.538792610168457, -2.4200026988983154, -2.301212787628174, -2.1824228763580322, -2.0636329650878906, -1.9448429346084595, -1.8260529041290283, -1.7072629928588867, -1.5884730815887451, -1.4696831703186035, -1.350893259048462, -1.2321033477783203, -1.1133133172988892, -0.9945234060287476, -0.875733494758606, -0.7569435834884644, -0.6381536722183228, -0.5193637013435364, -0.4005737900733948, -0.2817838788032532, -0.1629939079284668, -0.044203996658325195, 0.0745859146118164, 0.1933758407831192, 0.312165766954422, 0.430955708026886, 0.5497456192970276, 0.6685355305671692, 0.7873255014419556, 0.9061154127120972, 1.0249053239822388, 1.1436952352523804, 1.262485146522522, 1.3812751770019531, 1.5000650882720947, 1.6188549995422363, 1.737644910812378, 1.8564348220825195, 1.9752247333526611, 2.0940146446228027, 2.2128045558929443, 2.331594467163086, 2.4503843784332275, 2.569174289703369, 2.68796443939209, 2.8067541122436523, 2.925544261932373, 3.0443341732025146, 3.1631240844726562, 3.281913995742798, 3.4007039070129395, 3.519493818283081, 3.6382837295532227, 3.7570738792419434, 3.875863552093506]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 13.0, 12.0, 24.0, 65.0, 68.0, 127.0, 181.0, 382.0, 786.0, 1983.0, 5633.0, 22796.0, 141877.0, 604087.0, 225137.0, 33400.0, 7601.0, 2384.0, 942.0, 464.0, 249.0, 129.0, 76.0, 51.0, 34.0, 21.0, 7.0, 9.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.07269287109375, -2.9305419921875, -2.78839111328125, -2.646240234375, -2.50408935546875, -2.3619384765625, -2.21978759765625, -2.07763671875, -1.93548583984375, -1.7933349609375, -1.65118408203125, -1.509033203125, -1.36688232421875, -1.2247314453125, -1.08258056640625, -0.9404296875, -0.79827880859375, -0.6561279296875, -0.51397705078125, -0.371826171875, -0.22967529296875, -0.0875244140625, 0.05462646484375, 0.19677734375, 0.33892822265625, 0.4810791015625, 0.62322998046875, 0.765380859375, 0.90753173828125, 1.0496826171875, 1.19183349609375, 1.333984375, 1.47613525390625, 1.6182861328125, 1.76043701171875, 1.902587890625, 2.04473876953125, 2.1868896484375, 2.32904052734375, 2.47119140625, 2.61334228515625, 2.7554931640625, 2.89764404296875, 3.039794921875, 3.18194580078125, 3.3240966796875, 3.46624755859375, 3.6083984375, 3.75054931640625, 3.8927001953125, 4.03485107421875, 4.177001953125, 4.31915283203125, 4.4613037109375, 4.60345458984375, 4.74560546875, 4.88775634765625, 5.0299072265625, 5.17205810546875, 5.314208984375, 5.45635986328125, 5.5985107421875, 5.74066162109375, 5.8828125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 12.0, 12.0, 16.0, 14.0, 22.0, 24.0, 35.0, 41.0, 55.0, 60.0, 63.0, 89.0, 72.0, 74.0, 65.0, 64.0, 41.0, 46.0, 37.0, 37.0, 22.0, 15.0, 16.0, 18.0, 10.0, 8.0, 4.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.076171875, -2.006683349609375, -1.93719482421875, -1.867706298828125, -1.7982177734375, -1.728729248046875, -1.65924072265625, -1.589752197265625, -1.520263671875, -1.450775146484375, -1.38128662109375, -1.311798095703125, -1.2423095703125, -1.172821044921875, -1.10333251953125, -1.033843994140625, -0.96435546875, -0.894866943359375, -0.82537841796875, -0.755889892578125, -0.6864013671875, -0.616912841796875, -0.54742431640625, -0.477935791015625, -0.408447265625, -0.338958740234375, -0.26947021484375, -0.199981689453125, -0.1304931640625, -0.061004638671875, 0.00848388671875, 0.077972412109375, 0.1474609375, 0.216949462890625, 0.28643798828125, 0.355926513671875, 0.4254150390625, 0.494903564453125, 0.56439208984375, 0.633880615234375, 0.703369140625, 0.772857666015625, 0.84234619140625, 0.911834716796875, 0.9813232421875, 1.050811767578125, 1.12030029296875, 1.189788818359375, 1.25927734375, 1.328765869140625, 1.39825439453125, 1.467742919921875, 1.5372314453125, 1.606719970703125, 1.67620849609375, 1.745697021484375, 1.815185546875, 1.884674072265625, 1.95416259765625, 2.023651123046875, 2.0931396484375, 2.162628173828125, 2.23211669921875, 2.301605224609375, 2.37109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 9.0, 10.0, 7.0, 11.0, 18.0, 25.0, 47.0, 47.0, 77.0, 83.0, 115.0, 168.0, 303.0, 428.0, 691.0, 1320.0, 3187.0, 12834.0, 122958.0, 716636.0, 166506.0, 15910.0, 3527.0, 1431.0, 764.0, 480.0, 273.0, 192.0, 150.0, 87.0, 68.0, 48.0, 31.0, 21.0, 18.0, 16.0, 11.0, 10.0, 11.0, 8.0, 1.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.4375, -5.26519775390625, -5.0928955078125, -4.92059326171875, -4.748291015625, -4.57598876953125, -4.4036865234375, -4.23138427734375, -4.05908203125, -3.88677978515625, -3.7144775390625, -3.54217529296875, -3.369873046875, -3.19757080078125, -3.0252685546875, -2.85296630859375, -2.6806640625, -2.50836181640625, -2.3360595703125, -2.16375732421875, -1.991455078125, -1.81915283203125, -1.6468505859375, -1.47454833984375, -1.30224609375, -1.12994384765625, -0.9576416015625, -0.78533935546875, -0.613037109375, -0.44073486328125, -0.2684326171875, -0.09613037109375, 0.076171875, 0.24847412109375, 0.4207763671875, 0.59307861328125, 0.765380859375, 0.93768310546875, 1.1099853515625, 1.28228759765625, 1.45458984375, 1.62689208984375, 1.7991943359375, 1.97149658203125, 2.143798828125, 2.31610107421875, 2.4884033203125, 2.66070556640625, 2.8330078125, 3.00531005859375, 3.1776123046875, 3.34991455078125, 3.522216796875, 3.69451904296875, 3.8668212890625, 4.03912353515625, 4.21142578125, 4.38372802734375, 4.5560302734375, 4.72833251953125, 4.900634765625, 5.07293701171875, 5.2452392578125, 5.41754150390625, 5.58984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 5.0, 1.0, 11.0, 11.0, 11.0, 15.0, 15.0, 11.0, 29.0, 26.0, 26.0, 41.0, 41.0, 38.0, 39.0, 45.0, 53.0, 52.0, 49.0, 61.0, 58.0, 45.0, 40.0, 46.0, 39.0, 34.0, 23.0, 16.0, 23.0, 19.0, 14.0, 17.0, 13.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.40625, -8.12255859375, -7.8388671875, -7.55517578125, -7.271484375, -6.98779296875, -6.7041015625, -6.42041015625, -6.13671875, -5.85302734375, -5.5693359375, -5.28564453125, -5.001953125, -4.71826171875, -4.4345703125, -4.15087890625, -3.8671875, -3.58349609375, -3.2998046875, -3.01611328125, -2.732421875, -2.44873046875, -2.1650390625, -1.88134765625, -1.59765625, -1.31396484375, -1.0302734375, -0.74658203125, -0.462890625, -0.17919921875, 0.1044921875, 0.38818359375, 0.671875, 0.95556640625, 1.2392578125, 1.52294921875, 1.806640625, 2.09033203125, 2.3740234375, 2.65771484375, 2.94140625, 3.22509765625, 3.5087890625, 3.79248046875, 4.076171875, 4.35986328125, 4.6435546875, 4.92724609375, 5.2109375, 5.49462890625, 5.7783203125, 6.06201171875, 6.345703125, 6.62939453125, 6.9130859375, 7.19677734375, 7.48046875, 7.76416015625, 8.0478515625, 8.33154296875, 8.615234375, 8.89892578125, 9.1826171875, 9.46630859375, 9.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 11.0, 22.0, 28.0, 50.0, 88.0, 155.0, 437.0, 1723.0, 27069.0, 1002358.0, 14591.0, 1293.0, 379.0, 153.0, 68.0, 36.0, 23.0, 15.0, 10.0, 10.0, 8.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -10.142333984375, -9.87841796875, -9.614501953125, -9.3505859375, -9.086669921875, -8.82275390625, -8.558837890625, -8.294921875, -8.031005859375, -7.76708984375, -7.503173828125, -7.2392578125, -6.975341796875, -6.71142578125, -6.447509765625, -6.18359375, -5.919677734375, -5.65576171875, -5.391845703125, -5.1279296875, -4.864013671875, -4.60009765625, -4.336181640625, -4.072265625, -3.808349609375, -3.54443359375, -3.280517578125, -3.0166015625, -2.752685546875, -2.48876953125, -2.224853515625, -1.9609375, -1.697021484375, -1.43310546875, -1.169189453125, -0.9052734375, -0.641357421875, -0.37744140625, -0.113525390625, 0.150390625, 0.414306640625, 0.67822265625, 0.942138671875, 1.2060546875, 1.469970703125, 1.73388671875, 1.997802734375, 2.26171875, 2.525634765625, 2.78955078125, 3.053466796875, 3.3173828125, 3.581298828125, 3.84521484375, 4.109130859375, 4.373046875, 4.636962890625, 4.90087890625, 5.164794921875, 5.4287109375, 5.692626953125, 5.95654296875, 6.220458984375, 6.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 5.0, 4.0, 8.0, 9.0, 10.0, 9.0, 18.0, 27.0, 23.0, 36.0, 35.0, 46.0, 55.0, 76.0, 74.0, 76.0, 85.0, 73.0, 52.0, 69.0, 43.0, 30.0, 28.0, 21.0, 14.0, 22.0, 13.0, 11.0, 7.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.000335693359375, -0.00032607465982437134, -0.0003164559602737427, -0.000306837260723114, -0.00029721856117248535, -0.0002875998616218567, -0.00027798116207122803, -0.00026836246252059937, -0.0002587437629699707, -0.00024912506341934204, -0.00023950636386871338, -0.00022988766431808472, -0.00022026896476745605, -0.0002106502652168274, -0.00020103156566619873, -0.00019141286611557007, -0.0001817941665649414, -0.00017217546701431274, -0.00016255676746368408, -0.00015293806791305542, -0.00014331936836242676, -0.0001337006688117981, -0.00012408196926116943, -0.00011446326971054077, -0.00010484457015991211, -9.522587060928345e-05, -8.560717105865479e-05, -7.598847150802612e-05, -6.636977195739746e-05, -5.67510724067688e-05, -4.713237285614014e-05, -3.7513673305511475e-05, -2.7894973754882812e-05, -1.827627420425415e-05, -8.657574653625488e-06, 9.611248970031738e-07, 1.0579824447631836e-05, 2.0198523998260498e-05, 2.981722354888916e-05, 3.943592309951782e-05, 4.9054622650146484e-05, 5.8673322200775146e-05, 6.829202175140381e-05, 7.791072130203247e-05, 8.752942085266113e-05, 9.71481204032898e-05, 0.00010676681995391846, 0.00011638551950454712, 0.00012600421905517578, 0.00013562291860580444, 0.0001452416181564331, 0.00015486031770706177, 0.00016447901725769043, 0.0001740977168083191, 0.00018371641635894775, 0.00019333511590957642, 0.00020295381546020508, 0.00021257251501083374, 0.0002221912145614624, 0.00023180991411209106, 0.00024142861366271973, 0.0002510473132133484, 0.00026066601276397705, 0.0002702847123146057, 0.0002799034118652344]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 14.0, 14.0, 24.0, 36.0, 60.0, 96.0, 207.0, 400.0, 940.0, 2593.0, 13972.0, 360196.0, 643367.0, 21136.0, 3386.0, 1114.0, 447.0, 221.0, 116.0, 66.0, 40.0, 26.0, 21.0, 12.0, 8.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5234375, -4.3907470703125, -4.258056640625, -4.1253662109375, -3.99267578125, -3.8599853515625, -3.727294921875, -3.5946044921875, -3.4619140625, -3.3292236328125, -3.196533203125, -3.0638427734375, -2.93115234375, -2.7984619140625, -2.665771484375, -2.5330810546875, -2.400390625, -2.2677001953125, -2.135009765625, -2.0023193359375, -1.86962890625, -1.7369384765625, -1.604248046875, -1.4715576171875, -1.3388671875, -1.2061767578125, -1.073486328125, -0.9407958984375, -0.80810546875, -0.6754150390625, -0.542724609375, -0.4100341796875, -0.27734375, -0.1446533203125, -0.011962890625, 0.1207275390625, 0.25341796875, 0.3861083984375, 0.518798828125, 0.6514892578125, 0.7841796875, 0.9168701171875, 1.049560546875, 1.1822509765625, 1.31494140625, 1.4476318359375, 1.580322265625, 1.7130126953125, 1.845703125, 1.9783935546875, 2.111083984375, 2.2437744140625, 2.37646484375, 2.5091552734375, 2.641845703125, 2.7745361328125, 2.9072265625, 3.0399169921875, 3.172607421875, 3.3052978515625, 3.43798828125, 3.5706787109375, 3.703369140625, 3.8360595703125, 3.96875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 7.0, 8.0, 14.0, 20.0, 22.0, 53.0, 83.0, 129.0, 147.0, 152.0, 127.0, 93.0, 58.0, 37.0, 17.0, 17.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.55078125, -6.374267578125, -6.19775390625, -6.021240234375, -5.8447265625, -5.668212890625, -5.49169921875, -5.315185546875, -5.138671875, -4.962158203125, -4.78564453125, -4.609130859375, -4.4326171875, -4.256103515625, -4.07958984375, -3.903076171875, -3.7265625, -3.550048828125, -3.37353515625, -3.197021484375, -3.0205078125, -2.843994140625, -2.66748046875, -2.490966796875, -2.314453125, -2.137939453125, -1.96142578125, -1.784912109375, -1.6083984375, -1.431884765625, -1.25537109375, -1.078857421875, -0.90234375, -0.725830078125, -0.54931640625, -0.372802734375, -0.1962890625, -0.019775390625, 0.15673828125, 0.333251953125, 0.509765625, 0.686279296875, 0.86279296875, 1.039306640625, 1.2158203125, 1.392333984375, 1.56884765625, 1.745361328125, 1.921875, 2.098388671875, 2.27490234375, 2.451416015625, 2.6279296875, 2.804443359375, 2.98095703125, 3.157470703125, 3.333984375, 3.510498046875, 3.68701171875, 3.863525390625, 4.0400390625, 4.216552734375, 4.39306640625, 4.569580078125, 4.74609375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 10.0, 72.0, 322.0, 422.0, 142.0, 27.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.71023559570312, -134.8750762939453, -131.0399169921875, -127.20476531982422, -123.36961364746094, -119.53445434570312, -115.69929504394531, -111.86414337158203, -108.02898406982422, -104.1938247680664, -100.35867309570312, -96.52351379394531, -92.68836212158203, -88.85320281982422, -85.01805114746094, -81.18289184570312, -77.34773254394531, -73.5125732421875, -69.67742156982422, -65.8422622680664, -62.00710678100586, -58.17195129394531, -54.336795806884766, -50.50164031982422, -46.66648864746094, -42.83133316040039, -38.996177673339844, -35.16101837158203, -31.325862884521484, -27.490707397460938, -23.65555191040039, -19.82039451599121, -15.985237121582031, -12.150080680847168, -8.314924240112305, -4.479768753051758, -0.6446123123168945, 3.1905441284179688, 7.025699615478516, 10.860857009887695, 14.696012496948242, 18.53116798400879, 22.36632537841797, 26.201480865478516, 30.036636352539062, 33.871795654296875, 37.706947326660156, 41.54210662841797, 45.377262115478516, 49.21241760253906, 53.04757308959961, 56.882728576660156, 60.71788787841797, 64.55303955078125, 68.38819885253906, 72.22335815429688, 76.05850982666016, 79.89366912841797, 83.72882080078125, 87.56398010253906, 91.39913177490234, 95.23429107666016, 99.06944274902344, 102.90460205078125, 106.73976135253906]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 2.0, 8.0, 7.0, 16.0, 12.0, 17.0, 16.0, 19.0, 28.0, 29.0, 27.0, 32.0, 39.0, 40.0, 44.0, 53.0, 47.0, 50.0, 59.0, 39.0, 42.0, 45.0, 43.0, 36.0, 49.0, 27.0, 35.0, 28.0, 18.0, 16.0, 18.0, 8.0, 8.0, 12.0, 8.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.68806838989258, -33.64277648925781, -32.59748077392578, -31.552188873291016, -30.506895065307617, -29.46160125732422, -28.416309356689453, -27.371015548706055, -26.325721740722656, -25.280427932739258, -24.23513412475586, -23.189842224121094, -22.144548416137695, -21.099254608154297, -20.05396270751953, -19.008668899536133, -17.963375091552734, -16.918081283569336, -15.872788429260254, -14.827495574951172, -13.782201766967773, -12.736907958984375, -11.691615104675293, -10.646322250366211, -9.601028442382812, -8.555734634399414, -7.510441780090332, -6.465148448944092, -5.419855117797852, -4.374561786651611, -3.329268455505371, -2.283975124359131, -1.238677978515625, -0.19338464736938477, 0.8519086837768555, 1.8972020149230957, 2.942495346069336, 3.987788677215576, 5.033082008361816, 6.078375339508057, 7.123668670654297, 8.168962478637695, 9.214255332946777, 10.25954818725586, 11.304841995239258, 12.350135803222656, 13.395428657531738, 14.44072151184082, 15.486015319824219, 16.531309127807617, 17.576602935791016, 18.62189483642578, 19.66718864440918, 20.712482452392578, 21.757774353027344, 22.803068161010742, 23.84836196899414, 24.89365577697754, 25.938949584960938, 26.984241485595703, 28.0295352935791, 29.0748291015625, 30.120121002197266, 31.165414810180664, 32.21070861816406]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 10.0, 9.0, 10.0, 22.0, 36.0, 50.0, 85.0, 112.0, 187.0, 279.0, 585.0, 1244.0, 2789.0, 7646.0, 31612.0, 332798.0, 3725227.0, 70484.0, 13457.0, 4112.0, 1722.0, 789.0, 441.0, 207.0, 141.0, 56.0, 52.0, 39.0, 28.0, 15.0, 9.0, 11.0, 2.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.802734375, -3.662994384765625, -3.52325439453125, -3.383514404296875, -3.2437744140625, -3.104034423828125, -2.96429443359375, -2.824554443359375, -2.684814453125, -2.545074462890625, -2.40533447265625, -2.265594482421875, -2.1258544921875, -1.986114501953125, -1.84637451171875, -1.706634521484375, -1.56689453125, -1.427154541015625, -1.28741455078125, -1.147674560546875, -1.0079345703125, -0.868194580078125, -0.72845458984375, -0.588714599609375, -0.448974609375, -0.309234619140625, -0.16949462890625, -0.029754638671875, 0.1099853515625, 0.249725341796875, 0.38946533203125, 0.529205322265625, 0.6689453125, 0.808685302734375, 0.94842529296875, 1.088165283203125, 1.2279052734375, 1.367645263671875, 1.50738525390625, 1.647125244140625, 1.786865234375, 1.926605224609375, 2.06634521484375, 2.206085205078125, 2.3458251953125, 2.485565185546875, 2.62530517578125, 2.765045166015625, 2.90478515625, 3.044525146484375, 3.18426513671875, 3.324005126953125, 3.4637451171875, 3.603485107421875, 3.74322509765625, 3.882965087890625, 4.022705078125, 4.162445068359375, 4.30218505859375, 4.441925048828125, 4.5816650390625, 4.721405029296875, 4.86114501953125, 5.000885009765625, 5.140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 7.0, 7.0, 7.0, 15.0, 22.0, 28.0, 32.0, 41.0, 54.0, 68.0, 75.0, 84.0, 84.0, 90.0, 81.0, 54.0, 55.0, 48.0, 38.0, 28.0, 21.0, 18.0, 13.0, 8.0, 7.0, 6.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.553619384765625, -2.48028564453125, -2.406951904296875, -2.3336181640625, -2.260284423828125, -2.18695068359375, -2.113616943359375, -2.040283203125, -1.966949462890625, -1.89361572265625, -1.820281982421875, -1.7469482421875, -1.673614501953125, -1.60028076171875, -1.526947021484375, -1.45361328125, -1.380279541015625, -1.30694580078125, -1.233612060546875, -1.1602783203125, -1.086944580078125, -1.01361083984375, -0.940277099609375, -0.866943359375, -0.793609619140625, -0.72027587890625, -0.646942138671875, -0.5736083984375, -0.500274658203125, -0.42694091796875, -0.353607177734375, -0.2802734375, -0.206939697265625, -0.13360595703125, -0.060272216796875, 0.0130615234375, 0.086395263671875, 0.15972900390625, 0.233062744140625, 0.306396484375, 0.379730224609375, 0.45306396484375, 0.526397705078125, 0.5997314453125, 0.673065185546875, 0.74639892578125, 0.819732666015625, 0.89306640625, 0.966400146484375, 1.03973388671875, 1.113067626953125, 1.1864013671875, 1.259735107421875, 1.33306884765625, 1.406402587890625, 1.479736328125, 1.553070068359375, 1.62640380859375, 1.699737548828125, 1.7730712890625, 1.846405029296875, 1.91973876953125, 1.993072509765625, 2.06640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 11.0, 21.0, 17.0, 33.0, 50.0, 64.0, 113.0, 150.0, 252.0, 386.0, 669.0, 1126.0, 2109.0, 4755.0, 12859.0, 52601.0, 526160.0, 3445473.0, 112671.0, 21478.0, 6781.0, 2913.0, 1462.0, 809.0, 462.0, 301.0, 178.0, 144.0, 64.0, 45.0, 35.0, 26.0, 18.0, 12.0, 4.0, 9.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.171875, -4.056640625, -3.94140625, -3.826171875, -3.7109375, -3.595703125, -3.48046875, -3.365234375, -3.25, -3.134765625, -3.01953125, -2.904296875, -2.7890625, -2.673828125, -2.55859375, -2.443359375, -2.328125, -2.212890625, -2.09765625, -1.982421875, -1.8671875, -1.751953125, -1.63671875, -1.521484375, -1.40625, -1.291015625, -1.17578125, -1.060546875, -0.9453125, -0.830078125, -0.71484375, -0.599609375, -0.484375, -0.369140625, -0.25390625, -0.138671875, -0.0234375, 0.091796875, 0.20703125, 0.322265625, 0.4375, 0.552734375, 0.66796875, 0.783203125, 0.8984375, 1.013671875, 1.12890625, 1.244140625, 1.359375, 1.474609375, 1.58984375, 1.705078125, 1.8203125, 1.935546875, 2.05078125, 2.166015625, 2.28125, 2.396484375, 2.51171875, 2.626953125, 2.7421875, 2.857421875, 2.97265625, 3.087890625, 3.203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 4.0, 10.0, 20.0, 22.0, 45.0, 93.0, 148.0, 401.0, 2358.0, 509.0, 215.0, 106.0, 48.0, 32.0, 22.0, 6.0, 8.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.268310546875, -2.20068359375, -2.133056640625, -2.0654296875, -1.997802734375, -1.93017578125, -1.862548828125, -1.794921875, -1.727294921875, -1.65966796875, -1.592041015625, -1.5244140625, -1.456787109375, -1.38916015625, -1.321533203125, -1.25390625, -1.186279296875, -1.11865234375, -1.051025390625, -0.9833984375, -0.915771484375, -0.84814453125, -0.780517578125, -0.712890625, -0.645263671875, -0.57763671875, -0.510009765625, -0.4423828125, -0.374755859375, -0.30712890625, -0.239501953125, -0.171875, -0.104248046875, -0.03662109375, 0.031005859375, 0.0986328125, 0.166259765625, 0.23388671875, 0.301513671875, 0.369140625, 0.436767578125, 0.50439453125, 0.572021484375, 0.6396484375, 0.707275390625, 0.77490234375, 0.842529296875, 0.91015625, 0.977783203125, 1.04541015625, 1.113037109375, 1.1806640625, 1.248291015625, 1.31591796875, 1.383544921875, 1.451171875, 1.518798828125, 1.58642578125, 1.654052734375, 1.7216796875, 1.789306640625, 1.85693359375, 1.924560546875, 1.9921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 9.0, 11.0, 26.0, 55.0, 68.0, 115.0, 140.0, 144.0, 145.0, 109.0, 56.0, 44.0, 37.0, 15.0, 15.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.77614688873291, -7.456036567687988, -7.135926246643066, -6.8158159255981445, -6.495705604553223, -6.175595283508301, -5.855485439300537, -5.535375118255615, -5.215264797210693, -4.8951544761657715, -4.57504415512085, -4.254933834075928, -3.934823751449585, -3.614713430404663, -3.2946033477783203, -2.9744930267333984, -2.6543827056884766, -2.3342723846435547, -2.014162063598633, -1.69405198097229, -1.3739416599273682, -1.0538313388824463, -0.733721137046814, -0.41361093521118164, -0.09350061416625977, 0.22660964727401733, 0.5467199087142944, 0.8668301701545715, 1.1869404315948486, 1.5070507526397705, 1.8271609544754028, 2.147271156311035, 2.4673824310302734, 2.7874927520751953, 3.107603073120117, 3.42771315574646, 3.747823476791382, 4.067934036254883, 4.3880438804626465, 4.708154201507568, 5.02826452255249, 5.348374843597412, 5.668485164642334, 5.988595485687256, 6.3087053298950195, 6.628815650939941, 6.948925971984863, 7.269036293029785, 7.589146614074707, 7.909256935119629, 8.22936725616455, 8.549477577209473, 8.869587898254395, 9.189698219299316, 9.509808540344238, 9.829917907714844, 10.150028228759766, 10.470138549804688, 10.79024887084961, 11.110359191894531, 11.430469512939453, 11.750579833984375, 12.070690155029297, 12.390800476074219, 12.71091079711914]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 6.0, 11.0, 11.0, 10.0, 11.0, 10.0, 12.0, 14.0, 23.0, 26.0, 23.0, 37.0, 28.0, 38.0, 42.0, 36.0, 51.0, 47.0, 41.0, 40.0, 46.0, 54.0, 53.0, 39.0, 63.0, 40.0, 29.0, 24.0, 26.0, 19.0, 22.0, 12.0, 14.0, 12.0, 7.0, 8.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3377227783203125, -5.162957191467285, -4.988192081451416, -4.813426971435547, -4.6386613845825195, -4.463895797729492, -4.289130687713623, -4.114365577697754, -3.9395999908447266, -3.7648346424102783, -3.59006929397583, -3.415303945541382, -3.2405385971069336, -3.0657732486724854, -2.891007900238037, -2.716242551803589, -2.5414772033691406, -2.3667118549346924, -2.191946506500244, -2.017181158065796, -1.8424158096313477, -1.6676504611968994, -1.4928851127624512, -1.318119764328003, -1.1433544158935547, -0.9685890674591064, -0.7938237190246582, -0.61905837059021, -0.4442930221557617, -0.2695276737213135, -0.09476232528686523, 0.08000302314758301, 0.25476837158203125, 0.4295337200164795, 0.6042990684509277, 0.779064416885376, 0.9538297653198242, 1.1285951137542725, 1.3033604621887207, 1.478125810623169, 1.6528911590576172, 1.8276565074920654, 2.0024218559265137, 2.177187204360962, 2.35195255279541, 2.5267179012298584, 2.7014832496643066, 2.876248598098755, 3.051013946533203, 3.2257792949676514, 3.4005446434020996, 3.575309991836548, 3.750075340270996, 3.9248406887054443, 4.099606037139893, 4.274371147155762, 4.449136734008789, 4.623902320861816, 4.7986674308776855, 4.973432540893555, 5.148198127746582, 5.322963714599609, 5.4977288246154785, 5.672493934631348, 5.847259521484375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 12.0, 12.0, 27.0, 46.0, 80.0, 194.0, 511.0, 1830.0, 9562.0, 97333.0, 754176.0, 166710.0, 14509.0, 2469.0, 647.0, 212.0, 90.0, 50.0, 30.0, 18.0, 11.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.20697021484375, -7.9764404296875, -7.74591064453125, -7.515380859375, -7.28485107421875, -7.0543212890625, -6.82379150390625, -6.59326171875, -6.36273193359375, -6.1322021484375, -5.90167236328125, -5.671142578125, -5.44061279296875, -5.2100830078125, -4.97955322265625, -4.7490234375, -4.51849365234375, -4.2879638671875, -4.05743408203125, -3.826904296875, -3.59637451171875, -3.3658447265625, -3.13531494140625, -2.90478515625, -2.67425537109375, -2.4437255859375, -2.21319580078125, -1.982666015625, -1.75213623046875, -1.5216064453125, -1.29107666015625, -1.060546875, -0.83001708984375, -0.5994873046875, -0.36895751953125, -0.138427734375, 0.09210205078125, 0.3226318359375, 0.55316162109375, 0.78369140625, 1.01422119140625, 1.2447509765625, 1.47528076171875, 1.705810546875, 1.93634033203125, 2.1668701171875, 2.39739990234375, 2.6279296875, 2.85845947265625, 3.0889892578125, 3.31951904296875, 3.550048828125, 3.78057861328125, 4.0111083984375, 4.24163818359375, 4.47216796875, 4.70269775390625, 4.9332275390625, 5.16375732421875, 5.394287109375, 5.62481689453125, 5.8553466796875, 6.08587646484375, 6.31640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 9.0, 10.0, 20.0, 19.0, 23.0, 29.0, 40.0, 45.0, 44.0, 77.0, 78.0, 74.0, 82.0, 69.0, 60.0, 53.0, 56.0, 41.0, 40.0, 30.0, 22.0, 21.0, 12.0, 7.0, 7.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9765625, -1.911224365234375, -1.84588623046875, -1.780548095703125, -1.7152099609375, -1.649871826171875, -1.58453369140625, -1.519195556640625, -1.453857421875, -1.388519287109375, -1.32318115234375, -1.257843017578125, -1.1925048828125, -1.127166748046875, -1.06182861328125, -0.996490478515625, -0.93115234375, -0.865814208984375, -0.80047607421875, -0.735137939453125, -0.6697998046875, -0.604461669921875, -0.53912353515625, -0.473785400390625, -0.408447265625, -0.343109130859375, -0.27777099609375, -0.212432861328125, -0.1470947265625, -0.081756591796875, -0.01641845703125, 0.048919677734375, 0.1142578125, 0.179595947265625, 0.24493408203125, 0.310272216796875, 0.3756103515625, 0.440948486328125, 0.50628662109375, 0.571624755859375, 0.636962890625, 0.702301025390625, 0.76763916015625, 0.832977294921875, 0.8983154296875, 0.963653564453125, 1.02899169921875, 1.094329833984375, 1.15966796875, 1.225006103515625, 1.29034423828125, 1.355682373046875, 1.4210205078125, 1.486358642578125, 1.55169677734375, 1.617034912109375, 1.682373046875, 1.747711181640625, 1.81304931640625, 1.878387451171875, 1.9437255859375, 2.009063720703125, 2.07440185546875, 2.139739990234375, 2.205078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 14.0, 14.0, 24.0, 30.0, 38.0, 68.0, 74.0, 136.0, 198.0, 315.0, 592.0, 1191.0, 2863.0, 10788.0, 102407.0, 785161.0, 126595.0, 12041.0, 3136.0, 1241.0, 583.0, 394.0, 207.0, 128.0, 83.0, 65.0, 40.0, 29.0, 23.0, 7.0, 7.0, 12.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.7578125, -5.5487060546875, -5.339599609375, -5.1304931640625, -4.92138671875, -4.7122802734375, -4.503173828125, -4.2940673828125, -4.0849609375, -3.8758544921875, -3.666748046875, -3.4576416015625, -3.24853515625, -3.0394287109375, -2.830322265625, -2.6212158203125, -2.412109375, -2.2030029296875, -1.993896484375, -1.7847900390625, -1.57568359375, -1.3665771484375, -1.157470703125, -0.9483642578125, -0.7392578125, -0.5301513671875, -0.321044921875, -0.1119384765625, 0.09716796875, 0.3062744140625, 0.515380859375, 0.7244873046875, 0.93359375, 1.1427001953125, 1.351806640625, 1.5609130859375, 1.77001953125, 1.9791259765625, 2.188232421875, 2.3973388671875, 2.6064453125, 2.8155517578125, 3.024658203125, 3.2337646484375, 3.44287109375, 3.6519775390625, 3.861083984375, 4.0701904296875, 4.279296875, 4.4884033203125, 4.697509765625, 4.9066162109375, 5.11572265625, 5.3248291015625, 5.533935546875, 5.7430419921875, 5.9521484375, 6.1612548828125, 6.370361328125, 6.5794677734375, 6.78857421875, 6.9976806640625, 7.206787109375, 7.4158935546875, 7.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 8.0, 13.0, 7.0, 12.0, 18.0, 24.0, 20.0, 31.0, 42.0, 37.0, 39.0, 55.0, 49.0, 72.0, 62.0, 65.0, 57.0, 49.0, 50.0, 48.0, 48.0, 35.0, 29.0, 22.0, 26.0, 18.0, 17.0, 9.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.29339599609375, -7.0438232421875, -6.79425048828125, -6.544677734375, -6.29510498046875, -6.0455322265625, -5.79595947265625, -5.54638671875, -5.29681396484375, -5.0472412109375, -4.79766845703125, -4.548095703125, -4.29852294921875, -4.0489501953125, -3.79937744140625, -3.5498046875, -3.30023193359375, -3.0506591796875, -2.80108642578125, -2.551513671875, -2.30194091796875, -2.0523681640625, -1.80279541015625, -1.55322265625, -1.30364990234375, -1.0540771484375, -0.80450439453125, -0.554931640625, -0.30535888671875, -0.0557861328125, 0.19378662109375, 0.443359375, 0.69293212890625, 0.9425048828125, 1.19207763671875, 1.441650390625, 1.69122314453125, 1.9407958984375, 2.19036865234375, 2.43994140625, 2.68951416015625, 2.9390869140625, 3.18865966796875, 3.438232421875, 3.68780517578125, 3.9373779296875, 4.18695068359375, 4.4365234375, 4.68609619140625, 4.9356689453125, 5.18524169921875, 5.434814453125, 5.68438720703125, 5.9339599609375, 6.18353271484375, 6.43310546875, 6.68267822265625, 6.9322509765625, 7.18182373046875, 7.431396484375, 7.68096923828125, 7.9305419921875, 8.18011474609375, 8.4296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 11.0, 11.0, 16.0, 20.0, 39.0, 51.0, 92.0, 143.0, 265.0, 613.0, 1675.0, 6686.0, 65868.0, 844058.0, 116175.0, 9398.0, 2017.0, 667.0, 319.0, 159.0, 99.0, 61.0, 36.0, 20.0, 15.0, 9.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.638671875, -3.533477783203125, -3.42828369140625, -3.323089599609375, -3.2178955078125, -3.112701416015625, -3.00750732421875, -2.902313232421875, -2.797119140625, -2.691925048828125, -2.58673095703125, -2.481536865234375, -2.3763427734375, -2.271148681640625, -2.16595458984375, -2.060760498046875, -1.95556640625, -1.850372314453125, -1.74517822265625, -1.639984130859375, -1.5347900390625, -1.429595947265625, -1.32440185546875, -1.219207763671875, -1.114013671875, -1.008819580078125, -0.90362548828125, -0.798431396484375, -0.6932373046875, -0.588043212890625, -0.48284912109375, -0.377655029296875, -0.2724609375, -0.167266845703125, -0.06207275390625, 0.043121337890625, 0.1483154296875, 0.253509521484375, 0.35870361328125, 0.463897705078125, 0.569091796875, 0.674285888671875, 0.77947998046875, 0.884674072265625, 0.9898681640625, 1.095062255859375, 1.20025634765625, 1.305450439453125, 1.41064453125, 1.515838623046875, 1.62103271484375, 1.726226806640625, 1.8314208984375, 1.936614990234375, 2.04180908203125, 2.147003173828125, 2.252197265625, 2.357391357421875, 2.46258544921875, 2.567779541015625, 2.6729736328125, 2.778167724609375, 2.88336181640625, 2.988555908203125, 3.09375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 17.0, 28.0, 48.0, 80.0, 98.0, 169.0, 232.0, 104.0, 72.0, 49.0, 27.0, 23.0, 18.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006008148193359375, -0.0005779117345809937, -0.0005550086498260498, -0.000532105565071106, -0.0005092024803161621, -0.00048629939556121826, -0.0004633963108062744, -0.00044049322605133057, -0.0004175901412963867, -0.00039468705654144287, -0.000371783971786499, -0.0003488808870315552, -0.00032597780227661133, -0.0003030747175216675, -0.00028017163276672363, -0.0002572685480117798, -0.00023436546325683594, -0.0002114623785018921, -0.00018855929374694824, -0.0001656562089920044, -0.00014275312423706055, -0.0001198500394821167, -9.694695472717285e-05, -7.4043869972229e-05, -5.1140785217285156e-05, -2.823770046234131e-05, -5.334615707397461e-06, 1.7568469047546387e-05, 4.0471553802490234e-05, 6.337463855743408e-05, 8.627772331237793e-05, 0.00010918080806732178, 0.00013208389282226562, 0.00015498697757720947, 0.00017789006233215332, 0.00020079314708709717, 0.00022369623184204102, 0.00024659931659698486, 0.0002695024013519287, 0.00029240548610687256, 0.0003153085708618164, 0.00033821165561676025, 0.0003611147403717041, 0.00038401782512664795, 0.0004069209098815918, 0.00042982399463653564, 0.0004527270793914795, 0.00047563016414642334, 0.0004985332489013672, 0.000521436333656311, 0.0005443394184112549, 0.0005672425031661987, 0.0005901455879211426, 0.0006130486726760864, 0.0006359517574310303, 0.0006588548421859741, 0.000681757926940918, 0.0007046610116958618, 0.0007275640964508057, 0.0007504671812057495, 0.0007733702659606934, 0.0007962733507156372, 0.0008191764354705811, 0.0008420795202255249, 0.0008649826049804688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 8.0, 11.0, 4.0, 15.0, 20.0, 37.0, 34.0, 52.0, 69.0, 106.0, 123.0, 241.0, 381.0, 596.0, 1159.0, 2466.0, 6625.0, 24249.0, 157421.0, 683555.0, 138170.0, 22028.0, 6091.0, 2352.0, 1084.0, 578.0, 370.0, 217.0, 138.0, 97.0, 63.0, 52.0, 34.0, 21.0, 22.0, 18.0, 11.0, 7.0, 8.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.9990234375, -1.9355010986328125, -1.871978759765625, -1.8084564208984375, -1.74493408203125, -1.6814117431640625, -1.617889404296875, -1.5543670654296875, -1.4908447265625, -1.4273223876953125, -1.363800048828125, -1.3002777099609375, -1.23675537109375, -1.1732330322265625, -1.109710693359375, -1.0461883544921875, -0.982666015625, -0.9191436767578125, -0.855621337890625, -0.7920989990234375, -0.72857666015625, -0.6650543212890625, -0.601531982421875, -0.5380096435546875, -0.4744873046875, -0.4109649658203125, -0.347442626953125, -0.2839202880859375, -0.22039794921875, -0.1568756103515625, -0.093353271484375, -0.0298309326171875, 0.03369140625, 0.0972137451171875, 0.160736083984375, 0.2242584228515625, 0.28778076171875, 0.3513031005859375, 0.414825439453125, 0.4783477783203125, 0.5418701171875, 0.6053924560546875, 0.668914794921875, 0.7324371337890625, 0.79595947265625, 0.8594818115234375, 0.923004150390625, 0.9865264892578125, 1.050048828125, 1.1135711669921875, 1.177093505859375, 1.2406158447265625, 1.30413818359375, 1.3676605224609375, 1.431182861328125, 1.4947052001953125, 1.5582275390625, 1.6217498779296875, 1.685272216796875, 1.7487945556640625, 1.81231689453125, 1.8758392333984375, 1.939361572265625, 2.0028839111328125, 2.06640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 6.0, 11.0, 10.0, 22.0, 19.0, 26.0, 42.0, 61.0, 61.0, 70.0, 84.0, 103.0, 87.0, 76.0, 76.0, 60.0, 42.0, 29.0, 21.0, 18.0, 14.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.73046875, -2.65606689453125, -2.5816650390625, -2.50726318359375, -2.432861328125, -2.35845947265625, -2.2840576171875, -2.20965576171875, -2.13525390625, -2.06085205078125, -1.9864501953125, -1.91204833984375, -1.837646484375, -1.76324462890625, -1.6888427734375, -1.61444091796875, -1.5400390625, -1.46563720703125, -1.3912353515625, -1.31683349609375, -1.242431640625, -1.16802978515625, -1.0936279296875, -1.01922607421875, -0.94482421875, -0.87042236328125, -0.7960205078125, -0.72161865234375, -0.647216796875, -0.57281494140625, -0.4984130859375, -0.42401123046875, -0.349609375, -0.27520751953125, -0.2008056640625, -0.12640380859375, -0.052001953125, 0.02239990234375, 0.0968017578125, 0.17120361328125, 0.24560546875, 0.32000732421875, 0.3944091796875, 0.46881103515625, 0.543212890625, 0.61761474609375, 0.6920166015625, 0.76641845703125, 0.8408203125, 0.91522216796875, 0.9896240234375, 1.06402587890625, 1.138427734375, 1.21282958984375, 1.2872314453125, 1.36163330078125, 1.43603515625, 1.51043701171875, 1.5848388671875, 1.65924072265625, 1.733642578125, 1.80804443359375, 1.8824462890625, 1.95684814453125, 2.03125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 15.0, 44.0, 100.0, 206.0, 284.0, 211.0, 86.0, 34.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.668087005615234, -44.50807189941406, -42.348060607910156, -40.188045501708984, -38.02803421020508, -35.868019104003906, -33.7080078125, -31.547992706298828, -29.38797950744629, -27.22796630859375, -25.06795310974121, -22.907939910888672, -20.7479248046875, -18.587913513183594, -16.427898406982422, -14.267885208129883, -12.107872009277344, -9.947858810424805, -7.787845134735107, -5.62783145904541, -3.467818260192871, -1.307805061340332, 0.8522090911865234, 3.0122222900390625, 5.172235488891602, 7.332248687744141, 9.49226188659668, 11.652276039123535, 13.812289237976074, 15.972302436828613, 18.13231658935547, 20.292329788208008, 22.45233917236328, 24.61235237121582, 26.77236557006836, 28.93238067626953, 31.092391967773438, 33.25240707397461, 35.41242218017578, 37.57243347167969, 39.732444763183594, 41.892459869384766, 44.05247116088867, 46.212486267089844, 48.37249755859375, 50.53251266479492, 52.692527770996094, 54.8525390625, 57.01255416870117, 59.172569274902344, 61.33258056640625, 63.49259567260742, 65.6526107788086, 67.8126220703125, 69.9726333618164, 72.13264465332031, 74.29266357421875, 76.45267486572266, 78.6126937866211, 80.772705078125, 82.9327163696289, 85.09272766113281, 87.25274658203125, 89.41275787353516, 91.57276916503906]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 0.0, 4.0, 9.0, 4.0, 4.0, 10.0, 11.0, 6.0, 11.0, 16.0, 18.0, 18.0, 16.0, 36.0, 27.0, 30.0, 43.0, 42.0, 53.0, 41.0, 58.0, 50.0, 60.0, 49.0, 47.0, 39.0, 40.0, 31.0, 27.0, 26.0, 33.0, 30.0, 21.0, 20.0, 13.0, 11.0, 10.0, 10.0, 7.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.500905990600586, -26.612884521484375, -25.724864959716797, -24.836843490600586, -23.948822021484375, -23.060802459716797, -22.172780990600586, -21.284759521484375, -20.396739959716797, -19.508718490600586, -18.620698928833008, -17.732677459716797, -16.844655990600586, -15.956635475158691, -15.068614959716797, -14.180593490600586, -13.292572021484375, -12.40455150604248, -11.51653003692627, -10.628509521484375, -9.740488052368164, -8.85246753692627, -7.964447021484375, -7.076426029205322, -6.1884050369262695, -5.300384044647217, -4.412363052368164, -3.5243425369262695, -2.636321544647217, -1.748300552368164, -0.8602800369262695, 0.027740955352783203, 0.9157619476318359, 1.8037828207015991, 2.6918036937713623, 3.579824447631836, 4.467845439910889, 5.355866432189941, 6.243886947631836, 7.131907939910889, 8.019928932189941, 8.907949447631836, 9.795970916748047, 10.683991432189941, 11.572011947631836, 12.460033416748047, 13.348053932189941, 14.236074447631836, 15.124095916748047, 16.012117385864258, 16.900136947631836, 17.788158416748047, 18.676179885864258, 19.56420135498047, 20.452220916748047, 21.340242385864258, 22.22826385498047, 23.11628532409668, 24.004304885864258, 24.89232635498047, 25.78034782409668, 26.66836929321289, 27.55638885498047, 28.44441032409668, 29.332429885864258]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 2.0, 4.0, 9.0, 15.0, 13.0, 20.0, 44.0, 76.0, 151.0, 282.0, 775.0, 2415.0, 12157.0, 149026.0, 3735475.0, 272273.0, 16931.0, 3070.0, 860.0, 338.0, 159.0, 78.0, 35.0, 21.0, 10.0, 13.0, 6.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.921875, -5.779449462890625, -5.63702392578125, -5.494598388671875, -5.3521728515625, -5.209747314453125, -5.06732177734375, -4.924896240234375, -4.782470703125, -4.640045166015625, -4.49761962890625, -4.355194091796875, -4.2127685546875, -4.070343017578125, -3.92791748046875, -3.785491943359375, -3.64306640625, -3.500640869140625, -3.35821533203125, -3.215789794921875, -3.0733642578125, -2.930938720703125, -2.78851318359375, -2.646087646484375, -2.503662109375, -2.361236572265625, -2.21881103515625, -2.076385498046875, -1.9339599609375, -1.791534423828125, -1.64910888671875, -1.506683349609375, -1.3642578125, -1.221832275390625, -1.07940673828125, -0.936981201171875, -0.7945556640625, -0.652130126953125, -0.50970458984375, -0.367279052734375, -0.224853515625, -0.082427978515625, 0.05999755859375, 0.202423095703125, 0.3448486328125, 0.487274169921875, 0.62969970703125, 0.772125244140625, 0.91455078125, 1.056976318359375, 1.19940185546875, 1.341827392578125, 1.4842529296875, 1.626678466796875, 1.76910400390625, 1.911529541015625, 2.053955078125, 2.196380615234375, 2.33880615234375, 2.481231689453125, 2.6236572265625, 2.766082763671875, 2.90850830078125, 3.050933837890625, 3.193359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 12.0, 8.0, 20.0, 15.0, 21.0, 26.0, 33.0, 37.0, 36.0, 62.0, 72.0, 77.0, 46.0, 66.0, 66.0, 64.0, 59.0, 64.0, 30.0, 35.0, 27.0, 32.0, 26.0, 13.0, 11.0, 8.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.76702880859375, -1.7137451171875, -1.66046142578125, -1.607177734375, -1.55389404296875, -1.5006103515625, -1.44732666015625, -1.39404296875, -1.34075927734375, -1.2874755859375, -1.23419189453125, -1.180908203125, -1.12762451171875, -1.0743408203125, -1.02105712890625, -0.9677734375, -0.91448974609375, -0.8612060546875, -0.80792236328125, -0.754638671875, -0.70135498046875, -0.6480712890625, -0.59478759765625, -0.54150390625, -0.48822021484375, -0.4349365234375, -0.38165283203125, -0.328369140625, -0.27508544921875, -0.2218017578125, -0.16851806640625, -0.115234375, -0.06195068359375, -0.0086669921875, 0.04461669921875, 0.097900390625, 0.15118408203125, 0.2044677734375, 0.25775146484375, 0.31103515625, 0.36431884765625, 0.4176025390625, 0.47088623046875, 0.524169921875, 0.57745361328125, 0.6307373046875, 0.68402099609375, 0.7373046875, 0.79058837890625, 0.8438720703125, 0.89715576171875, 0.950439453125, 1.00372314453125, 1.0570068359375, 1.11029052734375, 1.16357421875, 1.21685791015625, 1.2701416015625, 1.32342529296875, 1.376708984375, 1.42999267578125, 1.4832763671875, 1.53656005859375, 1.58984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 8.0, 9.0, 13.0, 25.0, 36.0, 32.0, 79.0, 138.0, 231.0, 587.0, 1296.0, 4081.0, 16652.0, 128518.0, 3364503.0, 628297.0, 38487.0, 7508.0, 2087.0, 871.0, 363.0, 195.0, 99.0, 45.0, 29.0, 27.0, 15.0, 8.0, 5.0, 4.0, 1.0, 5.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.79449462890625, -3.6710205078125, -3.54754638671875, -3.424072265625, -3.30059814453125, -3.1771240234375, -3.05364990234375, -2.93017578125, -2.80670166015625, -2.6832275390625, -2.55975341796875, -2.436279296875, -2.31280517578125, -2.1893310546875, -2.06585693359375, -1.9423828125, -1.81890869140625, -1.6954345703125, -1.57196044921875, -1.448486328125, -1.32501220703125, -1.2015380859375, -1.07806396484375, -0.95458984375, -0.83111572265625, -0.7076416015625, -0.58416748046875, -0.460693359375, -0.33721923828125, -0.2137451171875, -0.09027099609375, 0.033203125, 0.15667724609375, 0.2801513671875, 0.40362548828125, 0.527099609375, 0.65057373046875, 0.7740478515625, 0.89752197265625, 1.02099609375, 1.14447021484375, 1.2679443359375, 1.39141845703125, 1.514892578125, 1.63836669921875, 1.7618408203125, 1.88531494140625, 2.0087890625, 2.13226318359375, 2.2557373046875, 2.37921142578125, 2.502685546875, 2.62615966796875, 2.7496337890625, 2.87310791015625, 2.99658203125, 3.12005615234375, 3.2435302734375, 3.36700439453125, 3.490478515625, 3.61395263671875, 3.7374267578125, 3.86090087890625, 3.984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 14.0, 10.0, 17.0, 40.0, 78.0, 130.0, 286.0, 598.0, 963.0, 878.0, 476.0, 246.0, 121.0, 65.0, 44.0, 28.0, 19.0, 9.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.505859375, -3.370269775390625, -3.23468017578125, -3.099090576171875, -2.9635009765625, -2.827911376953125, -2.69232177734375, -2.556732177734375, -2.421142578125, -2.285552978515625, -2.14996337890625, -2.014373779296875, -1.8787841796875, -1.743194580078125, -1.60760498046875, -1.472015380859375, -1.33642578125, -1.200836181640625, -1.06524658203125, -0.929656982421875, -0.7940673828125, -0.658477783203125, -0.52288818359375, -0.387298583984375, -0.251708984375, -0.116119384765625, 0.01947021484375, 0.155059814453125, 0.2906494140625, 0.426239013671875, 0.56182861328125, 0.697418212890625, 0.8330078125, 0.968597412109375, 1.10418701171875, 1.239776611328125, 1.3753662109375, 1.510955810546875, 1.64654541015625, 1.782135009765625, 1.917724609375, 2.053314208984375, 2.18890380859375, 2.324493408203125, 2.4600830078125, 2.595672607421875, 2.73126220703125, 2.866851806640625, 3.00244140625, 3.138031005859375, 3.27362060546875, 3.409210205078125, 3.5447998046875, 3.680389404296875, 3.81597900390625, 3.951568603515625, 4.087158203125, 4.222747802734375, 4.35833740234375, 4.493927001953125, 4.6295166015625, 4.765106201171875, 4.90069580078125, 5.036285400390625, 5.171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 4.0, 9.0, 22.0, 48.0, 97.0, 157.0, 186.0, 194.0, 126.0, 63.0, 35.0, 22.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.715469360351562, -22.699506759643555, -21.683544158935547, -20.66758155822754, -19.65161895751953, -18.635656356811523, -17.619693756103516, -16.603731155395508, -15.5877685546875, -14.571805953979492, -13.555843353271484, -12.539880752563477, -11.523918151855469, -10.507955551147461, -9.491992950439453, -8.476030349731445, -7.4600677490234375, -6.44410514831543, -5.428142547607422, -4.412179946899414, -3.3962173461914062, -2.3802547454833984, -1.3642921447753906, -0.3483295440673828, 0.667633056640625, 1.6835956573486328, 2.6995582580566406, 3.7155208587646484, 4.731483459472656, 5.747446060180664, 6.763408660888672, 7.77937126159668, 8.795330047607422, 9.81129264831543, 10.827255249023438, 11.843217849731445, 12.859180450439453, 13.875143051147461, 14.891105651855469, 15.907068252563477, 16.923030853271484, 17.938993453979492, 18.9549560546875, 19.970918655395508, 20.986881256103516, 22.002843856811523, 23.01880645751953, 24.03476905822754, 25.050731658935547, 26.066694259643555, 27.082656860351562, 28.09861946105957, 29.114582061767578, 30.130544662475586, 31.146507263183594, 32.16246795654297, 33.17843246459961, 34.19439697265625, 35.210357666015625, 36.226318359375, 37.24228286743164, 38.25824737548828, 39.274208068847656, 40.29016876220703, 41.30613327026367]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 8.0, 5.0, 11.0, 18.0, 9.0, 15.0, 18.0, 28.0, 38.0, 36.0, 41.0, 39.0, 39.0, 53.0, 54.0, 57.0, 53.0, 66.0, 59.0, 62.0, 45.0, 42.0, 32.0, 32.0, 26.0, 27.0, 18.0, 16.0, 15.0, 10.0, 9.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.70244026184082, -19.173219680786133, -18.644001007080078, -18.11478042602539, -17.585559844970703, -17.056339263916016, -16.52712059020996, -15.997900009155273, -15.468680381774902, -14.939460754394531, -14.410240173339844, -13.881020545959473, -13.351800918579102, -12.822580337524414, -12.293360710144043, -11.764141082763672, -11.234920501708984, -10.705700874328613, -10.176480293273926, -9.647260665893555, -9.118040084838867, -8.588820457458496, -8.059600830078125, -7.530380725860596, -7.001160621643066, -6.471940517425537, -5.942720413208008, -5.413500785827637, -4.884280681610107, -4.355060577392578, -3.825840711593628, -3.2966208457946777, -2.7674007415771484, -2.238180637359619, -1.708960771560669, -1.1797407865524292, -0.6505208015441895, -0.12130069732666016, 0.40791916847229004, 0.9371390342712402, 1.4663591384887695, 1.9955791234970093, 2.524799108505249, 3.054018974304199, 3.5832390785217285, 4.112459182739258, 4.641678810119629, 5.170898914337158, 5.7001190185546875, 6.229339122772217, 6.758559226989746, 7.287778854370117, 7.8169989585876465, 8.346219062805176, 8.875438690185547, 9.404659271240234, 9.933878898620605, 10.463098526000977, 10.992319107055664, 11.521538734436035, 12.050758361816406, 12.579978942871094, 13.109198570251465, 13.638418197631836, 14.167638778686523]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 14.0, 11.0, 7.0, 15.0, 23.0, 23.0, 35.0, 60.0, 76.0, 127.0, 174.0, 238.0, 351.0, 588.0, 887.0, 1311.0, 2241.0, 3625.0, 6667.0, 12201.0, 24328.0, 50053.0, 117070.0, 290291.0, 304467.0, 124940.0, 53471.0, 25103.0, 12867.0, 7027.0, 3922.0, 2217.0, 1455.0, 879.0, 614.0, 372.0, 222.0, 180.0, 123.0, 70.0, 46.0, 34.0, 29.0, 39.0, 14.0, 14.0, 12.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.8544921875, -1.79473876953125, -1.7349853515625, -1.67523193359375, -1.615478515625, -1.55572509765625, -1.4959716796875, -1.43621826171875, -1.37646484375, -1.31671142578125, -1.2569580078125, -1.19720458984375, -1.137451171875, -1.07769775390625, -1.0179443359375, -0.95819091796875, -0.8984375, -0.83868408203125, -0.7789306640625, -0.71917724609375, -0.659423828125, -0.59967041015625, -0.5399169921875, -0.48016357421875, -0.42041015625, -0.36065673828125, -0.3009033203125, -0.24114990234375, -0.181396484375, -0.12164306640625, -0.0618896484375, -0.00213623046875, 0.0576171875, 0.11737060546875, 0.1771240234375, 0.23687744140625, 0.296630859375, 0.35638427734375, 0.4161376953125, 0.47589111328125, 0.53564453125, 0.59539794921875, 0.6551513671875, 0.71490478515625, 0.774658203125, 0.83441162109375, 0.8941650390625, 0.95391845703125, 1.013671875, 1.07342529296875, 1.1331787109375, 1.19293212890625, 1.252685546875, 1.31243896484375, 1.3721923828125, 1.43194580078125, 1.49169921875, 1.55145263671875, 1.6112060546875, 1.67095947265625, 1.730712890625, 1.79046630859375, 1.8502197265625, 1.90997314453125, 1.9697265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 10.0, 12.0, 11.0, 26.0, 23.0, 28.0, 33.0, 52.0, 60.0, 57.0, 62.0, 60.0, 55.0, 62.0, 61.0, 65.0, 55.0, 45.0, 39.0, 35.0, 30.0, 28.0, 25.0, 15.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.71392822265625, -1.6632080078125, -1.61248779296875, -1.561767578125, -1.51104736328125, -1.4603271484375, -1.40960693359375, -1.35888671875, -1.30816650390625, -1.2574462890625, -1.20672607421875, -1.156005859375, -1.10528564453125, -1.0545654296875, -1.00384521484375, -0.953125, -0.90240478515625, -0.8516845703125, -0.80096435546875, -0.750244140625, -0.69952392578125, -0.6488037109375, -0.59808349609375, -0.54736328125, -0.49664306640625, -0.4459228515625, -0.39520263671875, -0.344482421875, -0.29376220703125, -0.2430419921875, -0.19232177734375, -0.1416015625, -0.09088134765625, -0.0401611328125, 0.01055908203125, 0.061279296875, 0.11199951171875, 0.1627197265625, 0.21343994140625, 0.26416015625, 0.31488037109375, 0.3656005859375, 0.41632080078125, 0.467041015625, 0.51776123046875, 0.5684814453125, 0.61920166015625, 0.669921875, 0.72064208984375, 0.7713623046875, 0.82208251953125, 0.872802734375, 0.92352294921875, 0.9742431640625, 1.02496337890625, 1.07568359375, 1.12640380859375, 1.1771240234375, 1.22784423828125, 1.278564453125, 1.32928466796875, 1.3800048828125, 1.43072509765625, 1.4814453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 9.0, 14.0, 16.0, 20.0, 26.0, 41.0, 74.0, 105.0, 165.0, 265.0, 478.0, 1060.0, 2456.0, 9101.0, 94596.0, 855963.0, 71701.0, 7959.0, 2234.0, 986.0, 474.0, 302.0, 165.0, 124.0, 68.0, 42.0, 28.0, 29.0, 14.0, 8.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.07421875, -6.84930419921875, -6.6243896484375, -6.39947509765625, -6.174560546875, -5.94964599609375, -5.7247314453125, -5.49981689453125, -5.27490234375, -5.04998779296875, -4.8250732421875, -4.60015869140625, -4.375244140625, -4.15032958984375, -3.9254150390625, -3.70050048828125, -3.4755859375, -3.25067138671875, -3.0257568359375, -2.80084228515625, -2.575927734375, -2.35101318359375, -2.1260986328125, -1.90118408203125, -1.67626953125, -1.45135498046875, -1.2264404296875, -1.00152587890625, -0.776611328125, -0.55169677734375, -0.3267822265625, -0.10186767578125, 0.123046875, 0.34796142578125, 0.5728759765625, 0.79779052734375, 1.022705078125, 1.24761962890625, 1.4725341796875, 1.69744873046875, 1.92236328125, 2.14727783203125, 2.3721923828125, 2.59710693359375, 2.822021484375, 3.04693603515625, 3.2718505859375, 3.49676513671875, 3.7216796875, 3.94659423828125, 4.1715087890625, 4.39642333984375, 4.621337890625, 4.84625244140625, 5.0711669921875, 5.29608154296875, 5.52099609375, 5.74591064453125, 5.9708251953125, 6.19573974609375, 6.420654296875, 6.64556884765625, 6.8704833984375, 7.09539794921875, 7.3203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 18.0, 19.0, 14.0, 35.0, 51.0, 44.0, 64.0, 69.0, 63.0, 83.0, 87.0, 89.0, 68.0, 58.0, 56.0, 40.0, 37.0, 26.0, 14.0, 14.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.35870361328125, -6.0416259765625, -5.72454833984375, -5.407470703125, -5.09039306640625, -4.7733154296875, -4.45623779296875, -4.13916015625, -3.82208251953125, -3.5050048828125, -3.18792724609375, -2.870849609375, -2.55377197265625, -2.2366943359375, -1.91961669921875, -1.6025390625, -1.28546142578125, -0.9683837890625, -0.65130615234375, -0.334228515625, -0.01715087890625, 0.2999267578125, 0.61700439453125, 0.93408203125, 1.25115966796875, 1.5682373046875, 1.88531494140625, 2.202392578125, 2.51947021484375, 2.8365478515625, 3.15362548828125, 3.470703125, 3.78778076171875, 4.1048583984375, 4.42193603515625, 4.739013671875, 5.05609130859375, 5.3731689453125, 5.69024658203125, 6.00732421875, 6.32440185546875, 6.6414794921875, 6.95855712890625, 7.275634765625, 7.59271240234375, 7.9097900390625, 8.22686767578125, 8.5439453125, 8.86102294921875, 9.1781005859375, 9.49517822265625, 9.812255859375, 10.12933349609375, 10.4464111328125, 10.76348876953125, 11.08056640625, 11.39764404296875, 11.7147216796875, 12.03179931640625, 12.348876953125, 12.66595458984375, 12.9830322265625, 13.30010986328125, 13.6171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 22.0, 24.0, 44.0, 64.0, 91.0, 154.0, 265.0, 586.0, 1549.0, 4819.0, 25328.0, 315509.0, 653534.0, 36989.0, 6331.0, 1750.0, 684.0, 323.0, 156.0, 103.0, 66.0, 43.0, 21.0, 17.0, 16.0, 16.0, 9.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1484375, -3.05609130859375, -2.9637451171875, -2.87139892578125, -2.779052734375, -2.68670654296875, -2.5943603515625, -2.50201416015625, -2.40966796875, -2.31732177734375, -2.2249755859375, -2.13262939453125, -2.040283203125, -1.94793701171875, -1.8555908203125, -1.76324462890625, -1.6708984375, -1.57855224609375, -1.4862060546875, -1.39385986328125, -1.301513671875, -1.20916748046875, -1.1168212890625, -1.02447509765625, -0.93212890625, -0.83978271484375, -0.7474365234375, -0.65509033203125, -0.562744140625, -0.47039794921875, -0.3780517578125, -0.28570556640625, -0.193359375, -0.10101318359375, -0.0086669921875, 0.08367919921875, 0.176025390625, 0.26837158203125, 0.3607177734375, 0.45306396484375, 0.54541015625, 0.63775634765625, 0.7301025390625, 0.82244873046875, 0.914794921875, 1.00714111328125, 1.0994873046875, 1.19183349609375, 1.2841796875, 1.37652587890625, 1.4688720703125, 1.56121826171875, 1.653564453125, 1.74591064453125, 1.8382568359375, 1.93060302734375, 2.02294921875, 2.11529541015625, 2.2076416015625, 2.29998779296875, 2.392333984375, 2.48468017578125, 2.5770263671875, 2.66937255859375, 2.76171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 6.0, 10.0, 11.0, 10.0, 12.0, 17.0, 19.0, 19.0, 29.0, 37.0, 41.0, 48.0, 77.0, 117.0, 155.0, 100.0, 51.0, 44.0, 39.0, 25.0, 24.0, 12.0, 15.0, 14.0, 12.0, 9.0, 7.0, 7.0, 4.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003981590270996094, -0.00038535892963409424, -0.0003725588321685791, -0.00035975873470306396, -0.00034695863723754883, -0.0003341585397720337, -0.00032135844230651855, -0.0003085583448410034, -0.0002957582473754883, -0.00028295814990997314, -0.000270158052444458, -0.00025735795497894287, -0.00024455785751342773, -0.0002317577600479126, -0.00021895766258239746, -0.00020615756511688232, -0.0001933574676513672, -0.00018055737018585205, -0.00016775727272033691, -0.00015495717525482178, -0.00014215707778930664, -0.0001293569803237915, -0.00011655688285827637, -0.00010375678539276123, -9.09566879272461e-05, -7.815659046173096e-05, -6.535649299621582e-05, -5.2556395530700684e-05, -3.975629806518555e-05, -2.695620059967041e-05, -1.4156103134155273e-05, -1.3560056686401367e-06, 1.1444091796875e-05, 2.4244189262390137e-05, 3.7044286727905273e-05, 4.984438419342041e-05, 6.264448165893555e-05, 7.544457912445068e-05, 8.824467658996582e-05, 0.00010104477405548096, 0.0001138448715209961, 0.00012664496898651123, 0.00013944506645202637, 0.0001522451639175415, 0.00016504526138305664, 0.00017784535884857178, 0.00019064545631408691, 0.00020344555377960205, 0.0002162456512451172, 0.00022904574871063232, 0.00024184584617614746, 0.0002546459436416626, 0.00026744604110717773, 0.00028024613857269287, 0.000293046236038208, 0.00030584633350372314, 0.0003186464309692383, 0.0003314465284347534, 0.00034424662590026855, 0.0003570467233657837, 0.00036984682083129883, 0.00038264691829681396, 0.0003954470157623291, 0.00040824711322784424, 0.0004210472106933594]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 8.0, 8.0, 12.0, 19.0, 23.0, 40.0, 39.0, 86.0, 118.0, 192.0, 307.0, 647.0, 1413.0, 3748.0, 13742.0, 103418.0, 818637.0, 87441.0, 12431.0, 3396.0, 1342.0, 614.0, 328.0, 186.0, 97.0, 75.0, 46.0, 39.0, 29.0, 18.0, 16.0, 11.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.181640625, -3.094390869140625, -3.00714111328125, -2.919891357421875, -2.8326416015625, -2.745391845703125, -2.65814208984375, -2.570892333984375, -2.483642578125, -2.396392822265625, -2.30914306640625, -2.221893310546875, -2.1346435546875, -2.047393798828125, -1.96014404296875, -1.872894287109375, -1.78564453125, -1.698394775390625, -1.61114501953125, -1.523895263671875, -1.4366455078125, -1.349395751953125, -1.26214599609375, -1.174896240234375, -1.087646484375, -1.000396728515625, -0.91314697265625, -0.825897216796875, -0.7386474609375, -0.651397705078125, -0.56414794921875, -0.476898193359375, -0.3896484375, -0.302398681640625, -0.21514892578125, -0.127899169921875, -0.0406494140625, 0.046600341796875, 0.13385009765625, 0.221099853515625, 0.308349609375, 0.395599365234375, 0.48284912109375, 0.570098876953125, 0.6573486328125, 0.744598388671875, 0.83184814453125, 0.919097900390625, 1.00634765625, 1.093597412109375, 1.18084716796875, 1.268096923828125, 1.3553466796875, 1.442596435546875, 1.52984619140625, 1.617095947265625, 1.704345703125, 1.791595458984375, 1.87884521484375, 1.966094970703125, 2.0533447265625, 2.140594482421875, 2.22784423828125, 2.315093994140625, 2.40234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 10.0, 5.0, 17.0, 15.0, 21.0, 28.0, 50.0, 81.0, 122.0, 172.0, 149.0, 117.0, 69.0, 57.0, 30.0, 25.0, 14.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.018310546875, -2.90966796875, -2.801025390625, -2.6923828125, -2.583740234375, -2.47509765625, -2.366455078125, -2.2578125, -2.149169921875, -2.04052734375, -1.931884765625, -1.8232421875, -1.714599609375, -1.60595703125, -1.497314453125, -1.388671875, -1.280029296875, -1.17138671875, -1.062744140625, -0.9541015625, -0.845458984375, -0.73681640625, -0.628173828125, -0.51953125, -0.410888671875, -0.30224609375, -0.193603515625, -0.0849609375, 0.023681640625, 0.13232421875, 0.240966796875, 0.349609375, 0.458251953125, 0.56689453125, 0.675537109375, 0.7841796875, 0.892822265625, 1.00146484375, 1.110107421875, 1.21875, 1.327392578125, 1.43603515625, 1.544677734375, 1.6533203125, 1.761962890625, 1.87060546875, 1.979248046875, 2.087890625, 2.196533203125, 2.30517578125, 2.413818359375, 2.5224609375, 2.631103515625, 2.73974609375, 2.848388671875, 2.95703125, 3.065673828125, 3.17431640625, 3.282958984375, 3.3916015625, 3.500244140625, 3.60888671875, 3.717529296875, 3.826171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 13.0, 45.0, 110.0, 252.0, 301.0, 175.0, 47.0, 20.0, 17.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-73.80152893066406, -71.91454315185547, -70.02754974365234, -68.14056396484375, -66.25357818603516, -64.36658477783203, -62.47959899902344, -60.59260940551758, -58.70561981201172, -56.81863021850586, -54.931644439697266, -53.044654846191406, -51.15766525268555, -49.27067565917969, -47.383689880371094, -45.496700286865234, -43.60971450805664, -41.72272491455078, -39.83573913574219, -37.94874954223633, -36.06175994873047, -34.174774169921875, -32.287784576416016, -30.400794982910156, -28.51380729675293, -26.626819610595703, -24.739830017089844, -22.852842330932617, -20.96585464477539, -19.07886505126953, -17.191877365112305, -15.304888725280762, -13.417903900146484, -11.530915260314941, -9.643926620483398, -7.756938934326172, -5.869950294494629, -3.982961654663086, -2.0959739685058594, -0.2089853286743164, 1.6780033111572266, 3.5649917125701904, 5.451980113983154, 7.338968276977539, 9.225956916809082, 11.112945556640625, 12.999933242797852, 14.886921882629395, 16.773910522460938, 18.660898208618164, 20.547887802124023, 22.43487548828125, 24.32186508178711, 26.208852767944336, 28.095840454101562, 29.982830047607422, 31.86981773376465, 33.756805419921875, 35.643795013427734, 37.530784606933594, 39.41777038574219, 41.30475997924805, 43.191749572753906, 45.0787353515625, 46.96572494506836]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 6.0, 7.0, 3.0, 7.0, 13.0, 18.0, 17.0, 16.0, 26.0, 28.0, 38.0, 28.0, 39.0, 38.0, 48.0, 50.0, 59.0, 58.0, 52.0, 47.0, 45.0, 48.0, 35.0, 30.0, 34.0, 34.0, 22.0, 28.0, 22.0, 14.0, 17.0, 14.0, 10.0, 4.0, 7.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-24.49203872680664, -23.80278205871582, -23.113523483276367, -22.424266815185547, -21.735008239746094, -21.045751571655273, -20.356494903564453, -19.667236328125, -18.97797966003418, -18.28872299194336, -17.599464416503906, -16.910207748413086, -16.220951080322266, -15.531692504882812, -14.842435836791992, -14.153178215026855, -13.463920593261719, -12.774662971496582, -12.085405349731445, -11.396148681640625, -10.706891059875488, -10.017633438110352, -9.328376770019531, -8.639119148254395, -7.949861526489258, -7.260603904724121, -6.571346759796143, -5.882089614868164, -5.192831993103027, -4.503574371337891, -3.814317226409912, -3.1250600814819336, -2.435800552368164, -1.7465431690216064, -1.0572857856750488, -0.3680284023284912, 0.3212289810180664, 1.010486364364624, 1.6997437477111816, 2.38900089263916, 3.078258514404297, 3.7675158977508545, 4.456773281097412, 5.146030426025391, 5.835288047790527, 6.524545669555664, 7.213802814483643, 7.903059959411621, 8.592317581176758, 9.281575202941895, 9.970832824707031, 10.660089492797852, 11.349347114562988, 12.038604736328125, 12.727861404418945, 13.417119026184082, 14.106376647949219, 14.795634269714355, 15.484891891479492, 16.174148559570312, 16.863407135009766, 17.552663803100586, 18.241920471191406, 18.93117904663086, 19.62043571472168]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 2.0, 5.0, 12.0, 6.0, 8.0, 9.0, 13.0, 16.0, 25.0, 47.0, 53.0, 84.0, 159.0, 255.0, 592.0, 2096.0, 10522.0, 210580.0, 3868037.0, 91694.0, 7437.0, 1557.0, 487.0, 225.0, 112.0, 56.0, 53.0, 31.0, 14.0, 16.0, 14.0, 14.0, 7.0, 8.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.33203125, -5.181396484375, -5.03076171875, -4.880126953125, -4.7294921875, -4.578857421875, -4.42822265625, -4.277587890625, -4.126953125, -3.976318359375, -3.82568359375, -3.675048828125, -3.5244140625, -3.373779296875, -3.22314453125, -3.072509765625, -2.921875, -2.771240234375, -2.62060546875, -2.469970703125, -2.3193359375, -2.168701171875, -2.01806640625, -1.867431640625, -1.716796875, -1.566162109375, -1.41552734375, -1.264892578125, -1.1142578125, -0.963623046875, -0.81298828125, -0.662353515625, -0.51171875, -0.361083984375, -0.21044921875, -0.059814453125, 0.0908203125, 0.241455078125, 0.39208984375, 0.542724609375, 0.693359375, 0.843994140625, 0.99462890625, 1.145263671875, 1.2958984375, 1.446533203125, 1.59716796875, 1.747802734375, 1.8984375, 2.049072265625, 2.19970703125, 2.350341796875, 2.5009765625, 2.651611328125, 2.80224609375, 2.952880859375, 3.103515625, 3.254150390625, 3.40478515625, 3.555419921875, 3.7060546875, 3.856689453125, 4.00732421875, 4.157958984375, 4.30859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 14.0, 20.0, 22.0, 35.0, 34.0, 81.0, 53.0, 73.0, 75.0, 83.0, 67.0, 79.0, 71.0, 55.0, 51.0, 45.0, 31.0, 40.0, 18.0, 11.0, 12.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.3703460693359375, -2.311004638671875, -2.2516632080078125, -2.19232177734375, -2.1329803466796875, -2.073638916015625, -2.0142974853515625, -1.9549560546875, -1.8956146240234375, -1.836273193359375, -1.7769317626953125, -1.71759033203125, -1.6582489013671875, -1.598907470703125, -1.5395660400390625, -1.480224609375, -1.4208831787109375, -1.361541748046875, -1.3022003173828125, -1.24285888671875, -1.1835174560546875, -1.124176025390625, -1.0648345947265625, -1.0054931640625, -0.9461517333984375, -0.886810302734375, -0.8274688720703125, -0.76812744140625, -0.7087860107421875, -0.649444580078125, -0.5901031494140625, -0.53076171875, -0.4714202880859375, -0.412078857421875, -0.3527374267578125, -0.29339599609375, -0.2340545654296875, -0.174713134765625, -0.1153717041015625, -0.0560302734375, 0.0033111572265625, 0.062652587890625, 0.1219940185546875, 0.18133544921875, 0.2406768798828125, 0.300018310546875, 0.3593597412109375, 0.418701171875, 0.4780426025390625, 0.537384033203125, 0.5967254638671875, 0.65606689453125, 0.7154083251953125, 0.774749755859375, 0.8340911865234375, 0.8934326171875, 0.9527740478515625, 1.012115478515625, 1.0714569091796875, 1.13079833984375, 1.1901397705078125, 1.249481201171875, 1.3088226318359375, 1.3681640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 8.0, 16.0, 28.0, 27.0, 46.0, 62.0, 84.0, 137.0, 209.0, 340.0, 601.0, 1075.0, 2173.0, 4518.0, 11582.0, 34753.0, 157722.0, 1632510.0, 2089198.0, 198394.0, 39064.0, 12051.0, 4982.0, 2202.0, 1083.0, 551.0, 316.0, 195.0, 111.0, 79.0, 35.0, 31.0, 23.0, 15.0, 8.0, 8.0, 7.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.484375, -2.41351318359375, -2.3426513671875, -2.27178955078125, -2.200927734375, -2.13006591796875, -2.0592041015625, -1.98834228515625, -1.91748046875, -1.84661865234375, -1.7757568359375, -1.70489501953125, -1.634033203125, -1.56317138671875, -1.4923095703125, -1.42144775390625, -1.3505859375, -1.27972412109375, -1.2088623046875, -1.13800048828125, -1.067138671875, -0.99627685546875, -0.9254150390625, -0.85455322265625, -0.78369140625, -0.71282958984375, -0.6419677734375, -0.57110595703125, -0.500244140625, -0.42938232421875, -0.3585205078125, -0.28765869140625, -0.216796875, -0.14593505859375, -0.0750732421875, -0.00421142578125, 0.066650390625, 0.13751220703125, 0.2083740234375, 0.27923583984375, 0.35009765625, 0.42095947265625, 0.4918212890625, 0.56268310546875, 0.633544921875, 0.70440673828125, 0.7752685546875, 0.84613037109375, 0.9169921875, 0.98785400390625, 1.0587158203125, 1.12957763671875, 1.200439453125, 1.27130126953125, 1.3421630859375, 1.41302490234375, 1.48388671875, 1.55474853515625, 1.6256103515625, 1.69647216796875, 1.767333984375, 1.83819580078125, 1.9090576171875, 1.97991943359375, 2.05078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 14.0, 10.0, 11.0, 23.0, 26.0, 25.0, 67.0, 85.0, 151.0, 253.0, 462.0, 764.0, 843.0, 565.0, 321.0, 178.0, 92.0, 58.0, 37.0, 31.0, 15.0, 11.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-4.29296875, -4.191009521484375, -4.08905029296875, -3.987091064453125, -3.8851318359375, -3.783172607421875, -3.68121337890625, -3.579254150390625, -3.477294921875, -3.375335693359375, -3.27337646484375, -3.171417236328125, -3.0694580078125, -2.967498779296875, -2.86553955078125, -2.763580322265625, -2.66162109375, -2.559661865234375, -2.45770263671875, -2.355743408203125, -2.2537841796875, -2.151824951171875, -2.04986572265625, -1.947906494140625, -1.845947265625, -1.743988037109375, -1.64202880859375, -1.540069580078125, -1.4381103515625, -1.336151123046875, -1.23419189453125, -1.132232666015625, -1.0302734375, -0.928314208984375, -0.82635498046875, -0.724395751953125, -0.6224365234375, -0.520477294921875, -0.41851806640625, -0.316558837890625, -0.214599609375, -0.112640380859375, -0.01068115234375, 0.091278076171875, 0.1932373046875, 0.295196533203125, 0.39715576171875, 0.499114990234375, 0.60107421875, 0.703033447265625, 0.80499267578125, 0.906951904296875, 1.0089111328125, 1.110870361328125, 1.21282958984375, 1.314788818359375, 1.416748046875, 1.518707275390625, 1.62066650390625, 1.722625732421875, 1.8245849609375, 1.926544189453125, 2.02850341796875, 2.130462646484375, 2.232421875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 9.0, 10.0, 18.0, 30.0, 87.0, 138.0, 190.0, 195.0, 139.0, 75.0, 54.0, 17.0, 14.0, 8.0, 1.0, 0.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.332759857177734, -26.44536781311035, -25.5579776763916, -24.67058563232422, -23.78319549560547, -22.895803451538086, -22.008413314819336, -21.121021270751953, -20.233631134033203, -19.34623908996582, -18.45884895324707, -17.571456909179688, -16.684066772460938, -15.796674728393555, -14.909284591674805, -14.021892547607422, -13.134501457214355, -12.247110366821289, -11.359719276428223, -10.472328186035156, -9.58493709564209, -8.697546005249023, -7.810154438018799, -6.922763347625732, -6.035372257232666, -5.1479811668396, -4.260590076446533, -3.3731987476348877, -2.4858076572418213, -1.5984163284301758, -0.7110252380371094, 0.17636585235595703, 1.0637569427490234, 1.9511480331420898, 2.8385391235351562, 3.7259304523468018, 4.613321304321289, 5.500712871551514, 6.38810396194458, 7.2754950523376465, 8.162885665893555, 9.050276756286621, 9.937667846679688, 10.825058937072754, 11.71245002746582, 12.599842071533203, 13.487232208251953, 14.374624252319336, 15.262015342712402, 16.14940643310547, 17.03679847717285, 17.9241886138916, 18.811580657958984, 19.698970794677734, 20.586362838745117, 21.473752975463867, 22.36114501953125, 23.248537063598633, 24.135927200317383, 25.023319244384766, 25.910709381103516, 26.7981014251709, 27.68549156188965, 28.57288360595703, 29.46027374267578]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 4.0, 8.0, 7.0, 5.0, 17.0, 13.0, 27.0, 18.0, 25.0, 33.0, 46.0, 44.0, 44.0, 58.0, 53.0, 58.0, 56.0, 55.0, 47.0, 52.0, 58.0, 45.0, 36.0, 32.0, 35.0, 21.0, 23.0, 21.0, 12.0, 9.0, 14.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.746856689453125, -15.28621768951416, -14.825578689575195, -14.364940643310547, -13.904301643371582, -13.443662643432617, -12.983023643493652, -12.522384643554688, -12.061745643615723, -11.601106643676758, -11.140467643737793, -10.679828643798828, -10.21919059753418, -9.758551597595215, -9.29791259765625, -8.837273597717285, -8.37663459777832, -7.9159955978393555, -7.455357074737549, -6.994718074798584, -6.534079074859619, -6.0734405517578125, -5.612801551818848, -5.152162551879883, -4.691524505615234, -4.2308855056762695, -3.770246744155884, -3.309607982635498, -2.848968982696533, -2.3883302211761475, -1.9276914596557617, -1.4670524597167969, -1.006413459777832, -0.5457745790481567, -0.08513575792312622, 0.3755030632019043, 0.8361419439315796, 1.2967808246612549, 1.7574195861816406, 2.2180585861206055, 2.678697347640991, 3.139336109161377, 3.599975109100342, 4.060613632202148, 4.521252632141113, 4.981891632080078, 5.442530632019043, 5.903169631958008, 6.3638081550598145, 6.824447154998779, 7.285085678100586, 7.745724678039551, 8.206363677978516, 8.66700267791748, 9.127641677856445, 9.588279724121094, 10.048918724060059, 10.509557723999023, 10.970196723937988, 11.430835723876953, 11.891473770141602, 12.352112770080566, 12.812751770019531, 13.273390769958496, 13.734029769897461]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 14.0, 16.0, 16.0, 25.0, 45.0, 63.0, 123.0, 207.0, 312.0, 525.0, 927.0, 1750.0, 3159.0, 6521.0, 14852.0, 37671.0, 116549.0, 404884.0, 319324.0, 87377.0, 30104.0, 12276.0, 5555.0, 2829.0, 1424.0, 792.0, 489.0, 262.0, 155.0, 106.0, 64.0, 41.0, 27.0, 20.0, 10.0, 10.0, 10.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.48876953125, -2.4130859375, -2.33740234375, -2.26171875, -2.18603515625, -2.1103515625, -2.03466796875, -1.958984375, -1.88330078125, -1.8076171875, -1.73193359375, -1.65625, -1.58056640625, -1.5048828125, -1.42919921875, -1.353515625, -1.27783203125, -1.2021484375, -1.12646484375, -1.05078125, -0.97509765625, -0.8994140625, -0.82373046875, -0.748046875, -0.67236328125, -0.5966796875, -0.52099609375, -0.4453125, -0.36962890625, -0.2939453125, -0.21826171875, -0.142578125, -0.06689453125, 0.0087890625, 0.08447265625, 0.16015625, 0.23583984375, 0.3115234375, 0.38720703125, 0.462890625, 0.53857421875, 0.6142578125, 0.68994140625, 0.765625, 0.84130859375, 0.9169921875, 0.99267578125, 1.068359375, 1.14404296875, 1.2197265625, 1.29541015625, 1.37109375, 1.44677734375, 1.5224609375, 1.59814453125, 1.673828125, 1.74951171875, 1.8251953125, 1.90087890625, 1.9765625, 2.05224609375, 2.1279296875, 2.20361328125, 2.279296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 10.0, 4.0, 8.0, 10.0, 22.0, 27.0, 39.0, 22.0, 42.0, 48.0, 63.0, 59.0, 62.0, 64.0, 55.0, 78.0, 57.0, 65.0, 54.0, 39.0, 38.0, 17.0, 34.0, 25.0, 24.0, 14.0, 12.0, 3.0, 5.0, 5.0, 2.0, 3.0], "bins": [-2.3984375, -2.3465652465820312, -2.2946929931640625, -2.2428207397460938, -2.190948486328125, -2.1390762329101562, -2.0872039794921875, -2.0353317260742188, -1.98345947265625, -1.9315872192382812, -1.8797149658203125, -1.8278427124023438, -1.775970458984375, -1.7240982055664062, -1.6722259521484375, -1.6203536987304688, -1.5684814453125, -1.5166091918945312, -1.4647369384765625, -1.4128646850585938, -1.360992431640625, -1.3091201782226562, -1.2572479248046875, -1.2053756713867188, -1.15350341796875, -1.1016311645507812, -1.0497589111328125, -0.9978866577148438, -0.946014404296875, -0.8941421508789062, -0.8422698974609375, -0.7903976440429688, -0.738525390625, -0.6866531372070312, -0.6347808837890625, -0.5829086303710938, -0.531036376953125, -0.47916412353515625, -0.4272918701171875, -0.37541961669921875, -0.32354736328125, -0.27167510986328125, -0.2198028564453125, -0.16793060302734375, -0.116058349609375, -0.06418609619140625, -0.0123138427734375, 0.03955841064453125, 0.0914306640625, 0.14330291748046875, 0.1951751708984375, 0.24704742431640625, 0.298919677734375, 0.35079193115234375, 0.4026641845703125, 0.45453643798828125, 0.50640869140625, 0.5582809448242188, 0.6101531982421875, 0.6620254516601562, 0.713897705078125, 0.7657699584960938, 0.8176422119140625, 0.8695144653320312, 0.92138671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 12.0, 15.0, 17.0, 27.0, 50.0, 58.0, 97.0, 131.0, 213.0, 411.0, 723.0, 1501.0, 4118.0, 14904.0, 87595.0, 742136.0, 164428.0, 22563.0, 5546.0, 1943.0, 887.0, 432.0, 275.0, 149.0, 100.0, 75.0, 49.0, 26.0, 18.0, 12.0, 12.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.5809326171875, -4.431396484375, -4.2818603515625, -4.13232421875, -3.9827880859375, -3.833251953125, -3.6837158203125, -3.5341796875, -3.3846435546875, -3.235107421875, -3.0855712890625, -2.93603515625, -2.7864990234375, -2.636962890625, -2.4874267578125, -2.337890625, -2.1883544921875, -2.038818359375, -1.8892822265625, -1.73974609375, -1.5902099609375, -1.440673828125, -1.2911376953125, -1.1416015625, -0.9920654296875, -0.842529296875, -0.6929931640625, -0.54345703125, -0.3939208984375, -0.244384765625, -0.0948486328125, 0.0546875, 0.2042236328125, 0.353759765625, 0.5032958984375, 0.65283203125, 0.8023681640625, 0.951904296875, 1.1014404296875, 1.2509765625, 1.4005126953125, 1.550048828125, 1.6995849609375, 1.84912109375, 1.9986572265625, 2.148193359375, 2.2977294921875, 2.447265625, 2.5968017578125, 2.746337890625, 2.8958740234375, 3.04541015625, 3.1949462890625, 3.344482421875, 3.4940185546875, 3.6435546875, 3.7930908203125, 3.942626953125, 4.0921630859375, 4.24169921875, 4.3912353515625, 4.540771484375, 4.6903076171875, 4.83984375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 7.0, 3.0, 4.0, 5.0, 6.0, 11.0, 16.0, 20.0, 24.0, 16.0, 25.0, 24.0, 34.0, 40.0, 40.0, 34.0, 40.0, 53.0, 47.0, 41.0, 61.0, 56.0, 43.0, 60.0, 54.0, 42.0, 36.0, 31.0, 24.0, 27.0, 19.0, 19.0, 7.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.21435546875, -4.0498046875, -3.88525390625, -3.720703125, -3.55615234375, -3.3916015625, -3.22705078125, -3.0625, -2.89794921875, -2.7333984375, -2.56884765625, -2.404296875, -2.23974609375, -2.0751953125, -1.91064453125, -1.74609375, -1.58154296875, -1.4169921875, -1.25244140625, -1.087890625, -0.92333984375, -0.7587890625, -0.59423828125, -0.4296875, -0.26513671875, -0.1005859375, 0.06396484375, 0.228515625, 0.39306640625, 0.5576171875, 0.72216796875, 0.88671875, 1.05126953125, 1.2158203125, 1.38037109375, 1.544921875, 1.70947265625, 1.8740234375, 2.03857421875, 2.203125, 2.36767578125, 2.5322265625, 2.69677734375, 2.861328125, 3.02587890625, 3.1904296875, 3.35498046875, 3.51953125, 3.68408203125, 3.8486328125, 4.01318359375, 4.177734375, 4.34228515625, 4.5068359375, 4.67138671875, 4.8359375, 5.00048828125, 5.1650390625, 5.32958984375, 5.494140625, 5.65869140625, 5.8232421875, 5.98779296875, 6.15234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 9.0, 6.0, 14.0, 19.0, 31.0, 53.0, 72.0, 152.0, 337.0, 750.0, 2228.0, 10194.0, 231033.0, 781011.0, 17689.0, 3124.0, 1063.0, 379.0, 165.0, 92.0, 49.0, 33.0, 19.0, 8.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.3228759765625, -4.169189453125, -4.0155029296875, -3.86181640625, -3.7081298828125, -3.554443359375, -3.4007568359375, -3.2470703125, -3.0933837890625, -2.939697265625, -2.7860107421875, -2.63232421875, -2.4786376953125, -2.324951171875, -2.1712646484375, -2.017578125, -1.8638916015625, -1.710205078125, -1.5565185546875, -1.40283203125, -1.2491455078125, -1.095458984375, -0.9417724609375, -0.7880859375, -0.6343994140625, -0.480712890625, -0.3270263671875, -0.17333984375, -0.0196533203125, 0.134033203125, 0.2877197265625, 0.44140625, 0.5950927734375, 0.748779296875, 0.9024658203125, 1.05615234375, 1.2098388671875, 1.363525390625, 1.5172119140625, 1.6708984375, 1.8245849609375, 1.978271484375, 2.1319580078125, 2.28564453125, 2.4393310546875, 2.593017578125, 2.7467041015625, 2.900390625, 3.0540771484375, 3.207763671875, 3.3614501953125, 3.51513671875, 3.6688232421875, 3.822509765625, 3.9761962890625, 4.1298828125, 4.2835693359375, 4.437255859375, 4.5909423828125, 4.74462890625, 4.8983154296875, 5.052001953125, 5.2056884765625, 5.359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 5.0, 7.0, 9.0, 9.0, 17.0, 14.0, 29.0, 40.0, 51.0, 111.0, 142.0, 212.0, 136.0, 70.0, 41.0, 31.0, 19.0, 11.0, 8.0, 8.0, 5.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000698089599609375, -0.0006788596510887146, -0.0006596297025680542, -0.0006403997540473938, -0.0006211698055267334, -0.000601939857006073, -0.0005827099084854126, -0.0005634799599647522, -0.0005442500114440918, -0.0005250200629234314, -0.000505790114402771, -0.0004865601658821106, -0.0004673302173614502, -0.0004481002688407898, -0.0004288703203201294, -0.000409640371799469, -0.0003904104232788086, -0.0003711804747581482, -0.0003519505262374878, -0.0003327205777168274, -0.000313490629196167, -0.0002942606806755066, -0.0002750307321548462, -0.0002558007836341858, -0.0002365708351135254, -0.000217340886592865, -0.0001981109380722046, -0.0001788809895515442, -0.0001596510410308838, -0.0001404210925102234, -0.00012119114398956299, -0.00010196119546890259, -8.273124694824219e-05, -6.350129842758179e-05, -4.427134990692139e-05, -2.5041401386260986e-05, -5.811452865600586e-06, 1.3418495655059814e-05, 3.2648444175720215e-05, 5.1878392696380615e-05, 7.110834121704102e-05, 9.033828973770142e-05, 0.00010956823825836182, 0.00012879818677902222, 0.00014802813529968262, 0.00016725808382034302, 0.00018648803234100342, 0.00020571798086166382, 0.00022494792938232422, 0.0002441778779029846, 0.000263407826423645, 0.0002826377749443054, 0.0003018677234649658, 0.0003210976719856262, 0.0003403276205062866, 0.000359557569026947, 0.0003787875175476074, 0.0003980174660682678, 0.0004172474145889282, 0.0004364773631095886, 0.000455707311630249, 0.0004749372601509094, 0.0004941672086715698, 0.0005133971571922302, 0.0005326271057128906]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 8.0, 5.0, 19.0, 11.0, 24.0, 38.0, 55.0, 107.0, 203.0, 372.0, 991.0, 2306.0, 7012.0, 34770.0, 638855.0, 329464.0, 25043.0, 5662.0, 1985.0, 796.0, 387.0, 172.0, 108.0, 39.0, 33.0, 18.0, 13.0, 8.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.85546875, -2.7659912109375, -2.676513671875, -2.5870361328125, -2.49755859375, -2.4080810546875, -2.318603515625, -2.2291259765625, -2.1396484375, -2.0501708984375, -1.960693359375, -1.8712158203125, -1.78173828125, -1.6922607421875, -1.602783203125, -1.5133056640625, -1.423828125, -1.3343505859375, -1.244873046875, -1.1553955078125, -1.06591796875, -0.9764404296875, -0.886962890625, -0.7974853515625, -0.7080078125, -0.6185302734375, -0.529052734375, -0.4395751953125, -0.35009765625, -0.2606201171875, -0.171142578125, -0.0816650390625, 0.0078125, 0.0972900390625, 0.186767578125, 0.2762451171875, 0.36572265625, 0.4552001953125, 0.544677734375, 0.6341552734375, 0.7236328125, 0.8131103515625, 0.902587890625, 0.9920654296875, 1.08154296875, 1.1710205078125, 1.260498046875, 1.3499755859375, 1.439453125, 1.5289306640625, 1.618408203125, 1.7078857421875, 1.79736328125, 1.8868408203125, 1.976318359375, 2.0657958984375, 2.1552734375, 2.2447509765625, 2.334228515625, 2.4237060546875, 2.51318359375, 2.6026611328125, 2.692138671875, 2.7816162109375, 2.87109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 15.0, 19.0, 17.0, 31.0, 38.0, 49.0, 47.0, 72.0, 78.0, 104.0, 104.0, 95.0, 67.0, 57.0, 35.0, 23.0, 22.0, 10.0, 18.0, 13.0, 12.0, 5.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7841796875, -1.7313079833984375, -1.678436279296875, -1.6255645751953125, -1.57269287109375, -1.5198211669921875, -1.466949462890625, -1.4140777587890625, -1.3612060546875, -1.3083343505859375, -1.255462646484375, -1.2025909423828125, -1.14971923828125, -1.0968475341796875, -1.043975830078125, -0.9911041259765625, -0.938232421875, -0.8853607177734375, -0.832489013671875, -0.7796173095703125, -0.72674560546875, -0.6738739013671875, -0.621002197265625, -0.5681304931640625, -0.5152587890625, -0.4623870849609375, -0.409515380859375, -0.3566436767578125, -0.30377197265625, -0.2509002685546875, -0.198028564453125, -0.1451568603515625, -0.09228515625, -0.0394134521484375, 0.013458251953125, 0.0663299560546875, 0.11920166015625, 0.1720733642578125, 0.224945068359375, 0.2778167724609375, 0.3306884765625, 0.3835601806640625, 0.436431884765625, 0.4893035888671875, 0.54217529296875, 0.5950469970703125, 0.647918701171875, 0.7007904052734375, 0.753662109375, 0.8065338134765625, 0.859405517578125, 0.9122772216796875, 0.96514892578125, 1.0180206298828125, 1.070892333984375, 1.1237640380859375, 1.1766357421875, 1.2295074462890625, 1.282379150390625, 1.3352508544921875, 1.38812255859375, 1.4409942626953125, 1.493865966796875, 1.5467376708984375, 1.599609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 19.0, 52.0, 100.0, 193.0, 304.0, 186.0, 77.0, 32.0, 18.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.90874671936035, -22.266468048095703, -20.624187469482422, -18.981908798217773, -17.339630126953125, -15.697351455688477, -14.055071830749512, -12.412792205810547, -10.770513534545898, -9.12823486328125, -7.485955238342285, -5.8436760902404785, -4.201396942138672, -2.5591182708740234, -0.9168386459350586, 0.7254409790039062, 2.3677196502685547, 4.009998798370361, 5.652277946472168, 7.294557094573975, 8.936836242675781, 10.57911491394043, 12.221394538879395, 13.86367416381836, 15.505952835083008, 17.148231506347656, 18.790512084960938, 20.432790756225586, 22.075069427490234, 23.717348098754883, 25.35962677001953, 27.001907348632812, 28.644187927246094, 30.286466598510742, 31.92874526977539, 33.57102584838867, 35.21330261230469, 36.85558319091797, 38.49786376953125, 40.14014434814453, 41.78242111206055, 43.42470169067383, 45.066978454589844, 46.709259033203125, 48.351539611816406, 49.99381637573242, 51.6360969543457, 53.27837371826172, 54.920654296875, 56.56293487548828, 58.2052116394043, 59.84749221801758, 61.489768981933594, 63.132049560546875, 64.77433013916016, 66.41661071777344, 68.05888366699219, 69.70116424560547, 71.34344482421875, 72.9857177734375, 74.62799835205078, 76.27027893066406, 77.91255950927734, 79.55484008789062, 81.1971206665039]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 11.0, 11.0, 8.0, 19.0, 23.0, 25.0, 31.0, 34.0, 47.0, 43.0, 57.0, 63.0, 57.0, 68.0, 69.0, 54.0, 61.0, 39.0, 47.0, 32.0, 25.0, 33.0, 33.0, 20.0, 20.0, 13.0, 9.0, 9.0, 7.0, 11.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.260976791381836, -21.49321746826172, -20.725460052490234, -19.957700729370117, -19.18994140625, -18.422183990478516, -17.6544246673584, -16.88666534423828, -16.118907928466797, -15.351149559020996, -14.583391189575195, -13.815631866455078, -13.047873497009277, -12.280115127563477, -11.51235580444336, -10.744597434997559, -9.976839065551758, -9.209080696105957, -8.441322326660156, -7.673563003540039, -6.905804634094238, -6.1380462646484375, -5.3702874183654785, -4.6025285720825195, -3.8347702026367188, -3.067011594772339, -2.299252986907959, -1.531494379043579, -0.7637357711791992, 0.004022836685180664, 0.7717814445495605, 1.5395402908325195, 2.3072986602783203, 3.0750572681427, 3.84281587600708, 4.610574722290039, 5.37833309173584, 6.146091461181641, 6.9138503074646, 7.681609153747559, 8.44936752319336, 9.21712589263916, 9.984884262084961, 10.752643585205078, 11.520401954650879, 12.28816032409668, 13.055919647216797, 13.823678016662598, 14.591436386108398, 15.3591947555542, 16.126953125, 16.894712448120117, 17.662471771240234, 18.43022918701172, 19.197988510131836, 19.965747833251953, 20.733505249023438, 21.501264572143555, 22.26902198791504, 23.036781311035156, 23.80453872680664, 24.572298049926758, 25.340057373046875, 26.10781478881836, 26.875574111938477]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 13.0, 23.0, 18.0, 34.0, 50.0, 92.0, 156.0, 257.0, 566.0, 1097.0, 2463.0, 6469.0, 18881.0, 78682.0, 593475.0, 2690571.0, 681418.0, 87548.0, 20427.0, 6740.0, 2702.0, 1147.0, 637.0, 312.0, 173.0, 108.0, 59.0, 35.0, 29.0, 26.0, 13.0, 13.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.810546875, -1.749237060546875, -1.68792724609375, -1.626617431640625, -1.5653076171875, -1.503997802734375, -1.44268798828125, -1.381378173828125, -1.320068359375, -1.258758544921875, -1.19744873046875, -1.136138916015625, -1.0748291015625, -1.013519287109375, -0.95220947265625, -0.890899658203125, -0.82958984375, -0.768280029296875, -0.70697021484375, -0.645660400390625, -0.5843505859375, -0.523040771484375, -0.46173095703125, -0.400421142578125, -0.339111328125, -0.277801513671875, -0.21649169921875, -0.155181884765625, -0.0938720703125, -0.032562255859375, 0.02874755859375, 0.090057373046875, 0.1513671875, 0.212677001953125, 0.27398681640625, 0.335296630859375, 0.3966064453125, 0.457916259765625, 0.51922607421875, 0.580535888671875, 0.641845703125, 0.703155517578125, 0.76446533203125, 0.825775146484375, 0.8870849609375, 0.948394775390625, 1.00970458984375, 1.071014404296875, 1.13232421875, 1.193634033203125, 1.25494384765625, 1.316253662109375, 1.3775634765625, 1.438873291015625, 1.50018310546875, 1.561492919921875, 1.622802734375, 1.684112548828125, 1.74542236328125, 1.806732177734375, 1.8680419921875, 1.929351806640625, 1.99066162109375, 2.051971435546875, 2.11328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 14.0, 12.0, 28.0, 55.0, 75.0, 88.0, 95.0, 101.0, 117.0, 127.0, 96.0, 73.0, 50.0, 35.0, 17.0, 15.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.61065673828125, -2.5240478515625, -2.43743896484375, -2.350830078125, -2.26422119140625, -2.1776123046875, -2.09100341796875, -2.00439453125, -1.91778564453125, -1.8311767578125, -1.74456787109375, -1.657958984375, -1.57135009765625, -1.4847412109375, -1.39813232421875, -1.3115234375, -1.22491455078125, -1.1383056640625, -1.05169677734375, -0.965087890625, -0.87847900390625, -0.7918701171875, -0.70526123046875, -0.61865234375, -0.53204345703125, -0.4454345703125, -0.35882568359375, -0.272216796875, -0.18560791015625, -0.0989990234375, -0.01239013671875, 0.07421875, 0.16082763671875, 0.2474365234375, 0.33404541015625, 0.420654296875, 0.50726318359375, 0.5938720703125, 0.68048095703125, 0.76708984375, 0.85369873046875, 0.9403076171875, 1.02691650390625, 1.113525390625, 1.20013427734375, 1.2867431640625, 1.37335205078125, 1.4599609375, 1.54656982421875, 1.6331787109375, 1.71978759765625, 1.806396484375, 1.89300537109375, 1.9796142578125, 2.06622314453125, 2.15283203125, 2.23944091796875, 2.3260498046875, 2.41265869140625, 2.499267578125, 2.58587646484375, 2.6724853515625, 2.75909423828125, 2.845703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 9.0, 9.0, 22.0, 27.0, 48.0, 54.0, 91.0, 128.0, 227.0, 341.0, 613.0, 1343.0, 3356.0, 11596.0, 57492.0, 620269.0, 3204267.0, 252239.0, 30461.0, 7006.0, 2408.0, 1036.0, 542.0, 276.0, 179.0, 84.0, 38.0, 32.0, 31.0, 10.0, 8.0, 11.0, 11.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.994140625, -3.88720703125, -3.7802734375, -3.67333984375, -3.56640625, -3.45947265625, -3.3525390625, -3.24560546875, -3.138671875, -3.03173828125, -2.9248046875, -2.81787109375, -2.7109375, -2.60400390625, -2.4970703125, -2.39013671875, -2.283203125, -2.17626953125, -2.0693359375, -1.96240234375, -1.85546875, -1.74853515625, -1.6416015625, -1.53466796875, -1.427734375, -1.32080078125, -1.2138671875, -1.10693359375, -1.0, -0.89306640625, -0.7861328125, -0.67919921875, -0.572265625, -0.46533203125, -0.3583984375, -0.25146484375, -0.14453125, -0.03759765625, 0.0693359375, 0.17626953125, 0.283203125, 0.39013671875, 0.4970703125, 0.60400390625, 0.7109375, 0.81787109375, 0.9248046875, 1.03173828125, 1.138671875, 1.24560546875, 1.3525390625, 1.45947265625, 1.56640625, 1.67333984375, 1.7802734375, 1.88720703125, 1.994140625, 2.10107421875, 2.2080078125, 2.31494140625, 2.421875, 2.52880859375, 2.6357421875, 2.74267578125, 2.849609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 11.0, 11.0, 18.0, 29.0, 39.0, 65.0, 79.0, 152.0, 248.0, 444.0, 756.0, 864.0, 575.0, 326.0, 187.0, 99.0, 53.0, 30.0, 33.0, 13.0, 10.0, 15.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.15234375, -5.013916015625, -4.87548828125, -4.737060546875, -4.5986328125, -4.460205078125, -4.32177734375, -4.183349609375, -4.044921875, -3.906494140625, -3.76806640625, -3.629638671875, -3.4912109375, -3.352783203125, -3.21435546875, -3.075927734375, -2.9375, -2.799072265625, -2.66064453125, -2.522216796875, -2.3837890625, -2.245361328125, -2.10693359375, -1.968505859375, -1.830078125, -1.691650390625, -1.55322265625, -1.414794921875, -1.2763671875, -1.137939453125, -0.99951171875, -0.861083984375, -0.72265625, -0.584228515625, -0.44580078125, -0.307373046875, -0.1689453125, -0.030517578125, 0.10791015625, 0.246337890625, 0.384765625, 0.523193359375, 0.66162109375, 0.800048828125, 0.9384765625, 1.076904296875, 1.21533203125, 1.353759765625, 1.4921875, 1.630615234375, 1.76904296875, 1.907470703125, 2.0458984375, 2.184326171875, 2.32275390625, 2.461181640625, 2.599609375, 2.738037109375, 2.87646484375, 3.014892578125, 3.1533203125, 3.291748046875, 3.43017578125, 3.568603515625, 3.70703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 9.0, 17.0, 26.0, 75.0, 167.0, 247.0, 252.0, 124.0, 45.0, 14.0, 11.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.46420669555664, -44.862308502197266, -43.26041030883789, -41.65851593017578, -40.056617736816406, -38.45471954345703, -36.852821350097656, -35.25092315673828, -33.649024963378906, -32.04712677001953, -30.44523048400879, -28.843332290649414, -27.241436004638672, -25.639537811279297, -24.037639617919922, -22.435741424560547, -20.833847045898438, -19.231948852539062, -17.63005256652832, -16.028154373168945, -14.426257133483887, -12.824359893798828, -11.222461700439453, -9.620564460754395, -8.018667221069336, -6.416769981384277, -4.8148722648620605, -3.2129745483398438, -1.6110773086547852, -0.009180068969726562, 1.5927181243896484, 3.194615364074707, 4.796516418457031, 6.39841365814209, 8.000310897827148, 9.602209091186523, 11.204106330871582, 12.80600357055664, 14.407901763916016, 16.00979995727539, 17.611696243286133, 19.213594436645508, 20.81549072265625, 22.417388916015625, 24.019287109375, 25.621183395385742, 27.223081588745117, 28.82497787475586, 30.426876068115234, 32.02877426147461, 33.630672454833984, 35.232566833496094, 36.83446502685547, 38.436363220214844, 40.03826141357422, 41.640159606933594, 43.24205780029297, 44.843955993652344, 46.44585418701172, 48.047752380371094, 49.6496467590332, 51.25154495239258, 52.85344314575195, 54.45534133911133, 56.05723571777344]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 17.0, 10.0, 15.0, 32.0, 44.0, 49.0, 59.0, 65.0, 64.0, 72.0, 78.0, 85.0, 72.0, 59.0, 46.0, 47.0, 45.0, 34.0, 27.0, 20.0, 12.0, 13.0, 6.0, 9.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.02616310119629, -18.256975173950195, -17.48778533935547, -16.718597412109375, -15.949407577514648, -15.180219650268555, -14.411030769348145, -13.641841888427734, -12.872653007507324, -12.103464126586914, -11.334275245666504, -10.565086364746094, -9.7958984375, -9.026708602905273, -8.25752067565918, -7.4883317947387695, -6.719142913818359, -5.949954032897949, -5.180765151977539, -4.411576747894287, -3.642387866973877, -2.873198986053467, -2.104010581970215, -1.3348217010498047, -0.5656328201293945, 0.20355594158172607, 0.9727447032928467, 1.7419333457946777, 2.511122226715088, 3.280311107635498, 4.04949951171875, 4.81868839263916, 5.587879180908203, 6.357068061828613, 7.126256942749023, 7.895445346832275, 8.664634704589844, 9.433822631835938, 10.203011512756348, 10.972200393676758, 11.741389274597168, 12.510578155517578, 13.279767036437988, 14.048955917358398, 14.818143844604492, 15.587333679199219, 16.356521606445312, 17.125709533691406, 17.894899368286133, 18.664087295532227, 19.433277130126953, 20.202465057373047, 20.971654891967773, 21.740842819213867, 22.510032653808594, 23.279220581054688, 24.04840850830078, 24.817596435546875, 25.5867862701416, 26.355974197387695, 27.125164031982422, 27.894351959228516, 28.66353988647461, 29.432729721069336, 30.201919555664062]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 5.0, 1.0, 7.0, 8.0, 20.0, 29.0, 41.0, 62.0, 91.0, 157.0, 234.0, 380.0, 655.0, 1142.0, 2087.0, 4125.0, 8527.0, 19085.0, 45018.0, 113229.0, 293741.0, 331600.0, 133891.0, 52440.0, 22137.0, 9636.0, 4750.0, 2330.0, 1321.0, 721.0, 437.0, 238.0, 136.0, 98.0, 48.0, 42.0, 21.0, 25.0, 10.0, 16.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.0330810546875, -1.960693359375, -1.8883056640625, -1.81591796875, -1.7435302734375, -1.671142578125, -1.5987548828125, -1.5263671875, -1.4539794921875, -1.381591796875, -1.3092041015625, -1.23681640625, -1.1644287109375, -1.092041015625, -1.0196533203125, -0.947265625, -0.8748779296875, -0.802490234375, -0.7301025390625, -0.65771484375, -0.5853271484375, -0.512939453125, -0.4405517578125, -0.3681640625, -0.2957763671875, -0.223388671875, -0.1510009765625, -0.07861328125, -0.0062255859375, 0.066162109375, 0.1385498046875, 0.2109375, 0.2833251953125, 0.355712890625, 0.4281005859375, 0.50048828125, 0.5728759765625, 0.645263671875, 0.7176513671875, 0.7900390625, 0.8624267578125, 0.934814453125, 1.0072021484375, 1.07958984375, 1.1519775390625, 1.224365234375, 1.2967529296875, 1.369140625, 1.4415283203125, 1.513916015625, 1.5863037109375, 1.65869140625, 1.7310791015625, 1.803466796875, 1.8758544921875, 1.9482421875, 2.0206298828125, 2.093017578125, 2.1654052734375, 2.23779296875, 2.3101806640625, 2.382568359375, 2.4549560546875, 2.52734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 10.0, 14.0, 11.0, 26.0, 28.0, 37.0, 49.0, 42.0, 63.0, 69.0, 66.0, 62.0, 65.0, 57.0, 66.0, 67.0, 47.0, 50.0, 42.0, 29.0, 27.0, 25.0, 14.0, 10.0, 11.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.9736328125, -1.920806884765625, -1.86798095703125, -1.815155029296875, -1.7623291015625, -1.709503173828125, -1.65667724609375, -1.603851318359375, -1.551025390625, -1.498199462890625, -1.44537353515625, -1.392547607421875, -1.3397216796875, -1.286895751953125, -1.23406982421875, -1.181243896484375, -1.12841796875, -1.075592041015625, -1.02276611328125, -0.969940185546875, -0.9171142578125, -0.864288330078125, -0.81146240234375, -0.758636474609375, -0.705810546875, -0.652984619140625, -0.60015869140625, -0.547332763671875, -0.4945068359375, -0.441680908203125, -0.38885498046875, -0.336029052734375, -0.283203125, -0.230377197265625, -0.17755126953125, -0.124725341796875, -0.0718994140625, -0.019073486328125, 0.03375244140625, 0.086578369140625, 0.139404296875, 0.192230224609375, 0.24505615234375, 0.297882080078125, 0.3507080078125, 0.403533935546875, 0.45635986328125, 0.509185791015625, 0.56201171875, 0.614837646484375, 0.66766357421875, 0.720489501953125, 0.7733154296875, 0.826141357421875, 0.87896728515625, 0.931793212890625, 0.984619140625, 1.037445068359375, 1.09027099609375, 1.143096923828125, 1.1959228515625, 1.248748779296875, 1.30157470703125, 1.354400634765625, 1.4072265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 5.0, 10.0, 4.0, 13.0, 14.0, 22.0, 19.0, 37.0, 45.0, 77.0, 116.0, 158.0, 208.0, 299.0, 451.0, 726.0, 1320.0, 2488.0, 5803.0, 21527.0, 147637.0, 736722.0, 103696.0, 16847.0, 4986.0, 2142.0, 1167.0, 623.0, 456.0, 262.0, 199.0, 131.0, 96.0, 64.0, 48.0, 26.0, 31.0, 18.0, 16.0, 9.0, 11.0, 5.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17578125, -5.01104736328125, -4.8463134765625, -4.68157958984375, -4.516845703125, -4.35211181640625, -4.1873779296875, -4.02264404296875, -3.85791015625, -3.69317626953125, -3.5284423828125, -3.36370849609375, -3.198974609375, -3.03424072265625, -2.8695068359375, -2.70477294921875, -2.5400390625, -2.37530517578125, -2.2105712890625, -2.04583740234375, -1.881103515625, -1.71636962890625, -1.5516357421875, -1.38690185546875, -1.22216796875, -1.05743408203125, -0.8927001953125, -0.72796630859375, -0.563232421875, -0.39849853515625, -0.2337646484375, -0.06903076171875, 0.095703125, 0.26043701171875, 0.4251708984375, 0.58990478515625, 0.754638671875, 0.91937255859375, 1.0841064453125, 1.24884033203125, 1.41357421875, 1.57830810546875, 1.7430419921875, 1.90777587890625, 2.072509765625, 2.23724365234375, 2.4019775390625, 2.56671142578125, 2.7314453125, 2.89617919921875, 3.0609130859375, 3.22564697265625, 3.390380859375, 3.55511474609375, 3.7198486328125, 3.88458251953125, 4.04931640625, 4.21405029296875, 4.3787841796875, 4.54351806640625, 4.708251953125, 4.87298583984375, 5.0377197265625, 5.20245361328125, 5.3671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 3.0, 9.0, 11.0, 9.0, 15.0, 17.0, 18.0, 31.0, 25.0, 41.0, 45.0, 48.0, 43.0, 55.0, 73.0, 67.0, 61.0, 51.0, 66.0, 40.0, 50.0, 47.0, 34.0, 34.0, 17.0, 21.0, 9.0, 16.0, 17.0, 7.0, 2.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.78741455078125, -6.5552978515625, -6.32318115234375, -6.091064453125, -5.85894775390625, -5.6268310546875, -5.39471435546875, -5.16259765625, -4.93048095703125, -4.6983642578125, -4.46624755859375, -4.234130859375, -4.00201416015625, -3.7698974609375, -3.53778076171875, -3.3056640625, -3.07354736328125, -2.8414306640625, -2.60931396484375, -2.377197265625, -2.14508056640625, -1.9129638671875, -1.68084716796875, -1.44873046875, -1.21661376953125, -0.9844970703125, -0.75238037109375, -0.520263671875, -0.28814697265625, -0.0560302734375, 0.17608642578125, 0.408203125, 0.64031982421875, 0.8724365234375, 1.10455322265625, 1.336669921875, 1.56878662109375, 1.8009033203125, 2.03302001953125, 2.26513671875, 2.49725341796875, 2.7293701171875, 2.96148681640625, 3.193603515625, 3.42572021484375, 3.6578369140625, 3.88995361328125, 4.1220703125, 4.35418701171875, 4.5863037109375, 4.81842041015625, 5.050537109375, 5.28265380859375, 5.5147705078125, 5.74688720703125, 5.97900390625, 6.21112060546875, 6.4432373046875, 6.67535400390625, 6.907470703125, 7.13958740234375, 7.3717041015625, 7.60382080078125, 7.8359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 11.0, 8.0, 19.0, 19.0, 34.0, 51.0, 96.0, 116.0, 215.0, 438.0, 849.0, 2317.0, 7304.0, 37104.0, 341700.0, 598301.0, 46760.0, 8570.0, 2530.0, 1044.0, 457.0, 244.0, 136.0, 82.0, 55.0, 32.0, 18.0, 11.0, 10.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.9501953125, -1.869140625, -1.7880859375, -1.70703125, -1.6259765625, -1.544921875, -1.4638671875, -1.3828125, -1.3017578125, -1.220703125, -1.1396484375, -1.05859375, -0.9775390625, -0.896484375, -0.8154296875, -0.734375, -0.6533203125, -0.572265625, -0.4912109375, -0.41015625, -0.3291015625, -0.248046875, -0.1669921875, -0.0859375, -0.0048828125, 0.076171875, 0.1572265625, 0.23828125, 0.3193359375, 0.400390625, 0.4814453125, 0.5625, 0.6435546875, 0.724609375, 0.8056640625, 0.88671875, 0.9677734375, 1.048828125, 1.1298828125, 1.2109375, 1.2919921875, 1.373046875, 1.4541015625, 1.53515625, 1.6162109375, 1.697265625, 1.7783203125, 1.859375, 1.9404296875, 2.021484375, 2.1025390625, 2.18359375, 2.2646484375, 2.345703125, 2.4267578125, 2.5078125, 2.5888671875, 2.669921875, 2.7509765625, 2.83203125, 2.9130859375, 2.994140625, 3.0751953125, 3.15625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 9.0, 11.0, 7.0, 13.0, 15.0, 13.0, 21.0, 26.0, 24.0, 37.0, 29.0, 48.0, 78.0, 103.0, 129.0, 95.0, 65.0, 40.0, 38.0, 31.0, 29.0, 19.0, 23.0, 17.0, 17.0, 11.0, 5.0, 4.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004513263702392578, -0.0004369206726551056, -0.00042251497507095337, -0.00040810927748680115, -0.0003937035799026489, -0.0003792978823184967, -0.0003648921847343445, -0.00035048648715019226, -0.00033608078956604004, -0.0003216750919818878, -0.0003072693943977356, -0.0002928636968135834, -0.00027845799922943115, -0.00026405230164527893, -0.0002496466040611267, -0.0002352409064769745, -0.00022083520889282227, -0.00020642951130867004, -0.00019202381372451782, -0.0001776181161403656, -0.00016321241855621338, -0.00014880672097206116, -0.00013440102338790894, -0.00011999532580375671, -0.00010558962821960449, -9.118393063545227e-05, -7.677823305130005e-05, -6.237253546714783e-05, -4.7966837882995605e-05, -3.3561140298843384e-05, -1.9155442714691162e-05, -4.7497451305389404e-06, 9.655952453613281e-06, 2.4061650037765503e-05, 3.8467347621917725e-05, 5.2873045206069946e-05, 6.727874279022217e-05, 8.168444037437439e-05, 9.609013795852661e-05, 0.00011049583554267883, 0.00012490153312683105, 0.00013930723071098328, 0.0001537129282951355, 0.00016811862587928772, 0.00018252432346343994, 0.00019693002104759216, 0.00021133571863174438, 0.0002257414162158966, 0.00024014711380004883, 0.00025455281138420105, 0.00026895850896835327, 0.0002833642065525055, 0.0002977699041366577, 0.00031217560172080994, 0.00032658129930496216, 0.0003409869968891144, 0.0003553926944732666, 0.0003697983920574188, 0.00038420408964157104, 0.00039860978722572327, 0.0004130154848098755, 0.0004274211823940277, 0.00044182687997817993, 0.00045623257756233215, 0.0004706382751464844]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 13.0, 15.0, 17.0, 40.0, 58.0, 100.0, 151.0, 266.0, 393.0, 711.0, 1416.0, 3319.0, 10211.0, 50350.0, 632787.0, 300149.0, 34901.0, 8081.0, 2685.0, 1191.0, 679.0, 390.0, 216.0, 116.0, 102.0, 77.0, 42.0, 24.0, 9.0, 7.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.283203125, -2.204193115234375, -2.12518310546875, -2.046173095703125, -1.9671630859375, -1.888153076171875, -1.80914306640625, -1.730133056640625, -1.651123046875, -1.572113037109375, -1.49310302734375, -1.414093017578125, -1.3350830078125, -1.256072998046875, -1.17706298828125, -1.098052978515625, -1.01904296875, -0.940032958984375, -0.86102294921875, -0.782012939453125, -0.7030029296875, -0.623992919921875, -0.54498291015625, -0.465972900390625, -0.386962890625, -0.307952880859375, -0.22894287109375, -0.149932861328125, -0.0709228515625, 0.008087158203125, 0.08709716796875, 0.166107177734375, 0.2451171875, 0.324127197265625, 0.40313720703125, 0.482147216796875, 0.5611572265625, 0.640167236328125, 0.71917724609375, 0.798187255859375, 0.877197265625, 0.956207275390625, 1.03521728515625, 1.114227294921875, 1.1932373046875, 1.272247314453125, 1.35125732421875, 1.430267333984375, 1.50927734375, 1.588287353515625, 1.66729736328125, 1.746307373046875, 1.8253173828125, 1.904327392578125, 1.98333740234375, 2.062347412109375, 2.141357421875, 2.220367431640625, 2.29937744140625, 2.378387451171875, 2.4573974609375, 2.536407470703125, 2.61541748046875, 2.694427490234375, 2.7734375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 3.0, 9.0, 6.0, 8.0, 10.0, 6.0, 7.0, 12.0, 21.0, 17.0, 22.0, 22.0, 34.0, 37.0, 43.0, 56.0, 60.0, 66.0, 73.0, 75.0, 62.0, 55.0, 56.0, 43.0, 40.0, 32.0, 19.0, 24.0, 14.0, 14.0, 5.0, 3.0, 8.0, 3.0, 6.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.751953125, -1.69964599609375, -1.6473388671875, -1.59503173828125, -1.542724609375, -1.49041748046875, -1.4381103515625, -1.38580322265625, -1.33349609375, -1.28118896484375, -1.2288818359375, -1.17657470703125, -1.124267578125, -1.07196044921875, -1.0196533203125, -0.96734619140625, -0.9150390625, -0.86273193359375, -0.8104248046875, -0.75811767578125, -0.705810546875, -0.65350341796875, -0.6011962890625, -0.54888916015625, -0.49658203125, -0.44427490234375, -0.3919677734375, -0.33966064453125, -0.287353515625, -0.23504638671875, -0.1827392578125, -0.13043212890625, -0.078125, -0.02581787109375, 0.0264892578125, 0.07879638671875, 0.131103515625, 0.18341064453125, 0.2357177734375, 0.28802490234375, 0.34033203125, 0.39263916015625, 0.4449462890625, 0.49725341796875, 0.549560546875, 0.60186767578125, 0.6541748046875, 0.70648193359375, 0.7587890625, 0.81109619140625, 0.8634033203125, 0.91571044921875, 0.968017578125, 1.02032470703125, 1.0726318359375, 1.12493896484375, 1.17724609375, 1.22955322265625, 1.2818603515625, 1.33416748046875, 1.386474609375, 1.43878173828125, 1.4910888671875, 1.54339599609375, 1.595703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 3.0, 7.0, 29.0, 65.0, 131.0, 259.0, 253.0, 111.0, 66.0, 29.0, 13.0, 10.0, 5.0, 7.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.31217575073242, -34.790931701660156, -33.26968765258789, -31.748445510864258, -30.227201461791992, -28.70595932006836, -27.184715270996094, -25.663471221923828, -24.142227172851562, -22.620983123779297, -21.099740982055664, -19.5784969329834, -18.057252883911133, -16.5360107421875, -15.014766693115234, -13.493522644042969, -11.972280502319336, -10.451037406921387, -8.929793357849121, -7.408550262451172, -5.8873066902160645, -4.366063117980957, -2.844820022583008, -1.3235759735107422, 0.19766712188720703, 1.718910574913025, 3.2401540279388428, 4.761397361755371, 6.2826409339904785, 7.803884506225586, 9.325127601623535, 10.8463716506958, 12.36761474609375, 13.8888578414917, 15.410101890563965, 16.931344985961914, 18.45258903503418, 19.973831176757812, 21.495075225830078, 23.016319274902344, 24.53756332397461, 26.058807373046875, 27.580049514770508, 29.101293563842773, 30.62253761291504, 32.14377975463867, 33.66502380371094, 35.1862678527832, 36.70751190185547, 38.228755950927734, 39.75, 41.271240234375, 42.792484283447266, 44.31372833251953, 45.8349723815918, 47.35621643066406, 48.87745666503906, 50.39870071411133, 51.919944763183594, 53.441184997558594, 54.96242904663086, 56.483673095703125, 58.00491714477539, 59.526161193847656, 61.04740524291992]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 3.0, 7.0, 4.0, 7.0, 9.0, 10.0, 6.0, 23.0, 19.0, 21.0, 21.0, 21.0, 26.0, 26.0, 32.0, 31.0, 34.0, 34.0, 53.0, 54.0, 71.0, 58.0, 68.0, 44.0, 36.0, 39.0, 31.0, 26.0, 32.0, 38.0, 17.0, 15.0, 21.0, 7.0, 13.0, 11.0, 3.0, 8.0, 6.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.101200103759766, -22.39780044555664, -21.694400787353516, -20.99100112915039, -20.287601470947266, -19.58420181274414, -18.880802154541016, -18.177404403686523, -17.4740047454834, -16.770605087280273, -16.06720542907715, -15.363805770874023, -14.660407066345215, -13.95700740814209, -13.253607749938965, -12.550209045410156, -11.846808433532715, -11.14340877532959, -10.440009117126465, -9.736610412597656, -9.033210754394531, -8.329811096191406, -7.626411437988281, -6.9230122566223145, -6.2196125984191895, -5.5162129402160645, -4.812813758850098, -4.109414100646973, -3.4060146808624268, -2.702615261077881, -1.9992156028747559, -1.295816421508789, -0.5924167633056641, 0.11098271608352661, 0.8143821954727173, 1.5177817344665527, 2.2211811542510986, 2.9245805740356445, 3.6279802322387695, 4.331379413604736, 5.034779071807861, 5.738178730010986, 6.441577911376953, 7.144977569580078, 7.848377227783203, 8.551776885986328, 9.255176544189453, 9.958575248718262, 10.661974906921387, 11.365374565124512, 12.068774223327637, 12.772172927856445, 13.47557258605957, 14.178972244262695, 14.88237190246582, 15.585771560668945, 16.28917121887207, 16.992570877075195, 17.69597053527832, 18.399370193481445, 19.10276985168457, 19.806167602539062, 20.509567260742188, 21.212966918945312, 21.916366577148438]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 9.0, 15.0, 34.0, 34.0, 56.0, 81.0, 172.0, 289.0, 514.0, 1009.0, 2116.0, 5218.0, 16991.0, 85412.0, 950994.0, 2752532.0, 320942.0, 41139.0, 10055.0, 3479.0, 1448.0, 721.0, 379.0, 240.0, 129.0, 83.0, 58.0, 33.0, 32.0, 15.0, 10.0, 6.0, 8.0, 9.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2578125, -2.187896728515625, -2.11798095703125, -2.048065185546875, -1.9781494140625, -1.908233642578125, -1.83831787109375, -1.768402099609375, -1.698486328125, -1.628570556640625, -1.55865478515625, -1.488739013671875, -1.4188232421875, -1.348907470703125, -1.27899169921875, -1.209075927734375, -1.13916015625, -1.069244384765625, -0.99932861328125, -0.929412841796875, -0.8594970703125, -0.789581298828125, -0.71966552734375, -0.649749755859375, -0.579833984375, -0.509918212890625, -0.44000244140625, -0.370086669921875, -0.3001708984375, -0.230255126953125, -0.16033935546875, -0.090423583984375, -0.0205078125, 0.049407958984375, 0.11932373046875, 0.189239501953125, 0.2591552734375, 0.329071044921875, 0.39898681640625, 0.468902587890625, 0.538818359375, 0.608734130859375, 0.67864990234375, 0.748565673828125, 0.8184814453125, 0.888397216796875, 0.95831298828125, 1.028228759765625, 1.09814453125, 1.168060302734375, 1.23797607421875, 1.307891845703125, 1.3778076171875, 1.447723388671875, 1.51763916015625, 1.587554931640625, 1.657470703125, 1.727386474609375, 1.79730224609375, 1.867218017578125, 1.9371337890625, 2.007049560546875, 2.07696533203125, 2.146881103515625, 2.216796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 10.0, 10.0, 13.0, 19.0, 31.0, 43.0, 27.0, 44.0, 59.0, 71.0, 69.0, 48.0, 76.0, 56.0, 70.0, 59.0, 54.0, 53.0, 43.0, 30.0, 31.0, 22.0, 13.0, 17.0, 11.0, 7.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6257476806640625, -1.570831298828125, -1.5159149169921875, -1.46099853515625, -1.4060821533203125, -1.351165771484375, -1.2962493896484375, -1.2413330078125, -1.1864166259765625, -1.131500244140625, -1.0765838623046875, -1.02166748046875, -0.9667510986328125, -0.911834716796875, -0.8569183349609375, -0.802001953125, -0.7470855712890625, -0.692169189453125, -0.6372528076171875, -0.58233642578125, -0.5274200439453125, -0.472503662109375, -0.4175872802734375, -0.3626708984375, -0.3077545166015625, -0.252838134765625, -0.1979217529296875, -0.14300537109375, -0.0880889892578125, -0.033172607421875, 0.0217437744140625, 0.07666015625, 0.1315765380859375, 0.186492919921875, 0.2414093017578125, 0.29632568359375, 0.3512420654296875, 0.406158447265625, 0.4610748291015625, 0.5159912109375, 0.5709075927734375, 0.625823974609375, 0.6807403564453125, 0.73565673828125, 0.7905731201171875, 0.845489501953125, 0.9004058837890625, 0.955322265625, 1.0102386474609375, 1.065155029296875, 1.1200714111328125, 1.17498779296875, 1.2299041748046875, 1.284820556640625, 1.3397369384765625, 1.3946533203125, 1.4495697021484375, 1.504486083984375, 1.5594024658203125, 1.61431884765625, 1.6692352294921875, 1.724151611328125, 1.7790679931640625, 1.833984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 6.0, 8.0, 18.0, 34.0, 61.0, 123.0, 213.0, 402.0, 841.0, 1700.0, 4370.0, 18748.0, 164416.0, 3301498.0, 647314.0, 41371.0, 8192.0, 2679.0, 1082.0, 515.0, 277.0, 156.0, 98.0, 52.0, 38.0, 23.0, 12.0, 12.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.896636962890625, -3.77374267578125, -3.650848388671875, -3.5279541015625, -3.405059814453125, -3.28216552734375, -3.159271240234375, -3.036376953125, -2.913482666015625, -2.79058837890625, -2.667694091796875, -2.5447998046875, -2.421905517578125, -2.29901123046875, -2.176116943359375, -2.05322265625, -1.930328369140625, -1.80743408203125, -1.684539794921875, -1.5616455078125, -1.438751220703125, -1.31585693359375, -1.192962646484375, -1.070068359375, -0.947174072265625, -0.82427978515625, -0.701385498046875, -0.5784912109375, -0.455596923828125, -0.33270263671875, -0.209808349609375, -0.0869140625, 0.035980224609375, 0.15887451171875, 0.281768798828125, 0.4046630859375, 0.527557373046875, 0.65045166015625, 0.773345947265625, 0.896240234375, 1.019134521484375, 1.14202880859375, 1.264923095703125, 1.3878173828125, 1.510711669921875, 1.63360595703125, 1.756500244140625, 1.87939453125, 2.002288818359375, 2.12518310546875, 2.248077392578125, 2.3709716796875, 2.493865966796875, 2.61676025390625, 2.739654541015625, 2.862548828125, 2.985443115234375, 3.10833740234375, 3.231231689453125, 3.3541259765625, 3.477020263671875, 3.59991455078125, 3.722808837890625, 3.845703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 5.0, 11.0, 10.0, 20.0, 34.0, 49.0, 95.0, 157.0, 212.0, 415.0, 686.0, 840.0, 612.0, 404.0, 179.0, 129.0, 62.0, 43.0, 26.0, 25.0, 16.0, 9.0, 4.0, 1.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.5128173828125, -3.388916015625, -3.2650146484375, -3.14111328125, -3.0172119140625, -2.893310546875, -2.7694091796875, -2.6455078125, -2.5216064453125, -2.397705078125, -2.2738037109375, -2.14990234375, -2.0260009765625, -1.902099609375, -1.7781982421875, -1.654296875, -1.5303955078125, -1.406494140625, -1.2825927734375, -1.15869140625, -1.0347900390625, -0.910888671875, -0.7869873046875, -0.6630859375, -0.5391845703125, -0.415283203125, -0.2913818359375, -0.16748046875, -0.0435791015625, 0.080322265625, 0.2042236328125, 0.328125, 0.4520263671875, 0.575927734375, 0.6998291015625, 0.82373046875, 0.9476318359375, 1.071533203125, 1.1954345703125, 1.3193359375, 1.4432373046875, 1.567138671875, 1.6910400390625, 1.81494140625, 1.9388427734375, 2.062744140625, 2.1866455078125, 2.310546875, 2.4344482421875, 2.558349609375, 2.6822509765625, 2.80615234375, 2.9300537109375, 3.053955078125, 3.1778564453125, 3.3017578125, 3.4256591796875, 3.549560546875, 3.6734619140625, 3.79736328125, 3.9212646484375, 4.045166015625, 4.1690673828125, 4.29296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 13.0, 20.0, 53.0, 135.0, 208.0, 265.0, 160.0, 77.0, 34.0, 14.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.488746643066406, -43.065185546875, -41.641624450683594, -40.21806335449219, -38.79450225830078, -37.370941162109375, -35.94738006591797, -34.52382278442383, -33.10026168823242, -31.676700592041016, -30.25313949584961, -28.829578399658203, -27.40601921081543, -25.982458114624023, -24.558897018432617, -23.135337829589844, -21.711774826049805, -20.2882137298584, -18.864652633666992, -17.44109344482422, -16.017532348632812, -14.593971252441406, -13.17041015625, -11.74685001373291, -10.323288917541504, -8.899727821350098, -7.476167678833008, -6.052606582641602, -4.6290459632873535, -3.2054853439331055, -1.7819242477416992, -0.3583641052246094, 1.0651969909667969, 2.488757610321045, 3.912318468093872, 5.335879325866699, 6.759439945220947, 8.183000564575195, 9.606561660766602, 11.030121803283691, 12.453682899475098, 13.877243995666504, 15.300804138183594, 16.724365234375, 18.147926330566406, 19.571487426757812, 20.99504852294922, 22.418607711791992, 23.8421688079834, 25.265729904174805, 26.68929100036621, 28.112850189208984, 29.53641128540039, 30.959972381591797, 32.3835334777832, 33.80709457397461, 35.230655670166016, 36.65421676635742, 38.07777786254883, 39.501338958740234, 40.92490005493164, 42.34845733642578, 43.77201843261719, 45.195579528808594, 46.619140625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 5.0, 11.0, 14.0, 22.0, 24.0, 24.0, 35.0, 47.0, 51.0, 66.0, 60.0, 74.0, 61.0, 81.0, 76.0, 56.0, 69.0, 34.0, 42.0, 35.0, 28.0, 21.0, 19.0, 13.0, 10.0, 5.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-30.841285705566406, -30.13622283935547, -29.4311580657959, -28.72609519958496, -28.021032333374023, -27.315967559814453, -26.610904693603516, -25.905841827392578, -25.20077896118164, -24.495716094970703, -23.790651321411133, -23.085588455200195, -22.380525588989258, -21.675460815429688, -20.97039794921875, -20.265335083007812, -19.560270309448242, -18.855207443237305, -18.150142669677734, -17.445079803466797, -16.74001693725586, -16.034954071044922, -15.329889297485352, -14.624826431274414, -13.91976261138916, -13.214698791503906, -12.509635925292969, -11.804572105407715, -11.099508285522461, -10.394445419311523, -9.68938159942627, -8.984317779541016, -8.279253005981445, -7.57418966293335, -6.869126319885254, -6.1640625, -5.458999156951904, -4.753935813903809, -4.048871994018555, -3.343808650970459, -2.6387453079223633, -1.933681845664978, -1.2286183834075928, -0.523554801940918, 0.18150854110717773, 0.8865718841552734, 1.5916357040405273, 2.296699047088623, 3.0017623901367188, 3.7068257331848145, 4.41188907623291, 5.116952896118164, 5.82201623916626, 6.5270795822143555, 7.232143402099609, 7.937206745147705, 8.6422700881958, 9.347333908081055, 10.052396774291992, 10.757460594177246, 11.4625244140625, 12.167587280273438, 12.872651100158691, 13.577714920043945, 14.282777786254883]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 11.0, 26.0, 20.0, 45.0, 59.0, 85.0, 178.0, 273.0, 500.0, 955.0, 1909.0, 4310.0, 10895.0, 31034.0, 107203.0, 414460.0, 348585.0, 85247.0, 25963.0, 9283.0, 3826.0, 1689.0, 830.0, 418.0, 292.0, 153.0, 125.0, 51.0, 38.0, 25.0, 15.0, 11.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.780792236328125, -2.68463134765625, -2.588470458984375, -2.4923095703125, -2.396148681640625, -2.29998779296875, -2.203826904296875, -2.107666015625, -2.011505126953125, -1.91534423828125, -1.819183349609375, -1.7230224609375, -1.626861572265625, -1.53070068359375, -1.434539794921875, -1.33837890625, -1.242218017578125, -1.14605712890625, -1.049896240234375, -0.9537353515625, -0.857574462890625, -0.76141357421875, -0.665252685546875, -0.569091796875, -0.472930908203125, -0.37677001953125, -0.280609130859375, -0.1844482421875, -0.088287353515625, 0.00787353515625, 0.104034423828125, 0.2001953125, 0.296356201171875, 0.39251708984375, 0.488677978515625, 0.5848388671875, 0.680999755859375, 0.77716064453125, 0.873321533203125, 0.969482421875, 1.065643310546875, 1.16180419921875, 1.257965087890625, 1.3541259765625, 1.450286865234375, 1.54644775390625, 1.642608642578125, 1.73876953125, 1.834930419921875, 1.93109130859375, 2.027252197265625, 2.1234130859375, 2.219573974609375, 2.31573486328125, 2.411895751953125, 2.508056640625, 2.604217529296875, 2.70037841796875, 2.796539306640625, 2.8927001953125, 2.988861083984375, 3.08502197265625, 3.181182861328125, 3.27734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 7.0, 14.0, 11.0, 19.0, 19.0, 30.0, 37.0, 34.0, 36.0, 47.0, 39.0, 43.0, 45.0, 53.0, 48.0, 42.0, 46.0, 53.0, 52.0, 39.0, 35.0, 37.0, 28.0, 43.0, 34.0, 20.0, 14.0, 11.0, 7.0, 10.0, 7.0, 6.0, 4.0, 1.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4599609375, -1.4166259765625, -1.373291015625, -1.3299560546875, -1.28662109375, -1.2432861328125, -1.199951171875, -1.1566162109375, -1.11328125, -1.0699462890625, -1.026611328125, -0.9832763671875, -0.93994140625, -0.8966064453125, -0.853271484375, -0.8099365234375, -0.7666015625, -0.7232666015625, -0.679931640625, -0.6365966796875, -0.59326171875, -0.5499267578125, -0.506591796875, -0.4632568359375, -0.419921875, -0.3765869140625, -0.333251953125, -0.2899169921875, -0.24658203125, -0.2032470703125, -0.159912109375, -0.1165771484375, -0.0732421875, -0.0299072265625, 0.013427734375, 0.0567626953125, 0.10009765625, 0.1434326171875, 0.186767578125, 0.2301025390625, 0.2734375, 0.3167724609375, 0.360107421875, 0.4034423828125, 0.44677734375, 0.4901123046875, 0.533447265625, 0.5767822265625, 0.6201171875, 0.6634521484375, 0.706787109375, 0.7501220703125, 0.79345703125, 0.8367919921875, 0.880126953125, 0.9234619140625, 0.966796875, 1.0101318359375, 1.053466796875, 1.0968017578125, 1.14013671875, 1.1834716796875, 1.226806640625, 1.2701416015625, 1.3134765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 7.0, 13.0, 22.0, 15.0, 41.0, 43.0, 56.0, 80.0, 147.0, 172.0, 300.0, 489.0, 827.0, 1718.0, 4675.0, 15993.0, 94671.0, 784312.0, 117640.0, 18260.0, 4894.0, 1772.0, 893.0, 483.0, 316.0, 194.0, 141.0, 86.0, 68.0, 53.0, 45.0, 27.0, 16.0, 17.0, 13.0, 15.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.23046875, -5.0472412109375, -4.864013671875, -4.6807861328125, -4.49755859375, -4.3143310546875, -4.131103515625, -3.9478759765625, -3.7646484375, -3.5814208984375, -3.398193359375, -3.2149658203125, -3.03173828125, -2.8485107421875, -2.665283203125, -2.4820556640625, -2.298828125, -2.1156005859375, -1.932373046875, -1.7491455078125, -1.56591796875, -1.3826904296875, -1.199462890625, -1.0162353515625, -0.8330078125, -0.6497802734375, -0.466552734375, -0.2833251953125, -0.10009765625, 0.0831298828125, 0.266357421875, 0.4495849609375, 0.6328125, 0.8160400390625, 0.999267578125, 1.1824951171875, 1.36572265625, 1.5489501953125, 1.732177734375, 1.9154052734375, 2.0986328125, 2.2818603515625, 2.465087890625, 2.6483154296875, 2.83154296875, 3.0147705078125, 3.197998046875, 3.3812255859375, 3.564453125, 3.7476806640625, 3.930908203125, 4.1141357421875, 4.29736328125, 4.4805908203125, 4.663818359375, 4.8470458984375, 5.0302734375, 5.2135009765625, 5.396728515625, 5.5799560546875, 5.76318359375, 5.9464111328125, 6.129638671875, 6.3128662109375, 6.49609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 4.0, 11.0, 2.0, 7.0, 11.0, 8.0, 9.0, 12.0, 17.0, 16.0, 27.0, 14.0, 37.0, 31.0, 37.0, 45.0, 39.0, 44.0, 49.0, 59.0, 44.0, 48.0, 47.0, 48.0, 47.0, 41.0, 40.0, 28.0, 29.0, 19.0, 27.0, 20.0, 14.0, 17.0, 10.0, 12.0, 7.0, 9.0, 7.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.10546875, -4.9326171875, -4.759765625, -4.5869140625, -4.4140625, -4.2412109375, -4.068359375, -3.8955078125, -3.72265625, -3.5498046875, -3.376953125, -3.2041015625, -3.03125, -2.8583984375, -2.685546875, -2.5126953125, -2.33984375, -2.1669921875, -1.994140625, -1.8212890625, -1.6484375, -1.4755859375, -1.302734375, -1.1298828125, -0.95703125, -0.7841796875, -0.611328125, -0.4384765625, -0.265625, -0.0927734375, 0.080078125, 0.2529296875, 0.42578125, 0.5986328125, 0.771484375, 0.9443359375, 1.1171875, 1.2900390625, 1.462890625, 1.6357421875, 1.80859375, 1.9814453125, 2.154296875, 2.3271484375, 2.5, 2.6728515625, 2.845703125, 3.0185546875, 3.19140625, 3.3642578125, 3.537109375, 3.7099609375, 3.8828125, 4.0556640625, 4.228515625, 4.4013671875, 4.57421875, 4.7470703125, 4.919921875, 5.0927734375, 5.265625, 5.4384765625, 5.611328125, 5.7841796875, 5.95703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 7.0, 5.0, 13.0, 10.0, 23.0, 24.0, 33.0, 43.0, 56.0, 62.0, 117.0, 169.0, 255.0, 470.0, 784.0, 1647.0, 3776.0, 9856.0, 32572.0, 143470.0, 697763.0, 114409.0, 27358.0, 8825.0, 3397.0, 1467.0, 717.0, 435.0, 220.0, 168.0, 110.0, 68.0, 46.0, 34.0, 34.0, 22.0, 13.0, 20.0, 8.0, 10.0, 6.0, 4.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.27734375, -2.211212158203125, -2.14508056640625, -2.078948974609375, -2.0128173828125, -1.946685791015625, -1.88055419921875, -1.814422607421875, -1.748291015625, -1.682159423828125, -1.61602783203125, -1.549896240234375, -1.4837646484375, -1.417633056640625, -1.35150146484375, -1.285369873046875, -1.21923828125, -1.153106689453125, -1.08697509765625, -1.020843505859375, -0.9547119140625, -0.888580322265625, -0.82244873046875, -0.756317138671875, -0.690185546875, -0.624053955078125, -0.55792236328125, -0.491790771484375, -0.4256591796875, -0.359527587890625, -0.29339599609375, -0.227264404296875, -0.1611328125, -0.095001220703125, -0.02886962890625, 0.037261962890625, 0.1033935546875, 0.169525146484375, 0.23565673828125, 0.301788330078125, 0.367919921875, 0.434051513671875, 0.50018310546875, 0.566314697265625, 0.6324462890625, 0.698577880859375, 0.76470947265625, 0.830841064453125, 0.89697265625, 0.963104248046875, 1.02923583984375, 1.095367431640625, 1.1614990234375, 1.227630615234375, 1.29376220703125, 1.359893798828125, 1.426025390625, 1.492156982421875, 1.55828857421875, 1.624420166015625, 1.6905517578125, 1.756683349609375, 1.82281494140625, 1.888946533203125, 1.955078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 6.0, 9.0, 4.0, 7.0, 9.0, 16.0, 13.0, 23.0, 34.0, 40.0, 62.0, 101.0, 165.0, 190.0, 112.0, 57.0, 36.0, 29.0, 16.0, 19.0, 10.0, 7.0, 11.0, 3.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006399154663085938, -0.0006179586052894592, -0.0005960017442703247, -0.0005740448832511902, -0.0005520880222320557, -0.0005301311612129211, -0.0005081743001937866, -0.0004862174391746521, -0.0004642605781555176, -0.00044230371713638306, -0.00042034685611724854, -0.000398389995098114, -0.0003764331340789795, -0.00035447627305984497, -0.00033251941204071045, -0.00031056255102157593, -0.0002886056900024414, -0.0002666488289833069, -0.00024469196796417236, -0.00022273510694503784, -0.00020077824592590332, -0.0001788213849067688, -0.00015686452388763428, -0.00013490766286849976, -0.00011295080184936523, -9.099394083023071e-05, -6.903707981109619e-05, -4.708021879196167e-05, -2.512335777282715e-05, -3.166496753692627e-06, 1.8790364265441895e-05, 4.0747225284576416e-05, 6.270408630371094e-05, 8.466094732284546e-05, 0.00010661780834197998, 0.0001285746693611145, 0.00015053153038024902, 0.00017248839139938354, 0.00019444525241851807, 0.0002164021134376526, 0.0002383589744567871, 0.00026031583547592163, 0.00028227269649505615, 0.0003042295575141907, 0.0003261864185333252, 0.0003481432795524597, 0.00037010014057159424, 0.00039205700159072876, 0.0004140138626098633, 0.0004359707236289978, 0.0004579275846481323, 0.00047988444566726685, 0.0005018413066864014, 0.0005237981677055359, 0.0005457550287246704, 0.0005677118897438049, 0.0005896687507629395, 0.000611625611782074, 0.0006335824728012085, 0.000655539333820343, 0.0006774961948394775, 0.0006994530558586121, 0.0007214099168777466, 0.0007433667778968811, 0.0007653236389160156]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 5.0, 7.0, 11.0, 13.0, 17.0, 28.0, 40.0, 59.0, 99.0, 150.0, 264.0, 421.0, 760.0, 1688.0, 4542.0, 16091.0, 87507.0, 758037.0, 145112.0, 23458.0, 5786.0, 2154.0, 970.0, 514.0, 293.0, 184.0, 108.0, 83.0, 45.0, 35.0, 27.0, 12.0, 15.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.717987060546875, -2.63714599609375, -2.556304931640625, -2.4754638671875, -2.394622802734375, -2.31378173828125, -2.232940673828125, -2.152099609375, -2.071258544921875, -1.99041748046875, -1.909576416015625, -1.8287353515625, -1.747894287109375, -1.66705322265625, -1.586212158203125, -1.50537109375, -1.424530029296875, -1.34368896484375, -1.262847900390625, -1.1820068359375, -1.101165771484375, -1.02032470703125, -0.939483642578125, -0.858642578125, -0.777801513671875, -0.69696044921875, -0.616119384765625, -0.5352783203125, -0.454437255859375, -0.37359619140625, -0.292755126953125, -0.2119140625, -0.131072998046875, -0.05023193359375, 0.030609130859375, 0.1114501953125, 0.192291259765625, 0.27313232421875, 0.353973388671875, 0.434814453125, 0.515655517578125, 0.59649658203125, 0.677337646484375, 0.7581787109375, 0.839019775390625, 0.91986083984375, 1.000701904296875, 1.08154296875, 1.162384033203125, 1.24322509765625, 1.324066162109375, 1.4049072265625, 1.485748291015625, 1.56658935546875, 1.647430419921875, 1.728271484375, 1.809112548828125, 1.88995361328125, 1.970794677734375, 2.0516357421875, 2.132476806640625, 2.21331787109375, 2.294158935546875, 2.375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 7.0, 7.0, 13.0, 9.0, 14.0, 17.0, 22.0, 32.0, 34.0, 57.0, 65.0, 81.0, 105.0, 95.0, 99.0, 88.0, 43.0, 32.0, 38.0, 30.0, 12.0, 18.0, 16.0, 6.0, 15.0, 5.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.328125, -2.257843017578125, -2.18756103515625, -2.117279052734375, -2.0469970703125, -1.976715087890625, -1.90643310546875, -1.836151123046875, -1.765869140625, -1.695587158203125, -1.62530517578125, -1.555023193359375, -1.4847412109375, -1.414459228515625, -1.34417724609375, -1.273895263671875, -1.20361328125, -1.133331298828125, -1.06304931640625, -0.992767333984375, -0.9224853515625, -0.852203369140625, -0.78192138671875, -0.711639404296875, -0.641357421875, -0.571075439453125, -0.50079345703125, -0.430511474609375, -0.3602294921875, -0.289947509765625, -0.21966552734375, -0.149383544921875, -0.0791015625, -0.008819580078125, 0.06146240234375, 0.131744384765625, 0.2020263671875, 0.272308349609375, 0.34259033203125, 0.412872314453125, 0.483154296875, 0.553436279296875, 0.62371826171875, 0.694000244140625, 0.7642822265625, 0.834564208984375, 0.90484619140625, 0.975128173828125, 1.04541015625, 1.115692138671875, 1.18597412109375, 1.256256103515625, 1.3265380859375, 1.396820068359375, 1.46710205078125, 1.537384033203125, 1.607666015625, 1.677947998046875, 1.74822998046875, 1.818511962890625, 1.8887939453125, 1.959075927734375, 2.02935791015625, 2.099639892578125, 2.169921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 1.0, 2.0, 3.0, 9.0, 26.0, 44.0, 123.0, 314.0, 279.0, 126.0, 41.0, 11.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.91436004638672, -67.9073486328125, -65.90034484863281, -63.893333435058594, -61.886322021484375, -59.879310607910156, -57.8723030090332, -55.86529541015625, -53.85828399658203, -51.85127258300781, -49.84426498413086, -47.837257385253906, -45.83024597167969, -43.82323455810547, -41.816226959228516, -39.80921936035156, -37.802207946777344, -35.795196533203125, -33.78818893432617, -31.781179428100586, -29.774169921875, -27.767160415649414, -25.760150909423828, -23.753141403198242, -21.746131896972656, -19.73912239074707, -17.732112884521484, -15.725103378295898, -13.718093872070312, -11.711084365844727, -9.70407485961914, -7.697065353393555, -5.6900482177734375, -3.6830387115478516, -1.6760292053222656, 0.3309803009033203, 2.3379898071289062, 4.344999313354492, 6.352008819580078, 8.359018325805664, 10.36602783203125, 12.373037338256836, 14.380046844482422, 16.387056350708008, 18.394065856933594, 20.40107536315918, 22.408084869384766, 24.41509437561035, 26.422103881835938, 28.429113388061523, 30.43612289428711, 32.44313049316406, 34.45014190673828, 36.4571533203125, 38.46416091918945, 40.471168518066406, 42.478179931640625, 44.485191345214844, 46.4921989440918, 48.49920654296875, 50.50621795654297, 52.51322937011719, 54.52023696899414, 56.527244567871094, 58.53425598144531]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 3.0, 6.0, 9.0, 12.0, 8.0, 12.0, 13.0, 18.0, 19.0, 26.0, 15.0, 19.0, 28.0, 25.0, 39.0, 37.0, 47.0, 61.0, 61.0, 70.0, 59.0, 32.0, 30.0, 37.0, 22.0, 25.0, 30.0, 29.0, 22.0, 22.0, 16.0, 17.0, 20.0, 11.0, 14.0, 13.0, 14.0, 11.0, 5.0, 3.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.839733123779297, -19.225675582885742, -18.611618041992188, -17.997560501098633, -17.383502960205078, -16.769447326660156, -16.1553897857666, -15.541332244873047, -14.927274703979492, -14.313217163085938, -13.699159622192383, -13.085103034973145, -12.47104549407959, -11.856987953186035, -11.242931365966797, -10.628873825073242, -10.014816284179688, -9.400758743286133, -8.786701202392578, -8.17264461517334, -7.558587074279785, -6.9445295333862305, -6.330472469329834, -5.7164154052734375, -5.102357864379883, -4.488300323486328, -3.8742432594299316, -3.260185956954956, -2.6461286544799805, -2.032071352005005, -1.4180140495300293, -0.8039569854736328, -0.1898975372314453, 0.4241597652435303, 1.0382170677185059, 1.6522743701934814, 2.266331672668457, 2.8803889751434326, 3.494446277618408, 4.108503341674805, 4.722560882568359, 5.336618423461914, 5.9506754875183105, 6.564732551574707, 7.178790092468262, 7.792847633361816, 8.406904220581055, 9.02096176147461, 9.635019302368164, 10.249076843261719, 10.863134384155273, 11.477190971374512, 12.091248512268066, 12.705306053161621, 13.31936264038086, 13.933420181274414, 14.547477722167969, 15.161535263061523, 15.775592803955078, 16.389650344848633, 17.003707885742188, 17.61776351928711, 18.231821060180664, 18.84587860107422, 19.459936141967773]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 13.0, 9.0, 24.0, 22.0, 42.0, 58.0, 92.0, 154.0, 260.0, 487.0, 996.0, 2055.0, 5309.0, 16973.0, 93386.0, 1591107.0, 2317402.0, 133319.0, 21113.0, 6410.0, 2525.0, 1136.0, 576.0, 318.0, 178.0, 104.0, 73.0, 30.0, 33.0, 13.0, 13.0, 11.0, 9.0, 4.0, 3.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.607421875, -2.528594970703125, -2.44976806640625, -2.370941162109375, -2.2921142578125, -2.213287353515625, -2.13446044921875, -2.055633544921875, -1.976806640625, -1.897979736328125, -1.81915283203125, -1.740325927734375, -1.6614990234375, -1.582672119140625, -1.50384521484375, -1.425018310546875, -1.34619140625, -1.267364501953125, -1.18853759765625, -1.109710693359375, -1.0308837890625, -0.952056884765625, -0.87322998046875, -0.794403076171875, -0.715576171875, -0.636749267578125, -0.55792236328125, -0.479095458984375, -0.4002685546875, -0.321441650390625, -0.24261474609375, -0.163787841796875, -0.0849609375, -0.006134033203125, 0.07269287109375, 0.151519775390625, 0.2303466796875, 0.309173583984375, 0.38800048828125, 0.466827392578125, 0.545654296875, 0.624481201171875, 0.70330810546875, 0.782135009765625, 0.8609619140625, 0.939788818359375, 1.01861572265625, 1.097442626953125, 1.17626953125, 1.255096435546875, 1.33392333984375, 1.412750244140625, 1.4915771484375, 1.570404052734375, 1.64923095703125, 1.728057861328125, 1.806884765625, 1.885711669921875, 1.96453857421875, 2.043365478515625, 2.1221923828125, 2.201019287109375, 2.27984619140625, 2.358673095703125, 2.4375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 13.0, 14.0, 22.0, 25.0, 39.0, 44.0, 64.0, 82.0, 89.0, 110.0, 74.0, 76.0, 68.0, 63.0, 51.0, 42.0, 39.0, 28.0, 14.0, 15.0, 9.0, 5.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.529754638671875, -2.45989990234375, -2.390045166015625, -2.3201904296875, -2.250335693359375, -2.18048095703125, -2.110626220703125, -2.040771484375, -1.970916748046875, -1.90106201171875, -1.831207275390625, -1.7613525390625, -1.691497802734375, -1.62164306640625, -1.551788330078125, -1.48193359375, -1.412078857421875, -1.34222412109375, -1.272369384765625, -1.2025146484375, -1.132659912109375, -1.06280517578125, -0.992950439453125, -0.923095703125, -0.853240966796875, -0.78338623046875, -0.713531494140625, -0.6436767578125, -0.573822021484375, -0.50396728515625, -0.434112548828125, -0.3642578125, -0.294403076171875, -0.22454833984375, -0.154693603515625, -0.0848388671875, -0.014984130859375, 0.05487060546875, 0.124725341796875, 0.194580078125, 0.264434814453125, 0.33428955078125, 0.404144287109375, 0.4739990234375, 0.543853759765625, 0.61370849609375, 0.683563232421875, 0.75341796875, 0.823272705078125, 0.89312744140625, 0.962982177734375, 1.0328369140625, 1.102691650390625, 1.17254638671875, 1.242401123046875, 1.312255859375, 1.382110595703125, 1.45196533203125, 1.521820068359375, 1.5916748046875, 1.661529541015625, 1.73138427734375, 1.801239013671875, 1.87109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 20.0, 32.0, 40.0, 71.0, 139.0, 296.0, 623.0, 1436.0, 4066.0, 15652.0, 174437.0, 3780675.0, 190910.0, 17977.0, 4691.0, 1714.0, 710.0, 335.0, 182.0, 102.0, 67.0, 35.0, 13.0, 16.0, 9.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.1519775390625, -3.995361328125, -3.8387451171875, -3.68212890625, -3.5255126953125, -3.368896484375, -3.2122802734375, -3.0556640625, -2.8990478515625, -2.742431640625, -2.5858154296875, -2.42919921875, -2.2725830078125, -2.115966796875, -1.9593505859375, -1.802734375, -1.6461181640625, -1.489501953125, -1.3328857421875, -1.17626953125, -1.0196533203125, -0.863037109375, -0.7064208984375, -0.5498046875, -0.3931884765625, -0.236572265625, -0.0799560546875, 0.07666015625, 0.2332763671875, 0.389892578125, 0.5465087890625, 0.703125, 0.8597412109375, 1.016357421875, 1.1729736328125, 1.32958984375, 1.4862060546875, 1.642822265625, 1.7994384765625, 1.9560546875, 2.1126708984375, 2.269287109375, 2.4259033203125, 2.58251953125, 2.7391357421875, 2.895751953125, 3.0523681640625, 3.208984375, 3.3656005859375, 3.522216796875, 3.6788330078125, 3.83544921875, 3.9920654296875, 4.148681640625, 4.3052978515625, 4.4619140625, 4.6185302734375, 4.775146484375, 4.9317626953125, 5.08837890625, 5.2449951171875, 5.401611328125, 5.5582275390625, 5.71484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 12.0, 20.0, 16.0, 35.0, 36.0, 90.0, 128.0, 263.0, 428.0, 721.0, 838.0, 608.0, 329.0, 180.0, 120.0, 62.0, 39.0, 27.0, 32.0, 11.0, 12.0, 9.0, 8.0, 4.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.96002197265625, -2.8516845703125, -2.74334716796875, -2.635009765625, -2.52667236328125, -2.4183349609375, -2.30999755859375, -2.20166015625, -2.09332275390625, -1.9849853515625, -1.87664794921875, -1.768310546875, -1.65997314453125, -1.5516357421875, -1.44329833984375, -1.3349609375, -1.22662353515625, -1.1182861328125, -1.00994873046875, -0.901611328125, -0.79327392578125, -0.6849365234375, -0.57659912109375, -0.46826171875, -0.35992431640625, -0.2515869140625, -0.14324951171875, -0.034912109375, 0.07342529296875, 0.1817626953125, 0.29010009765625, 0.3984375, 0.50677490234375, 0.6151123046875, 0.72344970703125, 0.831787109375, 0.94012451171875, 1.0484619140625, 1.15679931640625, 1.26513671875, 1.37347412109375, 1.4818115234375, 1.59014892578125, 1.698486328125, 1.80682373046875, 1.9151611328125, 2.02349853515625, 2.1318359375, 2.24017333984375, 2.3485107421875, 2.45684814453125, 2.565185546875, 2.67352294921875, 2.7818603515625, 2.89019775390625, 2.99853515625, 3.10687255859375, 3.2152099609375, 3.32354736328125, 3.431884765625, 3.54022216796875, 3.6485595703125, 3.75689697265625, 3.865234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 7.0, 5.0, 1.0, 23.0, 43.0, 74.0, 170.0, 207.0, 192.0, 137.0, 64.0, 35.0, 16.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.580963134765625, -31.366004943847656, -30.151046752929688, -28.936086654663086, -27.721128463745117, -26.50617027282715, -25.291210174560547, -24.076251983642578, -22.86129379272461, -21.64633560180664, -20.431377410888672, -19.21641731262207, -18.0014591217041, -16.786500930786133, -15.571541786193848, -14.356582641601562, -13.141624450683594, -11.926666259765625, -10.71170711517334, -9.496747970581055, -8.281789779663086, -7.066831111907959, -5.851872444152832, -4.636913299560547, -3.421955108642578, -2.206996440887451, -0.9920377731323242, 0.22292089462280273, 1.4378795623779297, 2.6528382301330566, 3.8677968978881836, 5.082756042480469, 6.297718048095703, 7.51267671585083, 8.727635383605957, 9.942594528198242, 11.157552719116211, 12.37251091003418, 13.587470054626465, 14.80242919921875, 16.01738739013672, 17.232345581054688, 18.447303771972656, 19.662263870239258, 20.877222061157227, 22.092180252075195, 23.307140350341797, 24.522098541259766, 25.737056732177734, 26.952014923095703, 28.166973114013672, 29.381933212280273, 30.596891403198242, 31.81184959411621, 33.02680969238281, 34.24176788330078, 35.45672607421875, 36.67168426513672, 37.88664245605469, 39.101600646972656, 40.316558837890625, 41.53152084350586, 42.74647903442383, 43.9614372253418, 45.176395416259766]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 15.0, 27.0, 20.0, 42.0, 39.0, 51.0, 53.0, 60.0, 52.0, 55.0, 53.0, 59.0, 52.0, 49.0, 57.0, 60.0, 45.0, 35.0, 35.0, 29.0, 24.0, 23.0, 13.0, 12.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.701509475708008, -18.143112182617188, -17.584716796875, -17.02631950378418, -16.46792221069336, -15.909525871276855, -15.351129531860352, -14.792732238769531, -14.234335899353027, -13.675939559936523, -13.117542266845703, -12.5591459274292, -12.000749588012695, -11.442352294921875, -10.883955955505371, -10.325559616088867, -9.767162322998047, -9.208765983581543, -8.650368690490723, -8.091972351074219, -7.533575534820557, -6.9751787185668945, -6.416782379150391, -5.8583855628967285, -5.299988746643066, -4.741591930389404, -4.183195114135742, -3.6247987747192383, -3.066401958465576, -2.508005142211914, -1.949608564376831, -1.391211986541748, -0.8328151702880859, -0.2744184732437134, 0.2839782238006592, 0.8423749208450317, 1.4007716178894043, 1.9591684341430664, 2.5175650119781494, 3.0759615898132324, 3.6343584060668945, 4.192755222320557, 4.751152038574219, 5.309548377990723, 5.867945194244385, 6.426342010498047, 6.984738349914551, 7.543135166168213, 8.101531982421875, 8.659928321838379, 9.2183256149292, 9.776721954345703, 10.335119247436523, 10.893515586853027, 11.451911926269531, 12.010309219360352, 12.568705558776855, 13.12710189819336, 13.68549919128418, 14.243895530700684, 14.802291870117188, 15.360689163208008, 15.919085502624512, 16.477481842041016, 17.035879135131836]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 10.0, 7.0, 17.0, 27.0, 47.0, 67.0, 133.0, 191.0, 402.0, 757.0, 1798.0, 4882.0, 17536.0, 86356.0, 447766.0, 394139.0, 71694.0, 15149.0, 4446.0, 1574.0, 707.0, 360.0, 194.0, 101.0, 58.0, 47.0, 28.0, 13.0, 16.0, 9.0, 5.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.37109375, -3.27178955078125, -3.1724853515625, -3.07318115234375, -2.973876953125, -2.87457275390625, -2.7752685546875, -2.67596435546875, -2.57666015625, -2.47735595703125, -2.3780517578125, -2.27874755859375, -2.179443359375, -2.08013916015625, -1.9808349609375, -1.88153076171875, -1.7822265625, -1.68292236328125, -1.5836181640625, -1.48431396484375, -1.385009765625, -1.28570556640625, -1.1864013671875, -1.08709716796875, -0.98779296875, -0.88848876953125, -0.7891845703125, -0.68988037109375, -0.590576171875, -0.49127197265625, -0.3919677734375, -0.29266357421875, -0.193359375, -0.09405517578125, 0.0052490234375, 0.10455322265625, 0.203857421875, 0.30316162109375, 0.4024658203125, 0.50177001953125, 0.60107421875, 0.70037841796875, 0.7996826171875, 0.89898681640625, 0.998291015625, 1.09759521484375, 1.1968994140625, 1.29620361328125, 1.3955078125, 1.49481201171875, 1.5941162109375, 1.69342041015625, 1.792724609375, 1.89202880859375, 1.9913330078125, 2.09063720703125, 2.18994140625, 2.28924560546875, 2.3885498046875, 2.48785400390625, 2.587158203125, 2.68646240234375, 2.7857666015625, 2.88507080078125, 2.984375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 8.0, 13.0, 14.0, 11.0, 15.0, 16.0, 18.0, 34.0, 31.0, 29.0, 40.0, 61.0, 45.0, 54.0, 39.0, 47.0, 45.0, 56.0, 43.0, 40.0, 43.0, 44.0, 25.0, 35.0, 31.0, 29.0, 19.0, 19.0, 20.0, 15.0, 11.0, 7.0, 12.0, 8.0, 1.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3994140625, -1.3551788330078125, -1.310943603515625, -1.2667083740234375, -1.22247314453125, -1.1782379150390625, -1.134002685546875, -1.0897674560546875, -1.0455322265625, -1.0012969970703125, -0.957061767578125, -0.9128265380859375, -0.86859130859375, -0.8243560791015625, -0.780120849609375, -0.7358856201171875, -0.691650390625, -0.6474151611328125, -0.603179931640625, -0.5589447021484375, -0.51470947265625, -0.4704742431640625, -0.426239013671875, -0.3820037841796875, -0.3377685546875, -0.2935333251953125, -0.249298095703125, -0.2050628662109375, -0.16082763671875, -0.1165924072265625, -0.072357177734375, -0.0281219482421875, 0.01611328125, 0.0603485107421875, 0.104583740234375, 0.1488189697265625, 0.19305419921875, 0.2372894287109375, 0.281524658203125, 0.3257598876953125, 0.3699951171875, 0.4142303466796875, 0.458465576171875, 0.5027008056640625, 0.54693603515625, 0.5911712646484375, 0.635406494140625, 0.6796417236328125, 0.723876953125, 0.7681121826171875, 0.812347412109375, 0.8565826416015625, 0.90081787109375, 0.9450531005859375, 0.989288330078125, 1.0335235595703125, 1.0777587890625, 1.1219940185546875, 1.166229248046875, 1.2104644775390625, 1.25469970703125, 1.2989349365234375, 1.343170166015625, 1.3874053955078125, 1.431640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 15.0, 12.0, 8.0, 24.0, 25.0, 40.0, 43.0, 89.0, 135.0, 196.0, 351.0, 694.0, 1502.0, 4229.0, 15038.0, 87913.0, 673522.0, 222255.0, 31007.0, 6965.0, 2360.0, 964.0, 459.0, 239.0, 147.0, 77.0, 59.0, 54.0, 28.0, 27.0, 15.0, 18.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.626953125, -3.51611328125, -3.4052734375, -3.29443359375, -3.18359375, -3.07275390625, -2.9619140625, -2.85107421875, -2.740234375, -2.62939453125, -2.5185546875, -2.40771484375, -2.296875, -2.18603515625, -2.0751953125, -1.96435546875, -1.853515625, -1.74267578125, -1.6318359375, -1.52099609375, -1.41015625, -1.29931640625, -1.1884765625, -1.07763671875, -0.966796875, -0.85595703125, -0.7451171875, -0.63427734375, -0.5234375, -0.41259765625, -0.3017578125, -0.19091796875, -0.080078125, 0.03076171875, 0.1416015625, 0.25244140625, 0.36328125, 0.47412109375, 0.5849609375, 0.69580078125, 0.806640625, 0.91748046875, 1.0283203125, 1.13916015625, 1.25, 1.36083984375, 1.4716796875, 1.58251953125, 1.693359375, 1.80419921875, 1.9150390625, 2.02587890625, 2.13671875, 2.24755859375, 2.3583984375, 2.46923828125, 2.580078125, 2.69091796875, 2.8017578125, 2.91259765625, 3.0234375, 3.13427734375, 3.2451171875, 3.35595703125, 3.466796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 7.0, 7.0, 14.0, 9.0, 10.0, 19.0, 15.0, 19.0, 20.0, 17.0, 32.0, 30.0, 37.0, 48.0, 49.0, 43.0, 54.0, 32.0, 58.0, 47.0, 43.0, 56.0, 44.0, 38.0, 34.0, 32.0, 26.0, 21.0, 26.0, 27.0, 15.0, 15.0, 10.0, 10.0, 8.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.99609375, -4.84039306640625, -4.6846923828125, -4.52899169921875, -4.373291015625, -4.21759033203125, -4.0618896484375, -3.90618896484375, -3.75048828125, -3.59478759765625, -3.4390869140625, -3.28338623046875, -3.127685546875, -2.97198486328125, -2.8162841796875, -2.66058349609375, -2.5048828125, -2.34918212890625, -2.1934814453125, -2.03778076171875, -1.882080078125, -1.72637939453125, -1.5706787109375, -1.41497802734375, -1.25927734375, -1.10357666015625, -0.9478759765625, -0.79217529296875, -0.636474609375, -0.48077392578125, -0.3250732421875, -0.16937255859375, -0.013671875, 0.14202880859375, 0.2977294921875, 0.45343017578125, 0.609130859375, 0.76483154296875, 0.9205322265625, 1.07623291015625, 1.23193359375, 1.38763427734375, 1.5433349609375, 1.69903564453125, 1.854736328125, 2.01043701171875, 2.1661376953125, 2.32183837890625, 2.4775390625, 2.63323974609375, 2.7889404296875, 2.94464111328125, 3.100341796875, 3.25604248046875, 3.4117431640625, 3.56744384765625, 3.72314453125, 3.87884521484375, 4.0345458984375, 4.19024658203125, 4.345947265625, 4.50164794921875, 4.6573486328125, 4.81304931640625, 4.96875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 8.0, 8.0, 14.0, 21.0, 36.0, 62.0, 112.0, 209.0, 457.0, 894.0, 2406.0, 7505.0, 29194.0, 178661.0, 698872.0, 102259.0, 19195.0, 5287.0, 1851.0, 739.0, 337.0, 184.0, 93.0, 51.0, 36.0, 23.0, 12.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.44891357421875, -1.4027099609375, -1.35650634765625, -1.310302734375, -1.26409912109375, -1.2178955078125, -1.17169189453125, -1.12548828125, -1.07928466796875, -1.0330810546875, -0.98687744140625, -0.940673828125, -0.89447021484375, -0.8482666015625, -0.80206298828125, -0.755859375, -0.70965576171875, -0.6634521484375, -0.61724853515625, -0.571044921875, -0.52484130859375, -0.4786376953125, -0.43243408203125, -0.38623046875, -0.34002685546875, -0.2938232421875, -0.24761962890625, -0.201416015625, -0.15521240234375, -0.1090087890625, -0.06280517578125, -0.0166015625, 0.02960205078125, 0.0758056640625, 0.12200927734375, 0.168212890625, 0.21441650390625, 0.2606201171875, 0.30682373046875, 0.35302734375, 0.39923095703125, 0.4454345703125, 0.49163818359375, 0.537841796875, 0.58404541015625, 0.6302490234375, 0.67645263671875, 0.72265625, 0.76885986328125, 0.8150634765625, 0.86126708984375, 0.907470703125, 0.95367431640625, 0.9998779296875, 1.04608154296875, 1.09228515625, 1.13848876953125, 1.1846923828125, 1.23089599609375, 1.277099609375, 1.32330322265625, 1.3695068359375, 1.41571044921875, 1.4619140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 9.0, 17.0, 33.0, 48.0, 55.0, 79.0, 101.0, 151.0, 125.0, 102.0, 83.0, 47.0, 28.0, 24.0, 12.0, 11.0, 9.0, 10.0, 11.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034618377685546875, -0.00033419206738471985, -0.00032220035791397095, -0.00031020864844322205, -0.00029821693897247314, -0.00028622522950172424, -0.00027423352003097534, -0.00026224181056022644, -0.00025025010108947754, -0.00023825839161872864, -0.00022626668214797974, -0.00021427497267723083, -0.00020228326320648193, -0.00019029155373573303, -0.00017829984426498413, -0.00016630813479423523, -0.00015431642532348633, -0.00014232471585273743, -0.00013033300638198853, -0.00011834129691123962, -0.00010634958744049072, -9.435787796974182e-05, -8.236616849899292e-05, -7.037445902824402e-05, -5.838274955749512e-05, -4.6391040086746216e-05, -3.4399330615997314e-05, -2.2407621145248413e-05, -1.0415911674499512e-05, 1.5757977962493896e-06, 1.3567507266998291e-05, 2.5559216737747192e-05, 3.7550926208496094e-05, 4.9542635679244995e-05, 6.15343451499939e-05, 7.35260546207428e-05, 8.55177640914917e-05, 9.75094735622406e-05, 0.0001095011830329895, 0.0001214928925037384, 0.0001334846019744873, 0.0001454763114452362, 0.0001574680209159851, 0.000169459730386734, 0.0001814514398574829, 0.0001934431493282318, 0.0002054348587989807, 0.00021742656826972961, 0.00022941827774047852, 0.00024140998721122742, 0.0002534016966819763, 0.0002653934061527252, 0.0002773851156234741, 0.000289376825094223, 0.0003013685345649719, 0.0003133602440357208, 0.0003253519535064697, 0.00033734366297721863, 0.00034933537244796753, 0.00036132708191871643, 0.00037331879138946533, 0.00038531050086021423, 0.00039730221033096313, 0.00040929391980171204, 0.00042128562927246094]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 16.0, 29.0, 51.0, 105.0, 217.0, 498.0, 1400.0, 5197.0, 28015.0, 278305.0, 672444.0, 51094.0, 8041.0, 1926.0, 666.0, 272.0, 107.0, 73.0, 47.0, 22.0, 15.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.0721282958984375, -2.011444091796875, -1.9507598876953125, -1.89007568359375, -1.8293914794921875, -1.768707275390625, -1.7080230712890625, -1.6473388671875, -1.5866546630859375, -1.525970458984375, -1.4652862548828125, -1.40460205078125, -1.3439178466796875, -1.283233642578125, -1.2225494384765625, -1.161865234375, -1.1011810302734375, -1.040496826171875, -0.9798126220703125, -0.91912841796875, -0.8584442138671875, -0.797760009765625, -0.7370758056640625, -0.6763916015625, -0.6157073974609375, -0.555023193359375, -0.4943389892578125, -0.43365478515625, -0.3729705810546875, -0.312286376953125, -0.2516021728515625, -0.19091796875, -0.1302337646484375, -0.069549560546875, -0.0088653564453125, 0.05181884765625, 0.1125030517578125, 0.173187255859375, 0.2338714599609375, 0.2945556640625, 0.3552398681640625, 0.415924072265625, 0.4766082763671875, 0.53729248046875, 0.5979766845703125, 0.658660888671875, 0.7193450927734375, 0.780029296875, 0.8407135009765625, 0.901397705078125, 0.9620819091796875, 1.02276611328125, 1.0834503173828125, 1.144134521484375, 1.2048187255859375, 1.2655029296875, 1.3261871337890625, 1.386871337890625, 1.4475555419921875, 1.50823974609375, 1.5689239501953125, 1.629608154296875, 1.6902923583984375, 1.7509765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 6.0, 10.0, 13.0, 24.0, 35.0, 47.0, 78.0, 95.0, 120.0, 138.0, 126.0, 90.0, 62.0, 55.0, 42.0, 21.0, 13.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.623046875, -1.564208984375, -1.50537109375, -1.446533203125, -1.3876953125, -1.328857421875, -1.27001953125, -1.211181640625, -1.15234375, -1.093505859375, -1.03466796875, -0.975830078125, -0.9169921875, -0.858154296875, -0.79931640625, -0.740478515625, -0.681640625, -0.622802734375, -0.56396484375, -0.505126953125, -0.4462890625, -0.387451171875, -0.32861328125, -0.269775390625, -0.2109375, -0.152099609375, -0.09326171875, -0.034423828125, 0.0244140625, 0.083251953125, 0.14208984375, 0.200927734375, 0.259765625, 0.318603515625, 0.37744140625, 0.436279296875, 0.4951171875, 0.553955078125, 0.61279296875, 0.671630859375, 0.73046875, 0.789306640625, 0.84814453125, 0.906982421875, 0.9658203125, 1.024658203125, 1.08349609375, 1.142333984375, 1.201171875, 1.260009765625, 1.31884765625, 1.377685546875, 1.4365234375, 1.495361328125, 1.55419921875, 1.613037109375, 1.671875, 1.730712890625, 1.78955078125, 1.848388671875, 1.9072265625, 1.966064453125, 2.02490234375, 2.083740234375, 2.142578125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 21.0, 33.0, 110.0, 257.0, 355.0, 151.0, 40.0, 14.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.16654968261719, -63.66020965576172, -62.153873443603516, -60.64753341674805, -59.141197204589844, -57.634857177734375, -56.12852096557617, -54.6221809387207, -53.1158447265625, -51.60950469970703, -50.10316848754883, -48.59682846069336, -47.090492248535156, -45.58415222167969, -44.077816009521484, -42.571475982666016, -41.06513977050781, -39.558799743652344, -38.05246353149414, -36.54612350463867, -35.03978729248047, -33.533447265625, -32.0271110534668, -30.520771026611328, -29.01443099975586, -27.508092880249023, -26.001754760742188, -24.49541664123535, -22.989078521728516, -21.48274040222168, -19.976402282714844, -18.470062255859375, -16.963726043701172, -15.457387924194336, -13.9510498046875, -12.444711685180664, -10.938373565673828, -9.432035446166992, -7.92569637298584, -6.419358253479004, -4.913020133972168, -3.406682014465332, -1.900343656539917, -0.39400529861450195, 1.112332820892334, 2.61867094039917, 4.125009536743164, 5.63134765625, 7.137685775756836, 8.644023895263672, 10.150362014770508, 11.656700134277344, 13.16303825378418, 14.669376373291016, 16.175716400146484, 17.682052612304688, 19.188392639160156, 20.694730758666992, 22.201068878173828, 23.707406997680664, 25.2137451171875, 26.720083236694336, 28.226421356201172, 29.73276138305664, 31.239097595214844]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 3.0, 6.0, 9.0, 15.0, 11.0, 19.0, 23.0, 27.0, 23.0, 21.0, 26.0, 30.0, 43.0, 39.0, 56.0, 61.0, 80.0, 77.0, 72.0, 43.0, 44.0, 43.0, 35.0, 27.0, 21.0, 24.0, 26.0, 22.0, 6.0, 10.0, 9.0, 9.0, 11.0, 7.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.80035400390625, -22.16496467590332, -21.529577255249023, -20.894187927246094, -20.258800506591797, -19.623411178588867, -18.98802375793457, -18.35263442993164, -17.717247009277344, -17.081857681274414, -16.446470260620117, -15.811081886291504, -15.17569351196289, -14.540304183959961, -13.904915809631348, -13.269527435302734, -12.634138107299805, -11.998749732971191, -11.363361358642578, -10.727972984313965, -10.092584609985352, -9.457195281982422, -8.821806907653809, -8.186418533325195, -7.551030158996582, -6.915641784667969, -6.2802534103393555, -5.644864559173584, -5.009476184844971, -4.374087810516357, -3.738699197769165, -3.1033105850219727, -2.4679203033447266, -1.8325318098068237, -1.197143316268921, -0.5617548227310181, 0.07363367080688477, 0.709022045135498, 1.3444106578826904, 1.9797992706298828, 2.615187644958496, 3.2505760192871094, 3.8859646320343018, 4.521353244781494, 5.156741619110107, 5.792129993438721, 6.427518844604492, 7.0629072189331055, 7.698295593261719, 8.333683967590332, 8.969072341918945, 9.604460716247559, 10.239849090576172, 10.875238418579102, 11.510626792907715, 12.146015167236328, 12.781403541564941, 13.416791915893555, 14.052180290222168, 14.687568664550781, 15.322957992553711, 15.958345413208008, 16.593734741210938, 17.229122161865234, 17.864511489868164]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 10.0, 22.0, 27.0, 36.0, 35.0, 82.0, 127.0, 189.0, 376.0, 675.0, 1462.0, 3253.0, 8691.0, 31586.0, 223963.0, 2324994.0, 1437455.0, 126533.0, 22230.0, 7054.0, 2811.0, 1210.0, 650.0, 334.0, 175.0, 107.0, 75.0, 30.0, 25.0, 15.0, 20.0, 5.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.29296875, -2.2272186279296875, -2.161468505859375, -2.0957183837890625, -2.02996826171875, -1.9642181396484375, -1.898468017578125, -1.8327178955078125, -1.7669677734375, -1.7012176513671875, -1.635467529296875, -1.5697174072265625, -1.50396728515625, -1.4382171630859375, -1.372467041015625, -1.3067169189453125, -1.240966796875, -1.1752166748046875, -1.109466552734375, -1.0437164306640625, -0.97796630859375, -0.9122161865234375, -0.846466064453125, -0.7807159423828125, -0.7149658203125, -0.6492156982421875, -0.583465576171875, -0.5177154541015625, -0.45196533203125, -0.3862152099609375, -0.320465087890625, -0.2547149658203125, -0.18896484375, -0.1232147216796875, -0.057464599609375, 0.0082855224609375, 0.07403564453125, 0.1397857666015625, 0.205535888671875, 0.2712860107421875, 0.3370361328125, 0.4027862548828125, 0.468536376953125, 0.5342864990234375, 0.60003662109375, 0.6657867431640625, 0.731536865234375, 0.7972869873046875, 0.863037109375, 0.9287872314453125, 0.994537353515625, 1.0602874755859375, 1.12603759765625, 1.1917877197265625, 1.257537841796875, 1.3232879638671875, 1.3890380859375, 1.4547882080078125, 1.520538330078125, 1.5862884521484375, 1.65203857421875, 1.7177886962890625, 1.783538818359375, 1.8492889404296875, 1.9150390625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 9.0, 7.0, 13.0, 13.0, 17.0, 15.0, 27.0, 33.0, 27.0, 45.0, 51.0, 45.0, 56.0, 44.0, 41.0, 54.0, 52.0, 61.0, 43.0, 51.0, 40.0, 36.0, 43.0, 33.0, 25.0, 20.0, 18.0, 10.0, 13.0, 13.0, 12.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341796875, -1.296630859375, -1.25146484375, -1.206298828125, -1.1611328125, -1.115966796875, -1.07080078125, -1.025634765625, -0.98046875, -0.935302734375, -0.89013671875, -0.844970703125, -0.7998046875, -0.754638671875, -0.70947265625, -0.664306640625, -0.619140625, -0.573974609375, -0.52880859375, -0.483642578125, -0.4384765625, -0.393310546875, -0.34814453125, -0.302978515625, -0.2578125, -0.212646484375, -0.16748046875, -0.122314453125, -0.0771484375, -0.031982421875, 0.01318359375, 0.058349609375, 0.103515625, 0.148681640625, 0.19384765625, 0.239013671875, 0.2841796875, 0.329345703125, 0.37451171875, 0.419677734375, 0.46484375, 0.510009765625, 0.55517578125, 0.600341796875, 0.6455078125, 0.690673828125, 0.73583984375, 0.781005859375, 0.826171875, 0.871337890625, 0.91650390625, 0.961669921875, 1.0068359375, 1.052001953125, 1.09716796875, 1.142333984375, 1.1875, 1.232666015625, 1.27783203125, 1.322998046875, 1.3681640625, 1.413330078125, 1.45849609375, 1.503662109375, 1.548828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 13.0, 27.0, 34.0, 85.0, 141.0, 288.0, 610.0, 1732.0, 12467.0, 1389734.0, 2769268.0, 16314.0, 2086.0, 733.0, 347.0, 179.0, 117.0, 53.0, 24.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.87860107421875, -5.6439208984375, -5.40924072265625, -5.174560546875, -4.93988037109375, -4.7052001953125, -4.47052001953125, -4.23583984375, -4.00115966796875, -3.7664794921875, -3.53179931640625, -3.297119140625, -3.06243896484375, -2.8277587890625, -2.59307861328125, -2.3583984375, -2.12371826171875, -1.8890380859375, -1.65435791015625, -1.419677734375, -1.18499755859375, -0.9503173828125, -0.71563720703125, -0.48095703125, -0.24627685546875, -0.0115966796875, 0.22308349609375, 0.457763671875, 0.69244384765625, 0.9271240234375, 1.16180419921875, 1.396484375, 1.63116455078125, 1.8658447265625, 2.10052490234375, 2.335205078125, 2.56988525390625, 2.8045654296875, 3.03924560546875, 3.27392578125, 3.50860595703125, 3.7432861328125, 3.97796630859375, 4.212646484375, 4.44732666015625, 4.6820068359375, 4.91668701171875, 5.1513671875, 5.38604736328125, 5.6207275390625, 5.85540771484375, 6.090087890625, 6.32476806640625, 6.5594482421875, 6.79412841796875, 7.02880859375, 7.26348876953125, 7.4981689453125, 7.73284912109375, 7.967529296875, 8.20220947265625, 8.4368896484375, 8.67156982421875, 8.90625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 11.0, 20.0, 30.0, 33.0, 69.0, 150.0, 332.0, 758.0, 1195.0, 809.0, 322.0, 144.0, 82.0, 38.0, 26.0, 18.0, 16.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.275604248046875, -3.12347412109375, -2.971343994140625, -2.8192138671875, -2.667083740234375, -2.51495361328125, -2.362823486328125, -2.210693359375, -2.058563232421875, -1.90643310546875, -1.754302978515625, -1.6021728515625, -1.450042724609375, -1.29791259765625, -1.145782470703125, -0.99365234375, -0.841522216796875, -0.68939208984375, -0.537261962890625, -0.3851318359375, -0.233001708984375, -0.08087158203125, 0.071258544921875, 0.223388671875, 0.375518798828125, 0.52764892578125, 0.679779052734375, 0.8319091796875, 0.984039306640625, 1.13616943359375, 1.288299560546875, 1.4404296875, 1.592559814453125, 1.74468994140625, 1.896820068359375, 2.0489501953125, 2.201080322265625, 2.35321044921875, 2.505340576171875, 2.657470703125, 2.809600830078125, 2.96173095703125, 3.113861083984375, 3.2659912109375, 3.418121337890625, 3.57025146484375, 3.722381591796875, 3.87451171875, 4.026641845703125, 4.17877197265625, 4.330902099609375, 4.4830322265625, 4.635162353515625, 4.78729248046875, 4.939422607421875, 5.091552734375, 5.243682861328125, 5.39581298828125, 5.547943115234375, 5.7000732421875, 5.852203369140625, 6.00433349609375, 6.156463623046875, 6.30859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 7.0, 17.0, 28.0, 55.0, 82.0, 146.0, 205.0, 176.0, 123.0, 74.0, 43.0, 16.0, 13.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.545799255371094, -37.470001220703125, -36.39420700073242, -35.31841278076172, -34.24261474609375, -33.16681671142578, -32.09102249145508, -31.015226364135742, -29.939430236816406, -28.86363410949707, -27.787837982177734, -26.7120418548584, -25.636245727539062, -24.560449600219727, -23.48465347290039, -22.408857345581055, -21.33306121826172, -20.257265090942383, -19.181468963623047, -18.10567283630371, -17.029876708984375, -15.954080581665039, -14.878284454345703, -13.802488327026367, -12.726692199707031, -11.650896072387695, -10.57509994506836, -9.499303817749023, -8.423507690429688, -7.347711563110352, -6.271915435791016, -5.19611930847168, -4.120326995849609, -3.0445308685302734, -1.9687347412109375, -0.8929386138916016, 0.18285751342773438, 1.2586536407470703, 2.3344497680664062, 3.410245895385742, 4.486042022705078, 5.561838150024414, 6.63763427734375, 7.713430404663086, 8.789226531982422, 9.865022659301758, 10.940818786621094, 12.01661491394043, 13.092411041259766, 14.168207168579102, 15.244003295898438, 16.319799423217773, 17.39559555053711, 18.471391677856445, 19.54718780517578, 20.622983932495117, 21.698780059814453, 22.77457618713379, 23.850372314453125, 24.92616844177246, 26.001964569091797, 27.077760696411133, 28.15355682373047, 29.229352951049805, 30.30514907836914]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 6.0, 14.0, 11.0, 15.0, 20.0, 22.0, 34.0, 28.0, 32.0, 45.0, 47.0, 42.0, 42.0, 52.0, 56.0, 50.0, 46.0, 48.0, 47.0, 54.0, 43.0, 40.0, 35.0, 33.0, 24.0, 18.0, 18.0, 13.0, 15.0, 17.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9271879196167, -12.476917266845703, -12.026646614074707, -11.576375961303711, -11.126104354858398, -10.675833702087402, -10.225563049316406, -9.77529239654541, -9.325021743774414, -8.874751091003418, -8.424480438232422, -7.974209308624268, -7.523938179016113, -7.073667526245117, -6.623396873474121, -6.173126220703125, -5.7228546142578125, -5.272583961486816, -4.822312831878662, -4.372042179107666, -3.921771287918091, -3.4715003967285156, -3.0212297439575195, -2.5709588527679443, -2.120687961578369, -1.670417070388794, -1.2201462984085083, -0.7698755264282227, -0.31960463523864746, 0.13066625595092773, 0.5809369087219238, 1.031207799911499, 1.4814777374267578, 1.931748628616333, 2.382019519805908, 2.8322901725769043, 3.2825610637664795, 3.7328319549560547, 4.183102607727051, 4.633373260498047, 5.083644390106201, 5.533915042877197, 5.984186172485352, 6.434456825256348, 6.884727478027344, 7.334998607635498, 7.785269260406494, 8.235540390014648, 8.685811042785645, 9.13608169555664, 9.586352348327637, 10.036623001098633, 10.486894607543945, 10.937165260314941, 11.387435913085938, 11.837706565856934, 12.28797721862793, 12.738247871398926, 13.188518524169922, 13.638790130615234, 14.08906078338623, 14.539331436157227, 14.989602088928223, 15.439872741699219, 15.890144348144531]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 12.0, 12.0, 12.0, 26.0, 26.0, 40.0, 63.0, 99.0, 130.0, 253.0, 384.0, 644.0, 1195.0, 2424.0, 5108.0, 12932.0, 38407.0, 141702.0, 448758.0, 285413.0, 73482.0, 22034.0, 7940.0, 3529.0, 1731.0, 899.0, 494.0, 280.0, 188.0, 104.0, 72.0, 47.0, 33.0, 27.0, 16.0, 7.0, 7.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.408203125, -2.334686279296875, -2.26116943359375, -2.187652587890625, -2.1141357421875, -2.040618896484375, -1.96710205078125, -1.893585205078125, -1.820068359375, -1.746551513671875, -1.67303466796875, -1.599517822265625, -1.5260009765625, -1.452484130859375, -1.37896728515625, -1.305450439453125, -1.23193359375, -1.158416748046875, -1.08489990234375, -1.011383056640625, -0.9378662109375, -0.864349365234375, -0.79083251953125, -0.717315673828125, -0.643798828125, -0.570281982421875, -0.49676513671875, -0.423248291015625, -0.3497314453125, -0.276214599609375, -0.20269775390625, -0.129180908203125, -0.0556640625, 0.017852783203125, 0.09136962890625, 0.164886474609375, 0.2384033203125, 0.311920166015625, 0.38543701171875, 0.458953857421875, 0.532470703125, 0.605987548828125, 0.67950439453125, 0.753021240234375, 0.8265380859375, 0.900054931640625, 0.97357177734375, 1.047088623046875, 1.12060546875, 1.194122314453125, 1.26763916015625, 1.341156005859375, 1.4146728515625, 1.488189697265625, 1.56170654296875, 1.635223388671875, 1.708740234375, 1.782257080078125, 1.85577392578125, 1.929290771484375, 2.0028076171875, 2.076324462890625, 2.14984130859375, 2.223358154296875, 2.296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 9.0, 8.0, 9.0, 16.0, 20.0, 20.0, 28.0, 30.0, 25.0, 28.0, 32.0, 43.0, 46.0, 37.0, 41.0, 44.0, 42.0, 41.0, 45.0, 52.0, 47.0, 35.0, 29.0, 38.0, 33.0, 40.0, 22.0, 26.0, 17.0, 21.0, 13.0, 17.0, 10.0, 4.0, 5.0, 3.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.337066650390625, -1.29425048828125, -1.251434326171875, -1.2086181640625, -1.165802001953125, -1.12298583984375, -1.080169677734375, -1.037353515625, -0.994537353515625, -0.95172119140625, -0.908905029296875, -0.8660888671875, -0.823272705078125, -0.78045654296875, -0.737640380859375, -0.69482421875, -0.652008056640625, -0.60919189453125, -0.566375732421875, -0.5235595703125, -0.480743408203125, -0.43792724609375, -0.395111083984375, -0.352294921875, -0.309478759765625, -0.26666259765625, -0.223846435546875, -0.1810302734375, -0.138214111328125, -0.09539794921875, -0.052581787109375, -0.009765625, 0.033050537109375, 0.07586669921875, 0.118682861328125, 0.1614990234375, 0.204315185546875, 0.24713134765625, 0.289947509765625, 0.332763671875, 0.375579833984375, 0.41839599609375, 0.461212158203125, 0.5040283203125, 0.546844482421875, 0.58966064453125, 0.632476806640625, 0.67529296875, 0.718109130859375, 0.76092529296875, 0.803741455078125, 0.8465576171875, 0.889373779296875, 0.93218994140625, 0.975006103515625, 1.017822265625, 1.060638427734375, 1.10345458984375, 1.146270751953125, 1.1890869140625, 1.231903076171875, 1.27471923828125, 1.317535400390625, 1.3603515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 10.0, 6.0, 10.0, 15.0, 13.0, 19.0, 48.0, 62.0, 68.0, 89.0, 148.0, 212.0, 466.0, 920.0, 2464.0, 9538.0, 65888.0, 780467.0, 163707.0, 17880.0, 3869.0, 1259.0, 582.0, 287.0, 157.0, 112.0, 82.0, 47.0, 40.0, 19.0, 16.0, 15.0, 3.0, 8.0, 8.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.515625, -4.37744140625, -4.2392578125, -4.10107421875, -3.962890625, -3.82470703125, -3.6865234375, -3.54833984375, -3.41015625, -3.27197265625, -3.1337890625, -2.99560546875, -2.857421875, -2.71923828125, -2.5810546875, -2.44287109375, -2.3046875, -2.16650390625, -2.0283203125, -1.89013671875, -1.751953125, -1.61376953125, -1.4755859375, -1.33740234375, -1.19921875, -1.06103515625, -0.9228515625, -0.78466796875, -0.646484375, -0.50830078125, -0.3701171875, -0.23193359375, -0.09375, 0.04443359375, 0.1826171875, 0.32080078125, 0.458984375, 0.59716796875, 0.7353515625, 0.87353515625, 1.01171875, 1.14990234375, 1.2880859375, 1.42626953125, 1.564453125, 1.70263671875, 1.8408203125, 1.97900390625, 2.1171875, 2.25537109375, 2.3935546875, 2.53173828125, 2.669921875, 2.80810546875, 2.9462890625, 3.08447265625, 3.22265625, 3.36083984375, 3.4990234375, 3.63720703125, 3.775390625, 3.91357421875, 4.0517578125, 4.18994140625, 4.328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 5.0, 4.0, 5.0, 12.0, 11.0, 17.0, 16.0, 22.0, 29.0, 27.0, 31.0, 43.0, 54.0, 51.0, 62.0, 55.0, 57.0, 73.0, 56.0, 49.0, 66.0, 41.0, 37.0, 25.0, 34.0, 30.0, 17.0, 10.0, 15.0, 8.0, 13.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.91015625, -6.7261962890625, -6.542236328125, -6.3582763671875, -6.17431640625, -5.9903564453125, -5.806396484375, -5.6224365234375, -5.4384765625, -5.2545166015625, -5.070556640625, -4.8865966796875, -4.70263671875, -4.5186767578125, -4.334716796875, -4.1507568359375, -3.966796875, -3.7828369140625, -3.598876953125, -3.4149169921875, -3.23095703125, -3.0469970703125, -2.863037109375, -2.6790771484375, -2.4951171875, -2.3111572265625, -2.127197265625, -1.9432373046875, -1.75927734375, -1.5753173828125, -1.391357421875, -1.2073974609375, -1.0234375, -0.8394775390625, -0.655517578125, -0.4715576171875, -0.28759765625, -0.1036376953125, 0.080322265625, 0.2642822265625, 0.4482421875, 0.6322021484375, 0.816162109375, 1.0001220703125, 1.18408203125, 1.3680419921875, 1.552001953125, 1.7359619140625, 1.919921875, 2.1038818359375, 2.287841796875, 2.4718017578125, 2.65576171875, 2.8397216796875, 3.023681640625, 3.2076416015625, 3.3916015625, 3.5755615234375, 3.759521484375, 3.9434814453125, 4.12744140625, 4.3114013671875, 4.495361328125, 4.6793212890625, 4.86328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 16.0, 33.0, 52.0, 79.0, 146.0, 253.0, 538.0, 1291.0, 3528.0, 10145.0, 36915.0, 219167.0, 681892.0, 69400.0, 16514.0, 5132.0, 1848.0, 771.0, 351.0, 187.0, 102.0, 74.0, 41.0, 23.0, 12.0, 10.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.355010986328125, -1.31158447265625, -1.268157958984375, -1.2247314453125, -1.181304931640625, -1.13787841796875, -1.094451904296875, -1.051025390625, -1.007598876953125, -0.96417236328125, -0.920745849609375, -0.8773193359375, -0.833892822265625, -0.79046630859375, -0.747039794921875, -0.70361328125, -0.660186767578125, -0.61676025390625, -0.573333740234375, -0.5299072265625, -0.486480712890625, -0.44305419921875, -0.399627685546875, -0.356201171875, -0.312774658203125, -0.26934814453125, -0.225921630859375, -0.1824951171875, -0.139068603515625, -0.09564208984375, -0.052215576171875, -0.0087890625, 0.034637451171875, 0.07806396484375, 0.121490478515625, 0.1649169921875, 0.208343505859375, 0.25177001953125, 0.295196533203125, 0.338623046875, 0.382049560546875, 0.42547607421875, 0.468902587890625, 0.5123291015625, 0.555755615234375, 0.59918212890625, 0.642608642578125, 0.68603515625, 0.729461669921875, 0.77288818359375, 0.816314697265625, 0.8597412109375, 0.903167724609375, 0.94659423828125, 0.990020751953125, 1.033447265625, 1.076873779296875, 1.12030029296875, 1.163726806640625, 1.2071533203125, 1.250579833984375, 1.29400634765625, 1.337432861328125, 1.380859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 6.0, 13.0, 14.0, 14.0, 16.0, 15.0, 36.0, 57.0, 72.0, 96.0, 127.0, 123.0, 98.0, 88.0, 55.0, 39.0, 22.0, 14.0, 18.0, 16.0, 7.0, 6.0, 10.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00039577484130859375, -0.0003844723105430603, -0.00037316977977752686, -0.0003618672490119934, -0.00035056471824645996, -0.0003392621874809265, -0.00032795965671539307, -0.0003166571259498596, -0.00030535459518432617, -0.0002940520644187927, -0.0002827495336532593, -0.00027144700288772583, -0.0002601444721221924, -0.00024884194135665894, -0.0002375394105911255, -0.00022623687982559204, -0.0002149343490600586, -0.00020363181829452515, -0.0001923292875289917, -0.00018102675676345825, -0.0001697242259979248, -0.00015842169523239136, -0.0001471191644668579, -0.00013581663370132446, -0.00012451410293579102, -0.00011321157217025757, -0.00010190904140472412, -9.060651063919067e-05, -7.930397987365723e-05, -6.800144910812378e-05, -5.669891834259033e-05, -4.5396387577056885e-05, -3.409385681152344e-05, -2.279132604598999e-05, -1.1488795280456543e-05, -1.862645149230957e-07, 1.1116266250610352e-05, 2.24187970161438e-05, 3.3721327781677246e-05, 4.502385854721069e-05, 5.632638931274414e-05, 6.762892007827759e-05, 7.893145084381104e-05, 9.023398160934448e-05, 0.00010153651237487793, 0.00011283904314041138, 0.00012414157390594482, 0.00013544410467147827, 0.00014674663543701172, 0.00015804916620254517, 0.0001693516969680786, 0.00018065422773361206, 0.0001919567584991455, 0.00020325928926467896, 0.0002145618200302124, 0.00022586435079574585, 0.0002371668815612793, 0.00024846941232681274, 0.0002597719430923462, 0.00027107447385787964, 0.0002823770046234131, 0.00029367953538894653, 0.00030498206615448, 0.00031628459692001343, 0.0003275871276855469]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 15.0, 26.0, 26.0, 34.0, 55.0, 68.0, 95.0, 155.0, 218.0, 382.0, 687.0, 1365.0, 3331.0, 7944.0, 22529.0, 78188.0, 600408.0, 252284.0, 53082.0, 16165.0, 6158.0, 2540.0, 1207.0, 625.0, 337.0, 197.0, 165.0, 69.0, 55.0, 35.0, 26.0, 22.0, 14.0, 10.0, 7.0, 3.0, 5.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2548828125, -1.2198867797851562, -1.1848907470703125, -1.1498947143554688, -1.114898681640625, -1.0799026489257812, -1.0449066162109375, -1.0099105834960938, -0.97491455078125, -0.9399185180664062, -0.9049224853515625, -0.8699264526367188, -0.834930419921875, -0.7999343872070312, -0.7649383544921875, -0.7299423217773438, -0.6949462890625, -0.6599502563476562, -0.6249542236328125, -0.5899581909179688, -0.554962158203125, -0.5199661254882812, -0.4849700927734375, -0.44997406005859375, -0.41497802734375, -0.37998199462890625, -0.3449859619140625, -0.30998992919921875, -0.274993896484375, -0.23999786376953125, -0.2050018310546875, -0.17000579833984375, -0.135009765625, -0.10001373291015625, -0.0650177001953125, -0.03002166748046875, 0.004974365234375, 0.03997039794921875, 0.0749664306640625, 0.10996246337890625, 0.14495849609375, 0.17995452880859375, 0.2149505615234375, 0.24994659423828125, 0.284942626953125, 0.31993865966796875, 0.3549346923828125, 0.38993072509765625, 0.4249267578125, 0.45992279052734375, 0.4949188232421875, 0.5299148559570312, 0.564910888671875, 0.5999069213867188, 0.6349029541015625, 0.6698989868164062, 0.70489501953125, 0.7398910522460938, 0.7748870849609375, 0.8098831176757812, 0.844879150390625, 0.8798751831054688, 0.9148712158203125, 0.9498672485351562, 0.98486328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 8.0, 14.0, 16.0, 20.0, 19.0, 28.0, 33.0, 54.0, 65.0, 63.0, 84.0, 96.0, 108.0, 79.0, 60.0, 50.0, 33.0, 25.0, 23.0, 24.0, 16.0, 16.0, 7.0, 11.0, 9.0, 4.0, 0.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.234375, -1.198486328125, -1.16259765625, -1.126708984375, -1.0908203125, -1.054931640625, -1.01904296875, -0.983154296875, -0.947265625, -0.911376953125, -0.87548828125, -0.839599609375, -0.8037109375, -0.767822265625, -0.73193359375, -0.696044921875, -0.66015625, -0.624267578125, -0.58837890625, -0.552490234375, -0.5166015625, -0.480712890625, -0.44482421875, -0.408935546875, -0.373046875, -0.337158203125, -0.30126953125, -0.265380859375, -0.2294921875, -0.193603515625, -0.15771484375, -0.121826171875, -0.0859375, -0.050048828125, -0.01416015625, 0.021728515625, 0.0576171875, 0.093505859375, 0.12939453125, 0.165283203125, 0.201171875, 0.237060546875, 0.27294921875, 0.308837890625, 0.3447265625, 0.380615234375, 0.41650390625, 0.452392578125, 0.48828125, 0.524169921875, 0.56005859375, 0.595947265625, 0.6318359375, 0.667724609375, 0.70361328125, 0.739501953125, 0.775390625, 0.811279296875, 0.84716796875, 0.883056640625, 0.9189453125, 0.954833984375, 0.99072265625, 1.026611328125, 1.0625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 13.0, 26.0, 50.0, 109.0, 139.0, 310.0, 134.0, 86.0, 51.0, 27.0, 19.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.7954158782959, -24.820581436157227, -23.845746994018555, -22.870912551879883, -21.89607810974121, -20.92124366760254, -19.946407318115234, -18.971572875976562, -17.99673843383789, -17.02190399169922, -16.047069549560547, -15.072235107421875, -14.097400665283203, -13.122566223144531, -12.147730827331543, -11.172896385192871, -10.198062896728516, -9.223228454589844, -8.248394012451172, -7.273559093475342, -6.29872465133667, -5.323890209197998, -4.349055290222168, -3.374220848083496, -2.399386405944824, -1.4245518445968628, -0.44971728324890137, 0.5251173973083496, 1.4999518394470215, 2.4747862815856934, 3.4496212005615234, 4.424455642700195, 5.399288177490234, 6.374122619628906, 7.348957061767578, 8.32379150390625, 9.298625946044922, 10.273460388183594, 11.248295783996582, 12.223130226135254, 13.197964668273926, 14.172799110412598, 15.14763355255127, 16.122468948364258, 17.09730339050293, 18.0721378326416, 19.046972274780273, 20.021806716918945, 20.996641159057617, 21.97147560119629, 22.94631004333496, 23.921144485473633, 24.895978927612305, 25.870813369750977, 26.84564971923828, 27.820484161376953, 28.795318603515625, 29.770153045654297, 30.74498748779297, 31.71982192993164, 32.69465637207031, 33.669490814208984, 34.644325256347656, 35.61915969848633, 36.593994140625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 7.0, 7.0, 11.0, 10.0, 19.0, 22.0, 23.0, 21.0, 27.0, 29.0, 35.0, 32.0, 45.0, 69.0, 108.0, 99.0, 71.0, 67.0, 49.0, 36.0, 26.0, 28.0, 27.0, 24.0, 13.0, 13.0, 21.0, 12.0, 8.0, 11.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.428274154663086, -23.751670837402344, -23.0750675201416, -22.39846420288086, -21.721858978271484, -21.045255661010742, -20.36865234375, -19.692049026489258, -19.015445709228516, -18.338842391967773, -17.66223907470703, -16.98563575744629, -16.309032440185547, -15.632428169250488, -14.95582389831543, -14.279220581054688, -13.602617263793945, -12.926013946533203, -12.249410629272461, -11.572806358337402, -10.89620304107666, -10.219599723815918, -9.54299545288086, -8.866392135620117, -8.189788818359375, -7.513185501098633, -6.836581707000732, -6.159977912902832, -5.48337459564209, -4.806771278381348, -4.130167484283447, -3.453563690185547, -2.7769603729248047, -2.1003568172454834, -1.423753261566162, -0.7471497058868408, -0.07054615020751953, 0.6060574054718018, 1.282660961151123, 1.9592647552490234, 2.6358680725097656, 3.312471628189087, 3.989075183868408, 4.665678977966309, 5.342282295227051, 6.018885612487793, 6.695489406585693, 7.372093200683594, 8.048696517944336, 8.725299835205078, 9.40190315246582, 10.078507423400879, 10.755110740661621, 11.431714057922363, 12.108318328857422, 12.784921646118164, 13.461524963378906, 14.138128280639648, 14.81473159790039, 15.49133586883545, 16.167938232421875, 16.84454345703125, 17.521146774291992, 18.197750091552734, 18.874353408813477]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 8.0, 17.0, 11.0, 45.0, 54.0, 80.0, 103.0, 192.0, 294.0, 592.0, 995.0, 1926.0, 4154.0, 9859.0, 29451.0, 146800.0, 1260648.0, 2328391.0, 333919.0, 51148.0, 14412.0, 5498.0, 2581.0, 1343.0, 686.0, 403.0, 224.0, 138.0, 89.0, 71.0, 49.0, 17.0, 15.0, 14.0, 12.0, 11.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.208984375, -2.140380859375, -2.07177734375, -2.003173828125, -1.9345703125, -1.865966796875, -1.79736328125, -1.728759765625, -1.66015625, -1.591552734375, -1.52294921875, -1.454345703125, -1.3857421875, -1.317138671875, -1.24853515625, -1.179931640625, -1.111328125, -1.042724609375, -0.97412109375, -0.905517578125, -0.8369140625, -0.768310546875, -0.69970703125, -0.631103515625, -0.5625, -0.493896484375, -0.42529296875, -0.356689453125, -0.2880859375, -0.219482421875, -0.15087890625, -0.082275390625, -0.013671875, 0.054931640625, 0.12353515625, 0.192138671875, 0.2607421875, 0.329345703125, 0.39794921875, 0.466552734375, 0.53515625, 0.603759765625, 0.67236328125, 0.740966796875, 0.8095703125, 0.878173828125, 0.94677734375, 1.015380859375, 1.083984375, 1.152587890625, 1.22119140625, 1.289794921875, 1.3583984375, 1.427001953125, 1.49560546875, 1.564208984375, 1.6328125, 1.701416015625, 1.77001953125, 1.838623046875, 1.9072265625, 1.975830078125, 2.04443359375, 2.113037109375, 2.181640625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 9.0, 7.0, 11.0, 16.0, 14.0, 16.0, 19.0, 16.0, 35.0, 28.0, 46.0, 52.0, 55.0, 51.0, 43.0, 51.0, 56.0, 59.0, 50.0, 59.0, 43.0, 44.0, 28.0, 30.0, 28.0, 27.0, 29.0, 22.0, 8.0, 16.0, 5.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4501953125, -1.400421142578125, -1.35064697265625, -1.300872802734375, -1.2510986328125, -1.201324462890625, -1.15155029296875, -1.101776123046875, -1.052001953125, -1.002227783203125, -0.95245361328125, -0.902679443359375, -0.8529052734375, -0.803131103515625, -0.75335693359375, -0.703582763671875, -0.65380859375, -0.604034423828125, -0.55426025390625, -0.504486083984375, -0.4547119140625, -0.404937744140625, -0.35516357421875, -0.305389404296875, -0.255615234375, -0.205841064453125, -0.15606689453125, -0.106292724609375, -0.0565185546875, -0.006744384765625, 0.04302978515625, 0.092803955078125, 0.142578125, 0.192352294921875, 0.24212646484375, 0.291900634765625, 0.3416748046875, 0.391448974609375, 0.44122314453125, 0.490997314453125, 0.540771484375, 0.590545654296875, 0.64031982421875, 0.690093994140625, 0.7398681640625, 0.789642333984375, 0.83941650390625, 0.889190673828125, 0.93896484375, 0.988739013671875, 1.03851318359375, 1.088287353515625, 1.1380615234375, 1.187835693359375, 1.23760986328125, 1.287384033203125, 1.337158203125, 1.386932373046875, 1.43670654296875, 1.486480712890625, 1.5362548828125, 1.586029052734375, 1.63580322265625, 1.685577392578125, 1.7353515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 9.0, 29.0, 45.0, 82.0, 160.0, 399.0, 1451.0, 9923.0, 1823617.0, 2345635.0, 10591.0, 1525.0, 434.0, 172.0, 88.0, 53.0, 24.0, 11.0, 12.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.373291015625, -10.05908203125, -9.744873046875, -9.4306640625, -9.116455078125, -8.80224609375, -8.488037109375, -8.173828125, -7.859619140625, -7.54541015625, -7.231201171875, -6.9169921875, -6.602783203125, -6.28857421875, -5.974365234375, -5.66015625, -5.345947265625, -5.03173828125, -4.717529296875, -4.4033203125, -4.089111328125, -3.77490234375, -3.460693359375, -3.146484375, -2.832275390625, -2.51806640625, -2.203857421875, -1.8896484375, -1.575439453125, -1.26123046875, -0.947021484375, -0.6328125, -0.318603515625, -0.00439453125, 0.309814453125, 0.6240234375, 0.938232421875, 1.25244140625, 1.566650390625, 1.880859375, 2.195068359375, 2.50927734375, 2.823486328125, 3.1376953125, 3.451904296875, 3.76611328125, 4.080322265625, 4.39453125, 4.708740234375, 5.02294921875, 5.337158203125, 5.6513671875, 5.965576171875, 6.27978515625, 6.593994140625, 6.908203125, 7.222412109375, 7.53662109375, 7.850830078125, 8.1650390625, 8.479248046875, 8.79345703125, 9.107666015625, 9.421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 8.0, 12.0, 18.0, 27.0, 46.0, 71.0, 174.0, 357.0, 744.0, 1157.0, 738.0, 353.0, 142.0, 105.0, 52.0, 21.0, 19.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.79071044921875, -4.6165771484375, -4.44244384765625, -4.268310546875, -4.09417724609375, -3.9200439453125, -3.74591064453125, -3.57177734375, -3.39764404296875, -3.2235107421875, -3.04937744140625, -2.875244140625, -2.70111083984375, -2.5269775390625, -2.35284423828125, -2.1787109375, -2.00457763671875, -1.8304443359375, -1.65631103515625, -1.482177734375, -1.30804443359375, -1.1339111328125, -0.95977783203125, -0.78564453125, -0.61151123046875, -0.4373779296875, -0.26324462890625, -0.089111328125, 0.08502197265625, 0.2591552734375, 0.43328857421875, 0.607421875, 0.78155517578125, 0.9556884765625, 1.12982177734375, 1.303955078125, 1.47808837890625, 1.6522216796875, 1.82635498046875, 2.00048828125, 2.17462158203125, 2.3487548828125, 2.52288818359375, 2.697021484375, 2.87115478515625, 3.0452880859375, 3.21942138671875, 3.3935546875, 3.56768798828125, 3.7418212890625, 3.91595458984375, 4.090087890625, 4.26422119140625, 4.4383544921875, 4.61248779296875, 4.78662109375, 4.96075439453125, 5.1348876953125, 5.30902099609375, 5.483154296875, 5.65728759765625, 5.8314208984375, 6.00555419921875, 6.1796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 8.0, 12.0, 23.0, 53.0, 95.0, 122.0, 196.0, 204.0, 126.0, 73.0, 40.0, 19.0, 6.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.15872573852539, -48.99431228637695, -47.82989501953125, -46.66548156738281, -45.501068115234375, -44.33665084838867, -43.172237396240234, -42.00782012939453, -40.843406677246094, -39.678993225097656, -38.51457595825195, -37.350162506103516, -36.18574523925781, -35.021331787109375, -33.85691833496094, -32.6925048828125, -31.528087615966797, -30.363672256469727, -29.199256896972656, -28.03484344482422, -26.87042808532715, -25.706012725830078, -24.54159927368164, -23.37718391418457, -22.2127685546875, -21.04835319519043, -19.88393783569336, -18.719524383544922, -17.55510902404785, -16.39069366455078, -15.226279258728027, -14.061864852905273, -12.897453308105469, -11.733037948608398, -10.568623542785645, -9.40420913696289, -8.23979377746582, -7.075378894805908, -5.910964012145996, -4.746549606323242, -3.582134246826172, -2.4177193641662598, -1.2533044815063477, -0.08888959884643555, 1.0755252838134766, 2.2399401664733887, 3.404355049133301, 4.568769454956055, 5.733184814453125, 6.897599697113037, 8.06201457977295, 9.226428985595703, 10.390844345092773, 11.555259704589844, 12.719674110412598, 13.884088516235352, 15.048503875732422, 16.212919235229492, 17.377334594726562, 18.541748046875, 19.70616340637207, 20.87057876586914, 22.034992218017578, 23.19940757751465, 24.36382293701172]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 8.0, 11.0, 10.0, 14.0, 11.0, 12.0, 7.0, 13.0, 18.0, 21.0, 17.0, 30.0, 23.0, 27.0, 25.0, 40.0, 46.0, 45.0, 52.0, 56.0, 38.0, 43.0, 42.0, 44.0, 43.0, 36.0, 28.0, 31.0, 35.0, 23.0, 24.0, 21.0, 19.0, 8.0, 14.0, 13.0, 12.0, 7.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.603311538696289, -12.183328628540039, -11.763345718383789, -11.343362808227539, -10.923379898071289, -10.503396987915039, -10.083414077758789, -9.663430213928223, -9.243447303771973, -8.823464393615723, -8.403481483459473, -7.983498573303223, -7.5635151863098145, -7.1435322761535645, -6.7235493659973145, -6.303565979003906, -5.8835835456848145, -5.4636006355285645, -5.0436177253723145, -4.623634338378906, -4.203651428222656, -3.7836685180664062, -3.3636856079101562, -2.943702459335327, -2.523719549179077, -2.103736639022827, -1.683753490447998, -1.263770580291748, -0.8437875509262085, -0.42380452156066895, -0.0038216114044189453, 0.41616153717041016, 0.8361444473266602, 1.2561274766921997, 1.6761105060577393, 2.0960934162139893, 2.5160765647888184, 2.9360594749450684, 3.3560423851013184, 3.7760255336761475, 4.196008682250977, 4.615991592407227, 5.035974502563477, 5.455957412719727, 5.875940799713135, 6.295923709869385, 6.715906620025635, 7.135890007019043, 7.555872440338135, 7.975855350494385, 8.395838737487793, 8.815821647644043, 9.235804557800293, 9.655787467956543, 10.075770378112793, 10.495753288269043, 10.915736198425293, 11.335719108581543, 11.755702018737793, 12.175684928894043, 12.595667839050293, 13.01565170288086, 13.43563461303711, 13.85561752319336, 14.27560043334961]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 6.0, 6.0, 10.0, 16.0, 22.0, 26.0, 55.0, 66.0, 130.0, 196.0, 281.0, 515.0, 921.0, 1980.0, 4256.0, 10454.0, 29747.0, 100947.0, 382457.0, 371000.0, 97749.0, 28992.0, 10223.0, 4225.0, 1953.0, 1000.0, 523.0, 294.0, 182.0, 110.0, 77.0, 55.0, 25.0, 22.0, 13.0, 12.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.088623046875, -2.01123046875, -1.933837890625, -1.8564453125, -1.779052734375, -1.70166015625, -1.624267578125, -1.546875, -1.469482421875, -1.39208984375, -1.314697265625, -1.2373046875, -1.159912109375, -1.08251953125, -1.005126953125, -0.927734375, -0.850341796875, -0.77294921875, -0.695556640625, -0.6181640625, -0.540771484375, -0.46337890625, -0.385986328125, -0.30859375, -0.231201171875, -0.15380859375, -0.076416015625, 0.0009765625, 0.078369140625, 0.15576171875, 0.233154296875, 0.310546875, 0.387939453125, 0.46533203125, 0.542724609375, 0.6201171875, 0.697509765625, 0.77490234375, 0.852294921875, 0.9296875, 1.007080078125, 1.08447265625, 1.161865234375, 1.2392578125, 1.316650390625, 1.39404296875, 1.471435546875, 1.548828125, 1.626220703125, 1.70361328125, 1.781005859375, 1.8583984375, 1.935791015625, 2.01318359375, 2.090576171875, 2.16796875, 2.245361328125, 2.32275390625, 2.400146484375, 2.4775390625, 2.554931640625, 2.63232421875, 2.709716796875, 2.787109375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 11.0, 10.0, 13.0, 16.0, 17.0, 23.0, 20.0, 39.0, 36.0, 27.0, 45.0, 45.0, 49.0, 34.0, 37.0, 51.0, 49.0, 60.0, 42.0, 43.0, 42.0, 35.0, 28.0, 35.0, 30.0, 22.0, 20.0, 30.0, 19.0, 11.0, 14.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5751953125, -1.52752685546875, -1.4798583984375, -1.43218994140625, -1.384521484375, -1.33685302734375, -1.2891845703125, -1.24151611328125, -1.19384765625, -1.14617919921875, -1.0985107421875, -1.05084228515625, -1.003173828125, -0.95550537109375, -0.9078369140625, -0.86016845703125, -0.8125, -0.76483154296875, -0.7171630859375, -0.66949462890625, -0.621826171875, -0.57415771484375, -0.5264892578125, -0.47882080078125, -0.43115234375, -0.38348388671875, -0.3358154296875, -0.28814697265625, -0.240478515625, -0.19281005859375, -0.1451416015625, -0.09747314453125, -0.0498046875, -0.00213623046875, 0.0455322265625, 0.09320068359375, 0.140869140625, 0.18853759765625, 0.2362060546875, 0.28387451171875, 0.33154296875, 0.37921142578125, 0.4268798828125, 0.47454833984375, 0.522216796875, 0.56988525390625, 0.6175537109375, 0.66522216796875, 0.712890625, 0.76055908203125, 0.8082275390625, 0.85589599609375, 0.903564453125, 0.95123291015625, 0.9989013671875, 1.04656982421875, 1.09423828125, 1.14190673828125, 1.1895751953125, 1.23724365234375, 1.284912109375, 1.33258056640625, 1.3802490234375, 1.42791748046875, 1.4755859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 7.0, 15.0, 17.0, 19.0, 28.0, 38.0, 39.0, 88.0, 121.0, 202.0, 266.0, 477.0, 849.0, 1938.0, 5920.0, 26757.0, 211391.0, 724542.0, 59482.0, 10566.0, 3082.0, 1139.0, 585.0, 320.0, 209.0, 142.0, 85.0, 62.0, 35.0, 41.0, 19.0, 13.0, 13.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.37890625, -4.254547119140625, -4.13018798828125, -4.005828857421875, -3.8814697265625, -3.757110595703125, -3.63275146484375, -3.508392333984375, -3.384033203125, -3.259674072265625, -3.13531494140625, -3.010955810546875, -2.8865966796875, -2.762237548828125, -2.63787841796875, -2.513519287109375, -2.38916015625, -2.264801025390625, -2.14044189453125, -2.016082763671875, -1.8917236328125, -1.767364501953125, -1.64300537109375, -1.518646240234375, -1.394287109375, -1.269927978515625, -1.14556884765625, -1.021209716796875, -0.8968505859375, -0.772491455078125, -0.64813232421875, -0.523773193359375, -0.3994140625, -0.275054931640625, -0.15069580078125, -0.026336669921875, 0.0980224609375, 0.222381591796875, 0.34674072265625, 0.471099853515625, 0.595458984375, 0.719818115234375, 0.84417724609375, 0.968536376953125, 1.0928955078125, 1.217254638671875, 1.34161376953125, 1.465972900390625, 1.59033203125, 1.714691162109375, 1.83905029296875, 1.963409423828125, 2.0877685546875, 2.212127685546875, 2.33648681640625, 2.460845947265625, 2.585205078125, 2.709564208984375, 2.83392333984375, 2.958282470703125, 3.0826416015625, 3.207000732421875, 3.33135986328125, 3.455718994140625, 3.580078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 3.0, 9.0, 8.0, 9.0, 14.0, 20.0, 25.0, 27.0, 29.0, 46.0, 52.0, 51.0, 64.0, 52.0, 66.0, 73.0, 50.0, 55.0, 48.0, 51.0, 32.0, 30.0, 34.0, 23.0, 23.0, 25.0, 17.0, 9.0, 11.0, 7.0, 6.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.66033935546875, -7.4534912109375, -7.24664306640625, -7.039794921875, -6.83294677734375, -6.6260986328125, -6.41925048828125, -6.21240234375, -6.00555419921875, -5.7987060546875, -5.59185791015625, -5.385009765625, -5.17816162109375, -4.9713134765625, -4.76446533203125, -4.5576171875, -4.35076904296875, -4.1439208984375, -3.93707275390625, -3.730224609375, -3.52337646484375, -3.3165283203125, -3.10968017578125, -2.90283203125, -2.69598388671875, -2.4891357421875, -2.28228759765625, -2.075439453125, -1.86859130859375, -1.6617431640625, -1.45489501953125, -1.248046875, -1.04119873046875, -0.8343505859375, -0.62750244140625, -0.420654296875, -0.21380615234375, -0.0069580078125, 0.19989013671875, 0.40673828125, 0.61358642578125, 0.8204345703125, 1.02728271484375, 1.234130859375, 1.44097900390625, 1.6478271484375, 1.85467529296875, 2.0615234375, 2.26837158203125, 2.4752197265625, 2.68206787109375, 2.888916015625, 3.09576416015625, 3.3026123046875, 3.50946044921875, 3.71630859375, 3.92315673828125, 4.1300048828125, 4.33685302734375, 4.543701171875, 4.75054931640625, 4.9573974609375, 5.16424560546875, 5.37109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 5.0, 3.0, 3.0, 8.0, 8.0, 5.0, 8.0, 10.0, 24.0, 22.0, 46.0, 53.0, 89.0, 149.0, 283.0, 608.0, 1754.0, 6598.0, 34947.0, 699702.0, 270595.0, 25681.0, 5261.0, 1477.0, 554.0, 220.0, 139.0, 97.0, 56.0, 37.0, 25.0, 27.0, 8.0, 6.0, 7.0, 4.0, 3.0, 2.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5233001708984375, -1.472381591796875, -1.4214630126953125, -1.37054443359375, -1.3196258544921875, -1.268707275390625, -1.2177886962890625, -1.1668701171875, -1.1159515380859375, -1.065032958984375, -1.0141143798828125, -0.96319580078125, -0.9122772216796875, -0.861358642578125, -0.8104400634765625, -0.759521484375, -0.7086029052734375, -0.657684326171875, -0.6067657470703125, -0.55584716796875, -0.5049285888671875, -0.454010009765625, -0.4030914306640625, -0.3521728515625, -0.3012542724609375, -0.250335693359375, -0.1994171142578125, -0.14849853515625, -0.0975799560546875, -0.046661376953125, 0.0042572021484375, 0.05517578125, 0.1060943603515625, 0.157012939453125, 0.2079315185546875, 0.25885009765625, 0.3097686767578125, 0.360687255859375, 0.4116058349609375, 0.4625244140625, 0.5134429931640625, 0.564361572265625, 0.6152801513671875, 0.66619873046875, 0.7171173095703125, 0.768035888671875, 0.8189544677734375, 0.869873046875, 0.9207916259765625, 0.971710205078125, 1.0226287841796875, 1.07354736328125, 1.1244659423828125, 1.175384521484375, 1.2263031005859375, 1.2772216796875, 1.3281402587890625, 1.379058837890625, 1.4299774169921875, 1.48089599609375, 1.5318145751953125, 1.582733154296875, 1.6336517333984375, 1.6845703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 13.0, 16.0, 15.0, 24.0, 34.0, 56.0, 79.0, 132.0, 178.0, 165.0, 91.0, 51.0, 25.0, 31.0, 12.0, 14.0, 11.0, 8.0, 5.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004718303680419922, -0.0004596114158630371, -0.00044739246368408203, -0.00043517351150512695, -0.0004229545593261719, -0.0004107356071472168, -0.0003985166549682617, -0.00038629770278930664, -0.00037407875061035156, -0.0003618597984313965, -0.0003496408462524414, -0.00033742189407348633, -0.00032520294189453125, -0.00031298398971557617, -0.0003007650375366211, -0.000288546085357666, -0.00027632713317871094, -0.00026410818099975586, -0.0002518892288208008, -0.0002396702766418457, -0.00022745132446289062, -0.00021523237228393555, -0.00020301342010498047, -0.0001907944679260254, -0.0001785755157470703, -0.00016635656356811523, -0.00015413761138916016, -0.00014191865921020508, -0.00012969970703125, -0.00011748075485229492, -0.00010526180267333984, -9.304285049438477e-05, -8.082389831542969e-05, -6.860494613647461e-05, -5.638599395751953e-05, -4.416704177856445e-05, -3.1948089599609375e-05, -1.9729137420654297e-05, -7.510185241699219e-06, 4.708766937255859e-06, 1.6927719116210938e-05, 2.9146671295166016e-05, 4.1365623474121094e-05, 5.358457565307617e-05, 6.580352783203125e-05, 7.802248001098633e-05, 9.02414321899414e-05, 0.00010246038436889648, 0.00011467933654785156, 0.00012689828872680664, 0.00013911724090576172, 0.0001513361930847168, 0.00016355514526367188, 0.00017577409744262695, 0.00018799304962158203, 0.0002002120018005371, 0.0002124309539794922, 0.00022464990615844727, 0.00023686885833740234, 0.0002490878105163574, 0.0002613067626953125, 0.0002735257148742676, 0.00028574466705322266, 0.00029796361923217773, 0.0003101825714111328]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 5.0, 12.0, 17.0, 15.0, 19.0, 23.0, 38.0, 42.0, 74.0, 94.0, 158.0, 226.0, 374.0, 701.0, 1399.0, 3092.0, 7303.0, 20488.0, 70581.0, 608465.0, 253854.0, 53419.0, 16555.0, 6124.0, 2596.0, 1209.0, 654.0, 333.0, 225.0, 119.0, 87.0, 67.0, 49.0, 23.0, 28.0, 16.0, 11.0, 16.0, 11.0, 7.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9443359375, -0.9137725830078125, -0.883209228515625, -0.8526458740234375, -0.82208251953125, -0.7915191650390625, -0.760955810546875, -0.7303924560546875, -0.6998291015625, -0.6692657470703125, -0.638702392578125, -0.6081390380859375, -0.57757568359375, -0.5470123291015625, -0.516448974609375, -0.4858856201171875, -0.455322265625, -0.4247589111328125, -0.394195556640625, -0.3636322021484375, -0.33306884765625, -0.3025054931640625, -0.271942138671875, -0.2413787841796875, -0.2108154296875, -0.1802520751953125, -0.149688720703125, -0.1191253662109375, -0.08856201171875, -0.0579986572265625, -0.027435302734375, 0.0031280517578125, 0.03369140625, 0.0642547607421875, 0.094818115234375, 0.1253814697265625, 0.15594482421875, 0.1865081787109375, 0.217071533203125, 0.2476348876953125, 0.2781982421875, 0.3087615966796875, 0.339324951171875, 0.3698883056640625, 0.40045166015625, 0.4310150146484375, 0.461578369140625, 0.4921417236328125, 0.522705078125, 0.5532684326171875, 0.583831787109375, 0.6143951416015625, 0.64495849609375, 0.6755218505859375, 0.706085205078125, 0.7366485595703125, 0.7672119140625, 0.7977752685546875, 0.828338623046875, 0.8589019775390625, 0.88946533203125, 0.9200286865234375, 0.950592041015625, 0.9811553955078125, 1.01171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 11.0, 10.0, 11.0, 11.0, 12.0, 30.0, 31.0, 34.0, 47.0, 71.0, 76.0, 100.0, 90.0, 96.0, 71.0, 42.0, 42.0, 46.0, 29.0, 35.0, 23.0, 17.0, 12.0, 12.0, 6.0, 8.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.185546875, -1.1519546508789062, -1.1183624267578125, -1.0847702026367188, -1.051177978515625, -1.0175857543945312, -0.9839935302734375, -0.9504013061523438, -0.91680908203125, -0.8832168579101562, -0.8496246337890625, -0.8160324096679688, -0.782440185546875, -0.7488479614257812, -0.7152557373046875, -0.6816635131835938, -0.6480712890625, -0.6144790649414062, -0.5808868408203125, -0.5472946166992188, -0.513702392578125, -0.48011016845703125, -0.4465179443359375, -0.41292572021484375, -0.37933349609375, -0.34574127197265625, -0.3121490478515625, -0.27855682373046875, -0.244964599609375, -0.21137237548828125, -0.1777801513671875, -0.14418792724609375, -0.110595703125, -0.07700347900390625, -0.0434112548828125, -0.00981903076171875, 0.023773193359375, 0.05736541748046875, 0.0909576416015625, 0.12454986572265625, 0.15814208984375, 0.19173431396484375, 0.2253265380859375, 0.25891876220703125, 0.292510986328125, 0.32610321044921875, 0.3596954345703125, 0.39328765869140625, 0.4268798828125, 0.46047210693359375, 0.4940643310546875, 0.5276565551757812, 0.561248779296875, 0.5948410034179688, 0.6284332275390625, 0.6620254516601562, 0.69561767578125, 0.7292098999023438, 0.7628021240234375, 0.7963943481445312, 0.829986572265625, 0.8635787963867188, 0.8971710205078125, 0.9307632446289062, 0.96435546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 15.0, 41.0, 178.0, 514.0, 154.0, 57.0, 17.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.99948120117188, -63.04973602294922, -61.0999870300293, -59.15024185180664, -57.20049285888672, -55.25074768066406, -53.301002502441406, -51.351253509521484, -49.40150451660156, -47.451759338378906, -45.502010345458984, -43.55226516723633, -41.602516174316406, -39.65277099609375, -37.703025817871094, -35.75327682495117, -33.803531646728516, -31.853784561157227, -29.904037475585938, -27.95429229736328, -26.00454330444336, -24.054798126220703, -22.105051040649414, -20.155303955078125, -18.205556869506836, -16.255809783935547, -14.306062698364258, -12.356316566467285, -10.406569480895996, -8.456822395324707, -6.507076263427734, -4.557329177856445, -2.607585906982422, -0.6578390598297119, 1.291907787322998, 3.241654396057129, 5.191401481628418, 7.141148567199707, 9.09089469909668, 11.040641784667969, 12.990388870239258, 14.940135955810547, 16.889883041381836, 18.839630126953125, 20.78937530517578, 22.739124298095703, 24.68886947631836, 26.63861656188965, 28.588363647460938, 30.538110733032227, 32.487857818603516, 34.43760299682617, 36.387351989746094, 38.33709716796875, 40.286842346191406, 42.23659133911133, 44.18634033203125, 46.136085510253906, 48.08583450317383, 50.035579681396484, 51.985328674316406, 53.93507385253906, 55.88481903076172, 57.83456802368164, 59.7843132019043]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 13.0, 9.0, 9.0, 10.0, 17.0, 10.0, 20.0, 17.0, 28.0, 24.0, 29.0, 33.0, 35.0, 56.0, 89.0, 120.0, 86.0, 63.0, 38.0, 41.0, 32.0, 27.0, 35.0, 19.0, 17.0, 14.0, 21.0, 13.0, 13.0, 11.0, 6.0, 6.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.887174606323242, -22.163089752197266, -21.43900489807129, -20.714920043945312, -19.990835189819336, -19.26675033569336, -18.542665481567383, -17.818580627441406, -17.09449577331543, -16.370410919189453, -15.646326065063477, -14.9222412109375, -14.198156356811523, -13.474071502685547, -12.74998664855957, -12.025901794433594, -11.301816940307617, -10.57773208618164, -9.853647232055664, -9.129562377929688, -8.405477523803711, -7.681392669677734, -6.957307815551758, -6.233222961425781, -5.509138107299805, -4.785053253173828, -4.060968399047852, -3.336883544921875, -2.6127986907958984, -1.8887138366699219, -1.1646289825439453, -0.44054412841796875, 0.2835426330566406, 1.0076274871826172, 1.7317123413085938, 2.4557971954345703, 3.179882049560547, 3.9039669036865234, 4.6280517578125, 5.352136611938477, 6.076221466064453, 6.80030632019043, 7.524391174316406, 8.248476028442383, 8.97256088256836, 9.696645736694336, 10.420730590820312, 11.144815444946289, 11.868900299072266, 12.592985153198242, 13.317070007324219, 14.041154861450195, 14.765239715576172, 15.489324569702148, 16.213409423828125, 16.9374942779541, 17.661579132080078, 18.385663986206055, 19.10974884033203, 19.833833694458008, 20.557918548583984, 21.28200340270996, 22.006088256835938, 22.730173110961914, 23.45425796508789]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 4.0, 9.0, 11.0, 19.0, 30.0, 47.0, 84.0, 82.0, 131.0, 217.0, 399.0, 685.0, 1172.0, 2003.0, 3658.0, 7407.0, 16828.0, 46104.0, 171522.0, 797598.0, 2012025.0, 867140.0, 184788.0, 48724.0, 17356.0, 7593.0, 3738.0, 1972.0, 1126.0, 634.0, 425.0, 232.0, 161.0, 118.0, 74.0, 47.0, 39.0, 24.0, 12.0, 11.0, 8.0, 8.0, 3.0, 4.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.697265625, -2.6168212890625, -2.536376953125, -2.4559326171875, -2.37548828125, -2.2950439453125, -2.214599609375, -2.1341552734375, -2.0537109375, -1.9732666015625, -1.892822265625, -1.8123779296875, -1.73193359375, -1.6514892578125, -1.571044921875, -1.4906005859375, -1.41015625, -1.3297119140625, -1.249267578125, -1.1688232421875, -1.08837890625, -1.0079345703125, -0.927490234375, -0.8470458984375, -0.7666015625, -0.6861572265625, -0.605712890625, -0.5252685546875, -0.44482421875, -0.3643798828125, -0.283935546875, -0.2034912109375, -0.123046875, -0.0426025390625, 0.037841796875, 0.1182861328125, 0.19873046875, 0.2791748046875, 0.359619140625, 0.4400634765625, 0.5205078125, 0.6009521484375, 0.681396484375, 0.7618408203125, 0.84228515625, 0.9227294921875, 1.003173828125, 1.0836181640625, 1.1640625, 1.2445068359375, 1.324951171875, 1.4053955078125, 1.48583984375, 1.5662841796875, 1.646728515625, 1.7271728515625, 1.8076171875, 1.8880615234375, 1.968505859375, 2.0489501953125, 2.12939453125, 2.2098388671875, 2.290283203125, 2.3707275390625, 2.451171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 13.0, 10.0, 11.0, 26.0, 41.0, 33.0, 29.0, 44.0, 29.0, 53.0, 47.0, 47.0, 61.0, 58.0, 62.0, 55.0, 56.0, 50.0, 38.0, 38.0, 40.0, 25.0, 20.0, 21.0, 20.0, 15.0, 12.0, 10.0, 9.0, 5.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.9091796875, -1.8570709228515625, -1.804962158203125, -1.7528533935546875, -1.70074462890625, -1.6486358642578125, -1.596527099609375, -1.5444183349609375, -1.4923095703125, -1.4402008056640625, -1.388092041015625, -1.3359832763671875, -1.28387451171875, -1.2317657470703125, -1.179656982421875, -1.1275482177734375, -1.075439453125, -1.0233306884765625, -0.971221923828125, -0.9191131591796875, -0.86700439453125, -0.8148956298828125, -0.762786865234375, -0.7106781005859375, -0.6585693359375, -0.6064605712890625, -0.554351806640625, -0.5022430419921875, -0.45013427734375, -0.3980255126953125, -0.345916748046875, -0.2938079833984375, -0.24169921875, -0.1895904541015625, -0.137481689453125, -0.0853729248046875, -0.03326416015625, 0.0188446044921875, 0.070953369140625, 0.1230621337890625, 0.1751708984375, 0.2272796630859375, 0.279388427734375, 0.3314971923828125, 0.38360595703125, 0.4357147216796875, 0.487823486328125, 0.5399322509765625, 0.592041015625, 0.6441497802734375, 0.696258544921875, 0.7483673095703125, 0.80047607421875, 0.8525848388671875, 0.904693603515625, 0.9568023681640625, 1.0089111328125, 1.0610198974609375, 1.113128662109375, 1.1652374267578125, 1.21734619140625, 1.2694549560546875, 1.321563720703125, 1.3736724853515625, 1.42578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 14.0, 12.0, 23.0, 35.0, 47.0, 63.0, 125.0, 202.0, 351.0, 691.0, 1666.0, 5860.0, 83728.0, 4016356.0, 76301.0, 5706.0, 1498.0, 703.0, 374.0, 189.0, 124.0, 59.0, 46.0, 23.0, 13.0, 16.0, 16.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.3125, -11.9334716796875, -11.554443359375, -11.1754150390625, -10.79638671875, -10.4173583984375, -10.038330078125, -9.6593017578125, -9.2802734375, -8.9012451171875, -8.522216796875, -8.1431884765625, -7.76416015625, -7.3851318359375, -7.006103515625, -6.6270751953125, -6.248046875, -5.8690185546875, -5.489990234375, -5.1109619140625, -4.73193359375, -4.3529052734375, -3.973876953125, -3.5948486328125, -3.2158203125, -2.8367919921875, -2.457763671875, -2.0787353515625, -1.69970703125, -1.3206787109375, -0.941650390625, -0.5626220703125, -0.18359375, 0.1954345703125, 0.574462890625, 0.9534912109375, 1.33251953125, 1.7115478515625, 2.090576171875, 2.4696044921875, 2.8486328125, 3.2276611328125, 3.606689453125, 3.9857177734375, 4.36474609375, 4.7437744140625, 5.122802734375, 5.5018310546875, 5.880859375, 6.2598876953125, 6.638916015625, 7.0179443359375, 7.39697265625, 7.7760009765625, 8.155029296875, 8.5340576171875, 8.9130859375, 9.2921142578125, 9.671142578125, 10.0501708984375, 10.42919921875, 10.8082275390625, 11.187255859375, 11.5662841796875, 11.9453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 2.0, 5.0, 8.0, 8.0, 17.0, 11.0, 12.0, 14.0, 28.0, 39.0, 49.0, 71.0, 90.0, 99.0, 155.0, 211.0, 294.0, 374.0, 467.0, 468.0, 382.0, 307.0, 259.0, 162.0, 123.0, 112.0, 76.0, 56.0, 47.0, 31.0, 24.0, 22.0, 10.0, 12.0, 7.0, 4.0, 5.0, 4.0, 0.0, 7.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0], "bins": [-5.14453125, -5.005157470703125, -4.86578369140625, -4.726409912109375, -4.5870361328125, -4.447662353515625, -4.30828857421875, -4.168914794921875, -4.029541015625, -3.890167236328125, -3.75079345703125, -3.611419677734375, -3.4720458984375, -3.332672119140625, -3.19329833984375, -3.053924560546875, -2.91455078125, -2.775177001953125, -2.63580322265625, -2.496429443359375, -2.3570556640625, -2.217681884765625, -2.07830810546875, -1.938934326171875, -1.799560546875, -1.660186767578125, -1.52081298828125, -1.381439208984375, -1.2420654296875, -1.102691650390625, -0.96331787109375, -0.823944091796875, -0.6845703125, -0.545196533203125, -0.40582275390625, -0.266448974609375, -0.1270751953125, 0.012298583984375, 0.15167236328125, 0.291046142578125, 0.430419921875, 0.569793701171875, 0.70916748046875, 0.848541259765625, 0.9879150390625, 1.127288818359375, 1.26666259765625, 1.406036376953125, 1.54541015625, 1.684783935546875, 1.82415771484375, 1.963531494140625, 2.1029052734375, 2.242279052734375, 2.38165283203125, 2.521026611328125, 2.660400390625, 2.799774169921875, 2.93914794921875, 3.078521728515625, 3.2178955078125, 3.357269287109375, 3.49664306640625, 3.636016845703125, 3.775390625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 13.0, 11.0, 20.0, 35.0, 73.0, 97.0, 172.0, 181.0, 135.0, 86.0, 82.0, 34.0, 18.0, 13.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.66349792480469, -47.69705581665039, -45.730613708496094, -43.7641716003418, -41.7977294921875, -39.83129119873047, -37.86484909057617, -35.898406982421875, -33.93196487426758, -31.96552276611328, -29.999080657958984, -28.03264045715332, -26.066198348999023, -24.099756240844727, -22.133316040039062, -20.166873931884766, -18.20043182373047, -16.233989715576172, -14.267548561096191, -12.301107406616211, -10.334665298461914, -8.368223190307617, -6.401782035827637, -4.435340881347656, -2.4688987731933594, -0.5024571418762207, 1.463984489440918, 3.4304261207580566, 5.396867752075195, 7.363309860229492, 9.329751014709473, 11.296192169189453, 13.26263427734375, 15.229076385498047, 17.195518493652344, 19.161958694458008, 21.128400802612305, 23.0948429107666, 25.061283111572266, 27.027725219726562, 28.99416732788086, 30.960609436035156, 32.92705154418945, 34.89349365234375, 36.85993194580078, 38.826377868652344, 40.792816162109375, 42.75925827026367, 44.72570037841797, 46.692142486572266, 48.65858459472656, 50.62502670288086, 52.591468811035156, 54.55790710449219, 56.524349212646484, 58.49079132080078, 60.45723342895508, 62.423675537109375, 64.3901138305664, 66.35655975341797, 68.322998046875, 70.28944396972656, 72.2558822631836, 74.22232055664062, 76.18876647949219]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 6.0, 7.0, 7.0, 8.0, 17.0, 14.0, 7.0, 12.0, 27.0, 20.0, 26.0, 22.0, 31.0, 29.0, 34.0, 38.0, 39.0, 35.0, 62.0, 55.0, 51.0, 42.0, 49.0, 49.0, 41.0, 39.0, 22.0, 25.0, 28.0, 19.0, 12.0, 12.0, 24.0, 13.0, 14.0, 12.0, 11.0, 11.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-28.799503326416016, -27.98301124572754, -27.166519165039062, -26.350025177001953, -25.533533096313477, -24.717041015625, -23.900548934936523, -23.084056854248047, -22.267562866210938, -21.45107078552246, -20.634578704833984, -19.818084716796875, -19.0015926361084, -18.185100555419922, -17.368608474731445, -16.55211639404297, -15.735624313354492, -14.919132232666016, -14.102639198303223, -13.286147117614746, -12.469654083251953, -11.653162002563477, -10.836669921875, -10.020177841186523, -9.20368480682373, -8.387192726135254, -7.570699691772461, -6.754207611083984, -5.93771505355835, -5.121222496032715, -4.304730415344238, -3.4882378578186035, -2.6717453002929688, -1.8552528619766235, -1.0387604236602783, -0.22226810455322266, 0.5942244529724121, 1.4107170104980469, 2.2272090911865234, 3.043701648712158, 3.860194206237793, 4.676686763763428, 5.4931793212890625, 6.309671401977539, 7.126163959503174, 7.942656517028809, 8.759148597717285, 9.575641632080078, 10.392133712768555, 11.208625793457031, 12.025118827819824, 12.8416109085083, 13.658103942871094, 14.47459602355957, 15.291088104248047, 16.107580184936523, 16.924072265625, 17.740564346313477, 18.557056427001953, 19.373550415039062, 20.19004249572754, 21.006534576416016, 21.823026657104492, 22.63951873779297, 23.456012725830078]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 1.0, 5.0, 9.0, 11.0, 12.0, 25.0, 41.0, 62.0, 77.0, 136.0, 238.0, 432.0, 808.0, 1620.0, 3252.0, 7767.0, 21137.0, 75852.0, 468300.0, 371642.0, 64858.0, 18951.0, 6973.0, 3012.0, 1442.0, 798.0, 458.0, 266.0, 141.0, 83.0, 50.0, 33.0, 18.0, 14.0, 9.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -3.003631591796875, -2.90960693359375, -2.815582275390625, -2.7215576171875, -2.627532958984375, -2.53350830078125, -2.439483642578125, -2.345458984375, -2.251434326171875, -2.15740966796875, -2.063385009765625, -1.9693603515625, -1.875335693359375, -1.78131103515625, -1.687286376953125, -1.59326171875, -1.499237060546875, -1.40521240234375, -1.311187744140625, -1.2171630859375, -1.123138427734375, -1.02911376953125, -0.935089111328125, -0.841064453125, -0.747039794921875, -0.65301513671875, -0.558990478515625, -0.4649658203125, -0.370941162109375, -0.27691650390625, -0.182891845703125, -0.0888671875, 0.005157470703125, 0.09918212890625, 0.193206787109375, 0.2872314453125, 0.381256103515625, 0.47528076171875, 0.569305419921875, 0.663330078125, 0.757354736328125, 0.85137939453125, 0.945404052734375, 1.0394287109375, 1.133453369140625, 1.22747802734375, 1.321502685546875, 1.41552734375, 1.509552001953125, 1.60357666015625, 1.697601318359375, 1.7916259765625, 1.885650634765625, 1.97967529296875, 2.073699951171875, 2.167724609375, 2.261749267578125, 2.35577392578125, 2.449798583984375, 2.5438232421875, 2.637847900390625, 2.73187255859375, 2.825897216796875, 2.919921875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 4.0, 11.0, 19.0, 17.0, 20.0, 23.0, 24.0, 33.0, 36.0, 39.0, 54.0, 57.0, 80.0, 61.0, 64.0, 56.0, 52.0, 45.0, 57.0, 46.0, 51.0, 34.0, 25.0, 18.0, 19.0, 13.0, 15.0, 10.0, 4.0, 8.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.88671875, -2.80706787109375, -2.7274169921875, -2.64776611328125, -2.568115234375, -2.48846435546875, -2.4088134765625, -2.32916259765625, -2.24951171875, -2.16986083984375, -2.0902099609375, -2.01055908203125, -1.930908203125, -1.85125732421875, -1.7716064453125, -1.69195556640625, -1.6123046875, -1.53265380859375, -1.4530029296875, -1.37335205078125, -1.293701171875, -1.21405029296875, -1.1343994140625, -1.05474853515625, -0.97509765625, -0.89544677734375, -0.8157958984375, -0.73614501953125, -0.656494140625, -0.57684326171875, -0.4971923828125, -0.41754150390625, -0.337890625, -0.25823974609375, -0.1785888671875, -0.09893798828125, -0.019287109375, 0.06036376953125, 0.1400146484375, 0.21966552734375, 0.29931640625, 0.37896728515625, 0.4586181640625, 0.53826904296875, 0.617919921875, 0.69757080078125, 0.7772216796875, 0.85687255859375, 0.9365234375, 1.01617431640625, 1.0958251953125, 1.17547607421875, 1.255126953125, 1.33477783203125, 1.4144287109375, 1.49407958984375, 1.57373046875, 1.65338134765625, 1.7330322265625, 1.81268310546875, 1.892333984375, 1.97198486328125, 2.0516357421875, 2.13128662109375, 2.2109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 11.0, 21.0, 21.0, 40.0, 53.0, 92.0, 158.0, 324.0, 629.0, 1895.0, 8934.0, 122411.0, 884785.0, 23676.0, 3475.0, 974.0, 392.0, 239.0, 137.0, 78.0, 55.0, 33.0, 24.0, 17.0, 15.0, 12.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.37091064453125, -5.1988525390625, -5.02679443359375, -4.854736328125, -4.68267822265625, -4.5106201171875, -4.33856201171875, -4.16650390625, -3.99444580078125, -3.8223876953125, -3.65032958984375, -3.478271484375, -3.30621337890625, -3.1341552734375, -2.96209716796875, -2.7900390625, -2.61798095703125, -2.4459228515625, -2.27386474609375, -2.101806640625, -1.92974853515625, -1.7576904296875, -1.58563232421875, -1.41357421875, -1.24151611328125, -1.0694580078125, -0.89739990234375, -0.725341796875, -0.55328369140625, -0.3812255859375, -0.20916748046875, -0.037109375, 0.13494873046875, 0.3070068359375, 0.47906494140625, 0.651123046875, 0.82318115234375, 0.9952392578125, 1.16729736328125, 1.33935546875, 1.51141357421875, 1.6834716796875, 1.85552978515625, 2.027587890625, 2.19964599609375, 2.3717041015625, 2.54376220703125, 2.7158203125, 2.88787841796875, 3.0599365234375, 3.23199462890625, 3.404052734375, 3.57611083984375, 3.7481689453125, 3.92022705078125, 4.09228515625, 4.26434326171875, 4.4364013671875, 4.60845947265625, 4.780517578125, 4.95257568359375, 5.1246337890625, 5.29669189453125, 5.46875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 6.0, 5.0, 6.0, 6.0, 7.0, 13.0, 11.0, 13.0, 19.0, 13.0, 21.0, 19.0, 27.0, 43.0, 32.0, 46.0, 50.0, 59.0, 68.0, 67.0, 77.0, 48.0, 34.0, 38.0, 36.0, 35.0, 20.0, 20.0, 29.0, 18.0, 29.0, 10.0, 15.0, 13.0, 9.0, 6.0, 0.0, 3.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.243408203125, -6.02197265625, -5.800537109375, -5.5791015625, -5.357666015625, -5.13623046875, -4.914794921875, -4.693359375, -4.471923828125, -4.25048828125, -4.029052734375, -3.8076171875, -3.586181640625, -3.36474609375, -3.143310546875, -2.921875, -2.700439453125, -2.47900390625, -2.257568359375, -2.0361328125, -1.814697265625, -1.59326171875, -1.371826171875, -1.150390625, -0.928955078125, -0.70751953125, -0.486083984375, -0.2646484375, -0.043212890625, 0.17822265625, 0.399658203125, 0.62109375, 0.842529296875, 1.06396484375, 1.285400390625, 1.5068359375, 1.728271484375, 1.94970703125, 2.171142578125, 2.392578125, 2.614013671875, 2.83544921875, 3.056884765625, 3.2783203125, 3.499755859375, 3.72119140625, 3.942626953125, 4.1640625, 4.385498046875, 4.60693359375, 4.828369140625, 5.0498046875, 5.271240234375, 5.49267578125, 5.714111328125, 5.935546875, 6.156982421875, 6.37841796875, 6.599853515625, 6.8212890625, 7.042724609375, 7.26416015625, 7.485595703125, 7.70703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 2.0, 4.0, 12.0, 11.0, 9.0, 14.0, 15.0, 26.0, 49.0, 71.0, 89.0, 162.0, 236.0, 449.0, 782.0, 1633.0, 3494.0, 9140.0, 30813.0, 227550.0, 720176.0, 35809.0, 10479.0, 3780.0, 1715.0, 808.0, 457.0, 248.0, 154.0, 103.0, 79.0, 53.0, 26.0, 31.0, 9.0, 15.0, 8.0, 10.0, 7.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6806640625, -0.6587448120117188, -0.6368255615234375, -0.6149063110351562, -0.592987060546875, -0.5710678100585938, -0.5491485595703125, -0.5272293090820312, -0.50531005859375, -0.48339080810546875, -0.4614715576171875, -0.43955230712890625, -0.417633056640625, -0.39571380615234375, -0.3737945556640625, -0.35187530517578125, -0.3299560546875, -0.30803680419921875, -0.2861175537109375, -0.26419830322265625, -0.242279052734375, -0.22035980224609375, -0.1984405517578125, -0.17652130126953125, -0.15460205078125, -0.13268280029296875, -0.1107635498046875, -0.08884429931640625, -0.066925048828125, -0.04500579833984375, -0.0230865478515625, -0.00116729736328125, 0.020751953125, 0.04267120361328125, 0.0645904541015625, 0.08650970458984375, 0.108428955078125, 0.13034820556640625, 0.1522674560546875, 0.17418670654296875, 0.19610595703125, 0.21802520751953125, 0.2399444580078125, 0.26186370849609375, 0.283782958984375, 0.30570220947265625, 0.3276214599609375, 0.34954071044921875, 0.3714599609375, 0.39337921142578125, 0.4152984619140625, 0.43721771240234375, 0.459136962890625, 0.48105621337890625, 0.5029754638671875, 0.5248947143554688, 0.54681396484375, 0.5687332153320312, 0.5906524658203125, 0.6125717163085938, 0.634490966796875, 0.6564102172851562, 0.6783294677734375, 0.7002487182617188, 0.72216796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 2.0, 6.0, 6.0, 8.0, 16.0, 22.0, 24.0, 45.0, 53.0, 111.0, 183.0, 207.0, 127.0, 66.0, 43.0, 26.0, 14.0, 10.0, 15.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0004978179931640625, -0.00048679113388061523, -0.00047576427459716797, -0.0004647374153137207, -0.00045371055603027344, -0.00044268369674682617, -0.0004316568374633789, -0.00042062997817993164, -0.0004096031188964844, -0.0003985762596130371, -0.00038754940032958984, -0.0003765225410461426, -0.0003654956817626953, -0.00035446882247924805, -0.0003434419631958008, -0.0003324151039123535, -0.00032138824462890625, -0.000310361385345459, -0.0002993345260620117, -0.00028830766677856445, -0.0002772808074951172, -0.0002662539482116699, -0.00025522708892822266, -0.0002442002296447754, -0.00023317337036132812, -0.00022214651107788086, -0.0002111196517944336, -0.00020009279251098633, -0.00018906593322753906, -0.0001780390739440918, -0.00016701221466064453, -0.00015598535537719727, -0.00014495849609375, -0.00013393163681030273, -0.00012290477752685547, -0.0001118779182434082, -0.00010085105895996094, -8.982419967651367e-05, -7.87973403930664e-05, -6.777048110961914e-05, -5.6743621826171875e-05, -4.571676254272461e-05, -3.4689903259277344e-05, -2.3663043975830078e-05, -1.2636184692382812e-05, -1.6093254089355469e-06, 9.417533874511719e-06, 2.0444393157958984e-05, 3.147125244140625e-05, 4.2498111724853516e-05, 5.352497100830078e-05, 6.455183029174805e-05, 7.557868957519531e-05, 8.660554885864258e-05, 9.763240814208984e-05, 0.00010865926742553711, 0.00011968612670898438, 0.00013071298599243164, 0.0001417398452758789, 0.00015276670455932617, 0.00016379356384277344, 0.0001748204231262207, 0.00018584728240966797, 0.00019687414169311523, 0.0002079010009765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 10.0, 6.0, 14.0, 16.0, 37.0, 49.0, 81.0, 113.0, 209.0, 411.0, 891.0, 2315.0, 6673.0, 24580.0, 182568.0, 777830.0, 38078.0, 9403.0, 2980.0, 1129.0, 490.0, 275.0, 143.0, 79.0, 43.0, 40.0, 29.0, 14.0, 11.0, 9.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8939208984375, -0.866943359375, -0.8399658203125, -0.81298828125, -0.7860107421875, -0.759033203125, -0.7320556640625, -0.705078125, -0.6781005859375, -0.651123046875, -0.6241455078125, -0.59716796875, -0.5701904296875, -0.543212890625, -0.5162353515625, -0.4892578125, -0.4622802734375, -0.435302734375, -0.4083251953125, -0.38134765625, -0.3543701171875, -0.327392578125, -0.3004150390625, -0.2734375, -0.2464599609375, -0.219482421875, -0.1925048828125, -0.16552734375, -0.1385498046875, -0.111572265625, -0.0845947265625, -0.0576171875, -0.0306396484375, -0.003662109375, 0.0233154296875, 0.05029296875, 0.0772705078125, 0.104248046875, 0.1312255859375, 0.158203125, 0.1851806640625, 0.212158203125, 0.2391357421875, 0.26611328125, 0.2930908203125, 0.320068359375, 0.3470458984375, 0.3740234375, 0.4010009765625, 0.427978515625, 0.4549560546875, 0.48193359375, 0.5089111328125, 0.535888671875, 0.5628662109375, 0.58984375, 0.6168212890625, 0.643798828125, 0.6707763671875, 0.69775390625, 0.7247314453125, 0.751708984375, 0.7786865234375, 0.8056640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 10.0, 5.0, 12.0, 8.0, 14.0, 13.0, 22.0, 15.0, 23.0, 32.0, 50.0, 51.0, 73.0, 67.0, 98.0, 83.0, 84.0, 72.0, 49.0, 40.0, 28.0, 23.0, 22.0, 11.0, 13.0, 8.0, 6.0, 7.0, 11.0, 8.0, 1.0, 9.0, 1.0, 3.0, 9.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.63330078125, -0.614166259765625, -0.59503173828125, -0.575897216796875, -0.5567626953125, -0.537628173828125, -0.51849365234375, -0.499359130859375, -0.480224609375, -0.461090087890625, -0.44195556640625, -0.422821044921875, -0.4036865234375, -0.384552001953125, -0.36541748046875, -0.346282958984375, -0.3271484375, -0.308013916015625, -0.28887939453125, -0.269744873046875, -0.2506103515625, -0.231475830078125, -0.21234130859375, -0.193206787109375, -0.174072265625, -0.154937744140625, -0.13580322265625, -0.116668701171875, -0.0975341796875, -0.078399658203125, -0.05926513671875, -0.040130615234375, -0.02099609375, -0.001861572265625, 0.01727294921875, 0.036407470703125, 0.0555419921875, 0.074676513671875, 0.09381103515625, 0.112945556640625, 0.132080078125, 0.151214599609375, 0.17034912109375, 0.189483642578125, 0.2086181640625, 0.227752685546875, 0.24688720703125, 0.266021728515625, 0.28515625, 0.304290771484375, 0.32342529296875, 0.342559814453125, 0.3616943359375, 0.380828857421875, 0.39996337890625, 0.419097900390625, 0.438232421875, 0.457366943359375, 0.47650146484375, 0.495635986328125, 0.5147705078125, 0.533905029296875, 0.55303955078125, 0.572174072265625, 0.59130859375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 41.0, 160.0, 610.0, 128.0, 27.0, 15.0, 8.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.25986099243164, -33.897499084472656, -31.53513526916504, -29.172771453857422, -26.810409545898438, -24.448047637939453, -22.085683822631836, -19.72332000732422, -17.360958099365234, -14.998595237731934, -12.636232376098633, -10.273869514465332, -7.911506652832031, -5.5491437911987305, -3.1867809295654297, -0.8244171142578125, 1.5379447937011719, 3.9003076553344727, 6.262670516967773, 8.625033378601074, 10.987396240234375, 13.349759101867676, 15.712121963500977, 18.074485778808594, 20.436847686767578, 22.799209594726562, 25.16157341003418, 27.523937225341797, 29.88629913330078, 32.248661041259766, 34.61102294921875, 36.973388671875, 39.33574676513672, 41.6981086730957, 44.06047058105469, 46.42283630371094, 48.78519821166992, 51.147560119628906, 53.509925842285156, 55.87228775024414, 58.234649658203125, 60.59701156616211, 62.959373474121094, 65.32173919677734, 67.68409729003906, 70.04646301269531, 72.40882873535156, 74.77119445800781, 77.13355255126953, 79.49591827392578, 81.8582763671875, 84.22064208984375, 86.5830078125, 88.94536590576172, 91.30773162841797, 93.67008972167969, 96.03245544433594, 98.39482116699219, 100.7571792602539, 103.11954498291016, 105.48190307617188, 107.84426879882812, 110.20663452148438, 112.56900024414062, 114.93135833740234]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 2.0, 5.0, 4.0, 10.0, 13.0, 10.0, 11.0, 9.0, 19.0, 16.0, 19.0, 21.0, 59.0, 99.0, 117.0, 121.0, 130.0, 104.0, 43.0, 24.0, 30.0, 20.0, 14.0, 14.0, 16.0, 16.0, 14.0, 9.0, 4.0, 4.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.4764461517334, -29.70205307006836, -28.927658081054688, -28.15326499938965, -27.37887191772461, -26.604476928710938, -25.8300838470459, -25.05569076538086, -24.281295776367188, -23.50690269470215, -22.732507705688477, -21.958114624023438, -21.183719635009766, -20.409326553344727, -19.634933471679688, -18.860538482666016, -18.086145401000977, -17.311752319335938, -16.537357330322266, -15.762964248657227, -14.988570213317871, -14.214176177978516, -13.439783096313477, -12.665389060974121, -11.890995025634766, -11.11660099029541, -10.342206954956055, -9.567813873291016, -8.79341983795166, -8.019025802612305, -7.244632244110107, -6.47023868560791, -5.695844650268555, -4.921450614929199, -4.147057056427002, -3.3726632595062256, -2.598269462585449, -1.8238756656646729, -1.0494818687438965, -0.2750883102416992, 0.49930572509765625, 1.2736995220184326, 2.048093318939209, 2.8224871158599854, 3.5968809127807617, 4.371274948120117, 5.1456685066223145, 5.920062065124512, 6.694456100463867, 7.468850135803223, 8.243244171142578, 9.017637252807617, 9.792031288146973, 10.566425323486328, 11.340818405151367, 12.115212440490723, 12.889606475830078, 13.664000511169434, 14.438394546508789, 15.212787628173828, 15.987181663513184, 16.76157569885254, 17.535968780517578, 18.31036376953125, 19.08475685119629]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 2.0, 6.0, 5.0, 9.0, 10.0, 10.0, 19.0, 13.0, 19.0, 26.0, 36.0, 32.0, 29.0, 36.0, 56.0, 147.0, 172.0, 70.0, 45.0, 30.0, 34.0, 25.0, 27.0, 19.0, 19.0, 19.0, 7.0, 8.0, 10.0, 11.0, 7.0, 14.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.0797882080078125, -2.018951416015625, -1.9581146240234375, -1.89727783203125, -1.8364410400390625, -1.775604248046875, -1.7147674560546875, -1.6539306640625, -1.5930938720703125, -1.532257080078125, -1.4714202880859375, -1.41058349609375, -1.3497467041015625, -1.288909912109375, -1.2280731201171875, -1.167236328125, -1.1063995361328125, -1.045562744140625, -0.9847259521484375, -0.92388916015625, -0.8630523681640625, -0.802215576171875, -0.7413787841796875, -0.6805419921875, -0.6197052001953125, -0.558868408203125, -0.4980316162109375, -0.43719482421875, -0.3763580322265625, -0.315521240234375, -0.2546844482421875, -0.19384765625, -0.1330108642578125, -0.072174072265625, -0.0113372802734375, 0.04949951171875, 0.1103363037109375, 0.171173095703125, 0.2320098876953125, 0.2928466796875, 0.3536834716796875, 0.414520263671875, 0.4753570556640625, 0.53619384765625, 0.5970306396484375, 0.657867431640625, 0.7187042236328125, 0.779541015625, 0.8403778076171875, 0.901214599609375, 0.9620513916015625, 1.02288818359375, 1.0837249755859375, 1.144561767578125, 1.2053985595703125, 1.2662353515625, 1.3270721435546875, 1.387908935546875, 1.4487457275390625, 1.50958251953125, 1.5704193115234375, 1.631256103515625, 1.6920928955078125, 1.7529296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 12.0, 19.0, 12.0, 17.0, 31.0, 55.0, 77.0, 186.0, 460.0, 1801.0, 10799.0, 8350531.0, 20949.0, 2492.0, 604.0, 249.0, 126.0, 54.0, 36.0, 15.0, 15.0, 9.0, 3.0, 9.0, 4.0, 8.0, 7.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.393695831298828, -24.680822372436523, -23.967947006225586, -23.25507354736328, -22.542198181152344, -21.82932472229004, -21.116451263427734, -20.403575897216797, -19.69070053100586, -18.977827072143555, -18.264951705932617, -17.552078247070312, -16.839202880859375, -16.12632942199707, -15.41345500946045, -14.700580596923828, -13.987707138061523, -13.274832725524902, -12.561958312988281, -11.849084854125977, -11.136209487915039, -10.423336029052734, -9.710461616516113, -8.997587203979492, -8.284712791442871, -7.57183837890625, -6.858963966369629, -6.146090030670166, -5.433215618133545, -4.720341205596924, -4.007467269897461, -3.29459285736084, -2.5817203521728516, -1.86884605884552, -1.1559717655181885, -0.4430975914001465, 0.2697768211364746, 0.9826512336730957, 1.6955251693725586, 2.4083995819091797, 3.121273994445801, 3.834148406982422, 4.547022819519043, 5.259896755218506, 5.972771167755127, 6.685645580291748, 7.398519515991211, 8.111393928527832, 8.824268341064453, 9.537142753601074, 10.250017166137695, 10.962890625, 11.675765991210938, 12.388639450073242, 13.101513862609863, 13.814388275146484, 14.527262687683105, 15.240137100219727, 15.953011512756348, 16.66588592529297, 17.378759384155273, 18.09163475036621, 18.804508209228516, 19.517383575439453, 20.230257034301758]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 4.0, 6.0, 4.0, 3.0, 8.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.543664932250977, -19.843019485473633, -19.14237403869629, -18.441728591918945, -17.74108123779297, -17.040435791015625, -16.33979034423828, -15.639144897460938, -14.938499450683594, -14.23785400390625, -13.537208557128906, -12.836562156677246, -12.135916709899902, -11.435271263122559, -10.734624862670898, -10.033979415893555, -9.333333969116211, -8.632688522338867, -7.932042598724365, -7.231396675109863, -6.5307512283325195, -5.830105781555176, -5.129459857940674, -4.428813934326172, -3.728168487548828, -3.0275228023529053, -2.3268771171569824, -1.6262314319610596, -0.9255857467651367, -0.22494006156921387, 0.475705623626709, 1.176351547241211, 1.8769950866699219, 2.5776407718658447, 3.2782864570617676, 3.9789321422576904, 4.679577827453613, 5.380223274230957, 6.080869197845459, 6.781515121459961, 7.482160568237305, 8.182806015014648, 8.883451461791992, 9.584097862243652, 10.284743309020996, 10.98538875579834, 11.68603515625, 12.386680603027344, 13.087326049804688, 13.787971496582031, 14.488616943359375, 15.189263343811035, 15.889908790588379, 16.59055519104004, 17.291200637817383, 17.991846084594727, 18.69249153137207, 19.393136978149414, 20.093782424926758, 20.7944278717041, 21.495075225830078, 22.195720672607422, 22.896366119384766, 23.59701156616211, 24.297657012939453]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 11.0, 10.0, 14.0, 18.0, 21.0, 38.0, 48.0, 60.0, 74.0, 97.0, 94.0, 103.0, 105.0, 77.0, 48.0, 45.0, 40.0, 33.0, 17.0, 13.0, 10.0, 12.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6875, -2.6275482177734375, -2.567596435546875, -2.5076446533203125, -2.44769287109375, -2.3877410888671875, -2.327789306640625, -2.2678375244140625, -2.2078857421875, -2.1479339599609375, -2.087982177734375, -2.0280303955078125, -1.96807861328125, -1.9081268310546875, -1.848175048828125, -1.7882232666015625, -1.728271484375, -1.6683197021484375, -1.608367919921875, -1.5484161376953125, -1.48846435546875, -1.4285125732421875, -1.368560791015625, -1.3086090087890625, -1.2486572265625, -1.1887054443359375, -1.128753662109375, -1.0688018798828125, -1.00885009765625, -0.9488983154296875, -0.888946533203125, -0.8289947509765625, -0.76904296875, -0.7090911865234375, -0.649139404296875, -0.5891876220703125, -0.52923583984375, -0.4692840576171875, -0.409332275390625, -0.3493804931640625, -0.2894287109375, -0.2294769287109375, -0.169525146484375, -0.1095733642578125, -0.04962158203125, 0.0103302001953125, 0.070281982421875, 0.1302337646484375, 0.190185546875, 0.2501373291015625, 0.310089111328125, 0.3700408935546875, 0.42999267578125, 0.4899444580078125, 0.549896240234375, 0.6098480224609375, 0.6697998046875, 0.7297515869140625, 0.789703369140625, 0.8496551513671875, 0.90960693359375, 0.9695587158203125, 1.029510498046875, 1.0894622802734375, 1.1494140625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 16.0, 35.0, 49.0, 90.0, 165.0, 345.0, 819.0, 1860.0, 5178.0, 15842.0, 53175.0, 166750.0, 187882.0, 63597.0, 18823.0, 6006.0, 2048.0, 825.0, 360.0, 167.0, 96.0, 49.0, 26.0, 18.0, 11.0, 13.0, 9.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.64453125, -9.1640625, -8.68359375, -8.203125, -7.72265625, -7.2421875, -6.76171875, -6.28125, -5.80078125, -5.3203125, -4.83984375, -4.359375, -3.87890625, -3.3984375, -2.91796875, -2.4375, -1.95703125, -1.4765625, -0.99609375, -0.515625, -0.03515625, 0.4453125, 0.92578125, 1.40625, 1.88671875, 2.3671875, 2.84765625, 3.328125, 3.80859375, 4.2890625, 4.76953125, 5.25, 5.73046875, 6.2109375, 6.69140625, 7.171875, 7.65234375, 8.1328125, 8.61328125, 9.09375, 9.57421875, 10.0546875, 10.53515625, 11.015625, 11.49609375, 11.9765625, 12.45703125, 12.9375, 13.41796875, 13.8984375, 14.37890625, 14.859375, 15.33984375, 15.8203125, 16.30078125, 16.78125, 17.26171875, 17.7421875, 18.22265625, 18.703125, 19.18359375, 19.6640625, 20.14453125, 20.625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 13.0, 16.0, 8.0, 10.0, 21.0, 25.0, 18.0, 20.0, 22.0, 25.0, 38.0, 37.0, 49.0, 56.0, 50.0, 50.0, 52.0, 48.0, 59.0, 46.0, 51.0, 35.0, 36.0, 28.0, 30.0, 23.0, 17.0, 14.0, 11.0, 11.0, 15.0, 12.0, 5.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-1.9775390625, -1.9232025146484375, -1.868865966796875, -1.8145294189453125, -1.76019287109375, -1.7058563232421875, -1.651519775390625, -1.5971832275390625, -1.5428466796875, -1.4885101318359375, -1.434173583984375, -1.3798370361328125, -1.32550048828125, -1.2711639404296875, -1.216827392578125, -1.1624908447265625, -1.108154296875, -1.0538177490234375, -0.999481201171875, -0.9451446533203125, -0.89080810546875, -0.8364715576171875, -0.782135009765625, -0.7277984619140625, -0.6734619140625, -0.6191253662109375, -0.564788818359375, -0.5104522705078125, -0.45611572265625, -0.4017791748046875, -0.347442626953125, -0.2931060791015625, -0.23876953125, -0.1844329833984375, -0.130096435546875, -0.0757598876953125, -0.02142333984375, 0.0329132080078125, 0.087249755859375, 0.1415863037109375, 0.1959228515625, 0.2502593994140625, 0.304595947265625, 0.3589324951171875, 0.41326904296875, 0.4676055908203125, 0.521942138671875, 0.5762786865234375, 0.630615234375, 0.6849517822265625, 0.739288330078125, 0.7936248779296875, 0.84796142578125, 0.9022979736328125, 0.956634521484375, 1.0109710693359375, 1.0653076171875, 1.1196441650390625, 1.173980712890625, 1.2283172607421875, 1.28265380859375, 1.3369903564453125, 1.391326904296875, 1.4456634521484375, 1.5]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 7.0, 12.0, 22.0, 77.0, 130.0, 116.0, 66.0, 21.0, 9.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.89421463012695, -35.0106086730957, -34.12700653076172, -33.24340057373047, -32.359798431396484, -31.476192474365234, -30.59259033203125, -29.708984375, -28.825380325317383, -27.941776275634766, -27.05817222595215, -26.17456817626953, -25.290964126586914, -24.407360076904297, -23.523754119873047, -22.64015007019043, -21.756546020507812, -20.872941970825195, -19.989337921142578, -19.10573387145996, -18.222129821777344, -17.338523864746094, -16.45492172241211, -15.57131576538086, -14.687713623046875, -13.804109573364258, -12.92050552368164, -12.036901473999023, -11.15329647064209, -10.269692420959473, -9.386088371276855, -8.502483367919922, -7.618879318237305, -6.7352752685546875, -5.851670742034912, -4.968066692352295, -4.0844621658325195, -3.2008581161499023, -2.317254066467285, -1.4336495399475098, -0.5500454902648926, 0.33355873823165894, 1.2171629667282104, 2.100767135620117, 2.9843714237213135, 3.8679757118225098, 4.751579761505127, 5.635184288024902, 6.5187883377075195, 7.402392387390137, 8.285996437072754, 9.169601440429688, 10.053205490112305, 10.936809539794922, 11.820413589477539, 12.704017639160156, 13.587621688842773, 14.47122573852539, 15.354829788208008, 16.238433837890625, 17.122037887573242, 18.00564193725586, 18.88924789428711, 19.772851943969727, 20.656455993652344]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 6.0, 6.0, 10.0, 12.0, 21.0, 44.0, 94.0, 96.0, 79.0, 37.0, 20.0, 7.0, 8.0, 9.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.67731285095215, -16.225927352905273, -15.774540901184082, -15.32315444946289, -14.8717679977417, -14.420382499694824, -13.968996047973633, -13.517610549926758, -13.066224098205566, -12.614837646484375, -12.1634521484375, -11.712065696716309, -11.260679244995117, -10.809293746948242, -10.35790729522705, -9.90652084350586, -9.455135345458984, -9.003748893737793, -8.552363395690918, -8.100976943969727, -7.649590969085693, -7.19820499420166, -6.746818542480469, -6.2954325675964355, -5.844045639038086, -5.392659664154053, -4.941273212432861, -4.489887237548828, -4.038501262664795, -3.5871150493621826, -3.1357288360595703, -2.684342861175537, -2.232956886291504, -1.7815707921981812, -1.3301846981048584, -0.8787984848022461, -0.42741239070892334, 0.023973703384399414, 0.4753599166870117, 0.9267458915710449, 1.3781321048736572, 1.82951819896698, 2.2809042930603027, 2.732290506362915, 3.1836767196655273, 3.6350626945495605, 4.086448669433594, 4.537835121154785, 4.989221096038818, 5.440607070922852, 5.891993522644043, 6.343379497528076, 6.794765472412109, 7.246151924133301, 7.697537899017334, 8.148923873901367, 8.600310325622559, 9.05169677734375, 9.503082275390625, 9.954468727111816, 10.405855178833008, 10.857240676879883, 11.308627128601074, 11.760013580322266, 12.21139907836914]}, "eval/loss": 4.240406036376953, "eval/wer": 1.8401428004760016, "eval/runtime": 1267.491, "eval/samples_per_second": 2.084, "eval/steps_per_second": 0.261} \ No newline at end of file