diff --git "a/wandb/run-20220228_144113-18osrjm3/files/wandb-summary.json" "b/wandb/run-20220228_144113-18osrjm3/files/wandb-summary.json" --- "a/wandb/run-20220228_144113-18osrjm3/files/wandb-summary.json" +++ "b/wandb/run-20220228_144113-18osrjm3/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3145, "train/learning_rate": 8.860000000000002e-06, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6620, "_timestamp": 1646065893, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 10.0, 27.0, 95.0, 154.0, 264.0, 230.0, 141.0, 62.0, 23.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.178123474121094, -22.747371673583984, -21.316619873046875, -19.885866165161133, -18.455114364624023, -17.024362564086914, -15.593609809875488, -14.162857055664062, -12.732105255126953, -11.301353454589844, -9.870600700378418, -8.439847946166992, -7.009096145629883, -5.578343868255615, -4.147591590881348, -2.716838836669922, -1.2860870361328125, 0.14466524124145508, 1.5754175186157227, 3.0061697959899902, 4.436922073364258, 5.867674350738525, 7.298426628112793, 8.729179382324219, 10.159931182861328, 11.590682983398438, 13.021435737609863, 14.452188491821289, 15.882940292358398, 17.313692092895508, 18.74444580078125, 20.17519760131836, 21.60594940185547, 23.036701202392578, 24.467453002929688, 25.89820671081543, 27.32895851135254, 28.75971031188965, 30.19046401977539, 31.6212158203125, 33.05196762084961, 34.48271942138672, 35.91347122192383, 37.34422302246094, 38.77497863769531, 40.20573043823242, 41.63648223876953, 43.06723403930664, 44.49798583984375, 45.92873764038086, 47.35948944091797, 48.79024124145508, 50.22099304199219, 51.65174865722656, 53.08250045776367, 54.51325225830078, 55.94400405883789, 57.374755859375, 58.80550765991211, 60.23625946044922, 61.667015075683594, 63.0977668762207, 64.52851867675781, 65.95927429199219, 67.39002227783203]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 11.0, 9.0, 15.0, 9.0, 9.0, 15.0, 24.0, 25.0, 24.0, 23.0, 30.0, 33.0, 34.0, 32.0, 38.0, 43.0, 44.0, 45.0, 47.0, 46.0, 42.0, 28.0, 37.0, 36.0, 36.0, 41.0, 22.0, 29.0, 35.0, 17.0, 22.0, 13.0, 11.0, 8.0, 15.0, 13.0, 9.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.37661361694336, -28.406328201293945, -27.4360408782959, -26.465755462646484, -25.495468139648438, -24.525182723999023, -23.55489730834961, -22.584609985351562, -21.61432456970215, -20.644039154052734, -19.673751831054688, -18.703466415405273, -17.733179092407227, -16.762893676757812, -15.792607307434082, -14.822320938110352, -13.852034568786621, -12.88174819946289, -11.91146183013916, -10.94117546081543, -9.970890045166016, -9.000603675842285, -8.030317306518555, -7.060031414031982, -6.089745044708252, -5.1194586753845215, -4.149172782897949, -3.1788864135742188, -2.2086002826690674, -1.238314151763916, -0.26802778244018555, 0.7022581100463867, 1.6725444793701172, 2.6428306102752686, 3.61311674118042, 4.58340311050415, 5.553689002990723, 6.523975372314453, 7.494261741638184, 8.464548110961914, 9.434833526611328, 10.405119895935059, 11.375406265258789, 12.345691680908203, 13.315978050231934, 14.286264419555664, 15.256550788879395, 16.226837158203125, 17.197124481201172, 18.167409896850586, 19.137697219848633, 20.107982635498047, 21.078269958496094, 22.048555374145508, 23.018840789794922, 23.98912811279297, 24.959413528442383, 25.929698944091797, 26.899986267089844, 27.870271682739258, 28.840559005737305, 29.81084442138672, 30.781131744384766, 31.75141716003418, 32.721702575683594]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 4.0, 9.0, 12.0, 10.0, 13.0, 14.0, 17.0, 11.0, 19.0, 31.0, 29.0, 29.0, 22.0, 29.0, 39.0, 46.0, 42.0, 38.0, 38.0, 37.0, 37.0, 39.0, 36.0, 41.0, 42.0, 46.0, 37.0, 34.0, 30.0, 27.0, 22.0, 20.0, 13.0, 18.0, 17.0, 10.0, 8.0, 5.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.94140625, -1.8817291259765625, -1.822052001953125, -1.7623748779296875, -1.70269775390625, -1.6430206298828125, -1.583343505859375, -1.5236663818359375, -1.4639892578125, -1.4043121337890625, -1.344635009765625, -1.2849578857421875, -1.22528076171875, -1.1656036376953125, -1.105926513671875, -1.0462493896484375, -0.986572265625, -0.9268951416015625, -0.867218017578125, -0.8075408935546875, -0.74786376953125, -0.6881866455078125, -0.628509521484375, -0.5688323974609375, -0.5091552734375, -0.4494781494140625, -0.389801025390625, -0.3301239013671875, -0.27044677734375, -0.2107696533203125, -0.151092529296875, -0.0914154052734375, -0.03173828125, 0.0279388427734375, 0.087615966796875, 0.1472930908203125, 0.20697021484375, 0.2666473388671875, 0.326324462890625, 0.3860015869140625, 0.4456787109375, 0.5053558349609375, 0.565032958984375, 0.6247100830078125, 0.68438720703125, 0.7440643310546875, 0.803741455078125, 0.8634185791015625, 0.923095703125, 0.9827728271484375, 1.042449951171875, 1.1021270751953125, 1.16180419921875, 1.2214813232421875, 1.281158447265625, 1.3408355712890625, 1.4005126953125, 1.4601898193359375, 1.519866943359375, 1.5795440673828125, 1.63922119140625, 1.6988983154296875, 1.758575439453125, 1.8182525634765625, 1.8779296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 13.0, 2.0, 18.0, 18.0, 21.0, 22.0, 39.0, 57.0, 112.0, 150.0, 185.0, 247.0, 378.0, 716.0, 1142.0, 2033.0, 3863.0, 9314.0, 30312.0, 185619.0, 1951480.0, 1788085.0, 174110.0, 28857.0, 8971.0, 3909.0, 1823.0, 1020.0, 612.0, 397.0, 256.0, 174.0, 100.0, 83.0, 48.0, 25.0, 24.0, 19.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8994140625, -5.708984375, -5.5185546875, -5.328125, -5.1376953125, -4.947265625, -4.7568359375, -4.56640625, -4.3759765625, -4.185546875, -3.9951171875, -3.8046875, -3.6142578125, -3.423828125, -3.2333984375, -3.04296875, -2.8525390625, -2.662109375, -2.4716796875, -2.28125, -2.0908203125, -1.900390625, -1.7099609375, -1.51953125, -1.3291015625, -1.138671875, -0.9482421875, -0.7578125, -0.5673828125, -0.376953125, -0.1865234375, 0.00390625, 0.1943359375, 0.384765625, 0.5751953125, 0.765625, 0.9560546875, 1.146484375, 1.3369140625, 1.52734375, 1.7177734375, 1.908203125, 2.0986328125, 2.2890625, 2.4794921875, 2.669921875, 2.8603515625, 3.05078125, 3.2412109375, 3.431640625, 3.6220703125, 3.8125, 4.0029296875, 4.193359375, 4.3837890625, 4.57421875, 4.7646484375, 4.955078125, 5.1455078125, 5.3359375, 5.5263671875, 5.716796875, 5.9072265625, 6.09765625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 12.0, 16.0, 54.0, 104.0, 267.0, 681.0, 1383.0, 907.0, 362.0, 150.0, 66.0, 31.0, 22.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.614990234375, -18.02685546875, -17.438720703125, -16.8505859375, -16.262451171875, -15.67431640625, -15.086181640625, -14.498046875, -13.909912109375, -13.32177734375, -12.733642578125, -12.1455078125, -11.557373046875, -10.96923828125, -10.381103515625, -9.79296875, -9.204833984375, -8.61669921875, -8.028564453125, -7.4404296875, -6.852294921875, -6.26416015625, -5.676025390625, -5.087890625, -4.499755859375, -3.91162109375, -3.323486328125, -2.7353515625, -2.147216796875, -1.55908203125, -0.970947265625, -0.3828125, 0.205322265625, 0.79345703125, 1.381591796875, 1.9697265625, 2.557861328125, 3.14599609375, 3.734130859375, 4.322265625, 4.910400390625, 5.49853515625, 6.086669921875, 6.6748046875, 7.262939453125, 7.85107421875, 8.439208984375, 9.02734375, 9.615478515625, 10.20361328125, 10.791748046875, 11.3798828125, 11.968017578125, 12.55615234375, 13.144287109375, 13.732421875, 14.320556640625, 14.90869140625, 15.496826171875, 16.0849609375, 16.673095703125, 17.26123046875, 17.849365234375, 18.4375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 2.0, 8.0, 26.0, 24.0, 58.0, 124.0, 257.0, 712.0, 2667.0, 79438.0, 4099747.0, 8932.0, 1416.0, 465.0, 193.0, 99.0, 46.0, 22.0, 11.0, 5.0, 7.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-53.03125, -51.43798828125, -49.8447265625, -48.25146484375, -46.658203125, -45.06494140625, -43.4716796875, -41.87841796875, -40.28515625, -38.69189453125, -37.0986328125, -35.50537109375, -33.912109375, -32.31884765625, -30.7255859375, -29.13232421875, -27.5390625, -25.94580078125, -24.3525390625, -22.75927734375, -21.166015625, -19.57275390625, -17.9794921875, -16.38623046875, -14.79296875, -13.19970703125, -11.6064453125, -10.01318359375, -8.419921875, -6.82666015625, -5.2333984375, -3.64013671875, -2.046875, -0.45361328125, 1.1396484375, 2.73291015625, 4.326171875, 5.91943359375, 7.5126953125, 9.10595703125, 10.69921875, 12.29248046875, 13.8857421875, 15.47900390625, 17.072265625, 18.66552734375, 20.2587890625, 21.85205078125, 23.4453125, 25.03857421875, 26.6318359375, 28.22509765625, 29.818359375, 31.41162109375, 33.0048828125, 34.59814453125, 36.19140625, 37.78466796875, 39.3779296875, 40.97119140625, 42.564453125, 44.15771484375, 45.7509765625, 47.34423828125, 48.9375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 84.0, 295.0, 382.0, 197.0, 40.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.72069549560547, -42.622344970703125, -40.523990631103516, -38.425636291503906, -36.32728576660156, -34.22893524169922, -32.13058090209961, -30.032228469848633, -27.933876037597656, -25.83552360534668, -23.737171173095703, -21.638818740844727, -19.54046630859375, -17.442113876342773, -15.343761444091797, -13.24540901184082, -11.147056579589844, -9.048704147338867, -6.950351715087891, -4.851999282836914, -2.7536468505859375, -0.6552944183349609, 1.4430580139160156, 3.541410446166992, 5.639762878417969, 7.738115310668945, 9.836467742919922, 11.934820175170898, 14.033172607421875, 16.13152503967285, 18.229877471923828, 20.328229904174805, 22.42657470703125, 24.524927139282227, 26.623279571533203, 28.72163200378418, 30.819984436035156, 32.9183349609375, 35.01668930053711, 37.11504364013672, 39.21339416503906, 41.311744689941406, 43.410099029541016, 45.508453369140625, 47.60680389404297, 49.70515441894531, 51.80350875854492, 53.90186309814453, 56.000213623046875, 58.09856414794922, 60.19691848754883, 62.29527282714844, 64.39362335205078, 66.49197387695312, 68.59033203125, 70.68868255615234, 72.78703308105469, 74.88538360595703, 76.98373413085938, 79.08209228515625, 81.1804428100586, 83.27879333496094, 85.37715148925781, 87.47550201416016, 89.5738525390625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 9.0, 9.0, 11.0, 10.0, 15.0, 18.0, 15.0, 21.0, 20.0, 28.0, 29.0, 38.0, 32.0, 45.0, 43.0, 37.0, 45.0, 42.0, 36.0, 42.0, 41.0, 44.0, 45.0, 37.0, 36.0, 26.0, 29.0, 35.0, 27.0, 26.0, 15.0, 14.0, 17.0, 12.0, 12.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-26.552268981933594, -25.800241470336914, -25.048215866088867, -24.296188354492188, -23.54416275024414, -22.79213523864746, -22.040109634399414, -21.288082122802734, -20.536056518554688, -19.784029006958008, -19.03200340270996, -18.27997589111328, -17.527950286865234, -16.775922775268555, -16.023897171020508, -15.271869659423828, -14.519843101501465, -13.767816543579102, -13.015789985656738, -12.263763427734375, -11.511736869812012, -10.759710311889648, -10.007682800292969, -9.255657196044922, -8.503629684448242, -7.751603126525879, -6.999576568603516, -6.247550010681152, -5.495523452758789, -4.743496894836426, -3.9914698600769043, -3.239443302154541, -2.487417221069336, -1.7353906631469727, -0.9833639860153198, -0.231337308883667, 0.5206892490386963, 1.2727158069610596, 2.024742603302002, 2.7767691612243652, 3.5287957191467285, 4.280822277069092, 5.032848834991455, 5.784875869750977, 6.53690242767334, 7.288928985595703, 8.040955543518066, 8.79298210144043, 9.545008659362793, 10.297035217285156, 11.04906177520752, 11.801088333129883, 12.553114891052246, 13.30514144897461, 14.057168960571289, 14.809194564819336, 15.561222076416016, 16.313249588012695, 17.065275192260742, 17.817302703857422, 18.56932830810547, 19.32135581970215, 20.073381423950195, 20.825408935546875, 21.577434539794922]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 12.0, 10.0, 16.0, 21.0, 11.0, 21.0, 34.0, 28.0, 24.0, 34.0, 39.0, 27.0, 36.0, 42.0, 36.0, 37.0, 40.0, 38.0, 46.0, 35.0, 32.0, 34.0, 35.0, 38.0, 24.0, 36.0, 21.0, 21.0, 29.0, 15.0, 15.0, 17.0, 13.0, 8.0, 3.0, 8.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-2.05859375, -1.99981689453125, -1.9410400390625, -1.88226318359375, -1.823486328125, -1.76470947265625, -1.7059326171875, -1.64715576171875, -1.58837890625, -1.52960205078125, -1.4708251953125, -1.41204833984375, -1.353271484375, -1.29449462890625, -1.2357177734375, -1.17694091796875, -1.1181640625, -1.05938720703125, -1.0006103515625, -0.94183349609375, -0.883056640625, -0.82427978515625, -0.7655029296875, -0.70672607421875, -0.64794921875, -0.58917236328125, -0.5303955078125, -0.47161865234375, -0.412841796875, -0.35406494140625, -0.2952880859375, -0.23651123046875, -0.177734375, -0.11895751953125, -0.0601806640625, -0.00140380859375, 0.057373046875, 0.11614990234375, 0.1749267578125, 0.23370361328125, 0.29248046875, 0.35125732421875, 0.4100341796875, 0.46881103515625, 0.527587890625, 0.58636474609375, 0.6451416015625, 0.70391845703125, 0.7626953125, 0.82147216796875, 0.8802490234375, 0.93902587890625, 0.997802734375, 1.05657958984375, 1.1153564453125, 1.17413330078125, 1.23291015625, 1.29168701171875, 1.3504638671875, 1.40924072265625, 1.468017578125, 1.52679443359375, 1.5855712890625, 1.64434814453125, 1.703125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 6.0, 14.0, 32.0, 34.0, 46.0, 94.0, 122.0, 174.0, 280.0, 417.0, 624.0, 912.0, 1427.0, 2162.0, 3216.0, 4891.0, 7381.0, 11625.0, 17769.0, 27845.0, 44022.0, 72039.0, 130516.0, 315714.0, 173819.0, 87581.0, 52980.0, 32995.0, 20735.0, 13597.0, 8827.0, 5644.0, 3731.0, 2473.0, 1619.0, 1094.0, 682.0, 459.0, 315.0, 222.0, 161.0, 87.0, 46.0, 47.0, 22.0, 19.0, 16.0, 13.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.41828155517578125, -0.4041900634765625, -0.39009857177734375, -0.376007080078125, -0.36191558837890625, -0.3478240966796875, -0.33373260498046875, -0.31964111328125, -0.30554962158203125, -0.2914581298828125, -0.27736663818359375, -0.263275146484375, -0.24918365478515625, -0.2350921630859375, -0.22100067138671875, -0.2069091796875, -0.19281768798828125, -0.1787261962890625, -0.16463470458984375, -0.150543212890625, -0.13645172119140625, -0.1223602294921875, -0.10826873779296875, -0.09417724609375, -0.08008575439453125, -0.0659942626953125, -0.05190277099609375, -0.037811279296875, -0.02371978759765625, -0.0096282958984375, 0.00446319580078125, 0.0185546875, 0.03264617919921875, 0.0467376708984375, 0.06082916259765625, 0.074920654296875, 0.08901214599609375, 0.1031036376953125, 0.11719512939453125, 0.13128662109375, 0.14537811279296875, 0.1594696044921875, 0.17356109619140625, 0.187652587890625, 0.20174407958984375, 0.2158355712890625, 0.22992706298828125, 0.2440185546875, 0.25811004638671875, 0.2722015380859375, 0.28629302978515625, 0.300384521484375, 0.31447601318359375, 0.3285675048828125, 0.34265899658203125, 0.35675048828125, 0.37084197998046875, 0.3849334716796875, 0.39902496337890625, 0.413116455078125, 0.42720794677734375, 0.4412994384765625, 0.45539093017578125, 0.469482421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 10.0, 8.0, 9.0, 7.0, 6.0, 17.0, 11.0, 13.0, 7.0, 21.0, 33.0, 27.0, 17.0, 31.0, 29.0, 37.0, 34.0, 32.0, 41.0, 30.0, 39.0, 30.0, 1053.0, 40.0, 41.0, 37.0, 27.0, 31.0, 38.0, 30.0, 26.0, 23.0, 23.0, 29.0, 22.0, 19.0, 16.0, 10.0, 14.0, 9.0, 10.0, 7.0, 13.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0], "bins": [-1.341796875, -1.3057785034179688, -1.2697601318359375, -1.2337417602539062, -1.197723388671875, -1.1617050170898438, -1.1256866455078125, -1.0896682739257812, -1.05364990234375, -1.0176315307617188, -0.9816131591796875, -0.9455947875976562, -0.909576416015625, -0.8735580444335938, -0.8375396728515625, -0.8015213012695312, -0.7655029296875, -0.7294845581054688, -0.6934661865234375, -0.6574478149414062, -0.621429443359375, -0.5854110717773438, -0.5493927001953125, -0.5133743286132812, -0.47735595703125, -0.44133758544921875, -0.4053192138671875, -0.36930084228515625, -0.333282470703125, -0.29726409912109375, -0.2612457275390625, -0.22522735595703125, -0.189208984375, -0.15319061279296875, -0.1171722412109375, -0.08115386962890625, -0.045135498046875, -0.00911712646484375, 0.0269012451171875, 0.06291961669921875, 0.09893798828125, 0.13495635986328125, 0.1709747314453125, 0.20699310302734375, 0.243011474609375, 0.27902984619140625, 0.3150482177734375, 0.35106658935546875, 0.3870849609375, 0.42310333251953125, 0.4591217041015625, 0.49514007568359375, 0.531158447265625, 0.5671768188476562, 0.6031951904296875, 0.6392135620117188, 0.67523193359375, 0.7112503051757812, 0.7472686767578125, 0.7832870483398438, 0.819305419921875, 0.8553237915039062, 0.8913421630859375, 0.9273605346679688, 0.96337890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 12.0, 23.0, 36.0, 46.0, 78.0, 154.0, 179.0, 267.0, 500.0, 668.0, 1040.0, 1735.0, 2635.0, 4244.0, 6796.0, 11103.0, 18051.0, 30982.0, 53147.0, 94262.0, 200786.0, 1379612.0, 124792.0, 67575.0, 38802.0, 22883.0, 14101.0, 8459.0, 5185.0, 3302.0, 2114.0, 1308.0, 775.0, 516.0, 302.0, 201.0, 148.0, 93.0, 66.0, 37.0, 31.0, 32.0, 13.0, 9.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.41304779052734375, -0.3978729248046875, -0.38269805908203125, -0.367523193359375, -0.35234832763671875, -0.3371734619140625, -0.32199859619140625, -0.30682373046875, -0.29164886474609375, -0.2764739990234375, -0.26129913330078125, -0.246124267578125, -0.23094940185546875, -0.2157745361328125, -0.20059967041015625, -0.1854248046875, -0.17024993896484375, -0.1550750732421875, -0.13990020751953125, -0.124725341796875, -0.10955047607421875, -0.0943756103515625, -0.07920074462890625, -0.06402587890625, -0.04885101318359375, -0.0336761474609375, -0.01850128173828125, -0.003326416015625, 0.01184844970703125, 0.0270233154296875, 0.04219818115234375, 0.057373046875, 0.07254791259765625, 0.0877227783203125, 0.10289764404296875, 0.118072509765625, 0.13324737548828125, 0.1484222412109375, 0.16359710693359375, 0.17877197265625, 0.19394683837890625, 0.2091217041015625, 0.22429656982421875, 0.239471435546875, 0.25464630126953125, 0.2698211669921875, 0.28499603271484375, 0.3001708984375, 0.31534576416015625, 0.3305206298828125, 0.34569549560546875, 0.360870361328125, 0.37604522705078125, 0.3912200927734375, 0.40639495849609375, 0.42156982421875, 0.43674468994140625, 0.4519195556640625, 0.46709442138671875, 0.482269287109375, 0.49744415283203125, 0.5126190185546875, 0.5277938842773438, 0.54296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 4.0, 12.0, 11.0, 13.0, 18.0, 29.0, 42.0, 46.0, 59.0, 75.0, 97.0, 127.0, 113.0, 88.0, 61.0, 50.0, 32.0, 26.0, 22.0, 12.0, 7.0, 10.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.000385284423828125, -0.0003730654716491699, -0.00036084651947021484, -0.00034862756729125977, -0.0003364086151123047, -0.0003241896629333496, -0.00031197071075439453, -0.00029975175857543945, -0.0002875328063964844, -0.0002753138542175293, -0.0002630949020385742, -0.00025087594985961914, -0.00023865699768066406, -0.00022643804550170898, -0.0002142190933227539, -0.00020200014114379883, -0.00018978118896484375, -0.00017756223678588867, -0.0001653432846069336, -0.00015312433242797852, -0.00014090538024902344, -0.00012868642807006836, -0.00011646747589111328, -0.0001042485237121582, -9.202957153320312e-05, -7.981061935424805e-05, -6.759166717529297e-05, -5.537271499633789e-05, -4.315376281738281e-05, -3.0934810638427734e-05, -1.8715858459472656e-05, -6.496906280517578e-06, 5.7220458984375e-06, 1.7940998077392578e-05, 3.0159950256347656e-05, 4.2378902435302734e-05, 5.459785461425781e-05, 6.681680679321289e-05, 7.903575897216797e-05, 9.125471115112305e-05, 0.00010347366333007812, 0.0001156926155090332, 0.00012791156768798828, 0.00014013051986694336, 0.00015234947204589844, 0.00016456842422485352, 0.0001767873764038086, 0.00018900632858276367, 0.00020122528076171875, 0.00021344423294067383, 0.0002256631851196289, 0.00023788213729858398, 0.00025010108947753906, 0.00026232004165649414, 0.0002745389938354492, 0.0002867579460144043, 0.0002989768981933594, 0.00031119585037231445, 0.00032341480255126953, 0.0003356337547302246, 0.0003478527069091797, 0.00036007165908813477, 0.00037229061126708984, 0.0003845095634460449, 0.000396728515625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 3.0, 6.0, 8.0, 10.0, 6.0, 14.0, 24.0, 12.0, 27.0, 32.0, 69.0, 76.0, 135.0, 165.0, 274.0, 439.0, 843.0, 61082.0, 982778.0, 1088.0, 519.0, 291.0, 172.0, 136.0, 86.0, 69.0, 45.0, 25.0, 19.0, 14.0, 13.0, 9.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 5.0, 1.0, 4.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006679534912109375, -0.006464958190917969, -0.0062503814697265625, -0.006035804748535156, -0.00582122802734375, -0.005606651306152344, -0.0053920745849609375, -0.005177497863769531, -0.004962921142578125, -0.004748344421386719, -0.0045337677001953125, -0.004319190979003906, -0.0041046142578125, -0.0038900375366210938, -0.0036754608154296875, -0.0034608840942382812, -0.003246307373046875, -0.0030317306518554688, -0.0028171539306640625, -0.0026025772094726562, -0.00238800048828125, -0.0021734237670898438, -0.0019588470458984375, -0.0017442703247070312, -0.001529693603515625, -0.0013151168823242188, -0.0011005401611328125, -0.0008859634399414062, -0.00067138671875, -0.00045680999755859375, -0.0002422332763671875, -2.765655517578125e-05, 0.000186920166015625, 0.00040149688720703125, 0.0006160736083984375, 0.0008306503295898438, 0.00104522705078125, 0.0012598037719726562, 0.0014743804931640625, 0.0016889572143554688, 0.001903533935546875, 0.0021181106567382812, 0.0023326873779296875, 0.0025472640991210938, 0.0027618408203125, 0.0029764175415039062, 0.0031909942626953125, 0.0034055709838867188, 0.003620147705078125, 0.0038347244262695312, 0.0040493011474609375, 0.004263877868652344, 0.00447845458984375, 0.004693031311035156, 0.0049076080322265625, 0.005122184753417969, 0.005336761474609375, 0.005551338195800781, 0.0057659149169921875, 0.005980491638183594, 0.006195068359375, 0.006409645080566406, 0.0066242218017578125, 0.006838798522949219, 0.007053375244140625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 41.0, 165.0, 369.0, 324.0, 81.0, 23.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012935695121996105, -0.00011844108666991815, -0.00010752522211987525, -9.660935029387474e-05, -8.569348574383184e-05, -7.477762119378895e-05, -6.386174936778843e-05, -5.2945884817745537e-05, -4.203002026770264e-05, -3.111415571765974e-05, -2.0198287529638037e-05, -9.282419341616333e-06, 1.633445208426565e-06, 1.2549309758469462e-05, 2.3465181584469974e-05, 3.438104613451287e-05, 4.529691068455577e-05, 5.6212775234598666e-05, 6.712863978464156e-05, 7.804451161064208e-05, 8.896037616068497e-05, 9.987624071072787e-05, 0.00011079211253672838, 0.00012170797708677128, 0.00013262384163681418, 0.0001435397134628147, 0.00015445557073689997, 0.00016537144256290048, 0.000176287314388901, 0.00018720317166298628, 0.0001981190434889868, 0.0002090349153149873, 0.00021995074348524213, 0.00023086661531124264, 0.00024178247258532792, 0.00025269834441132843, 0.0002636142016854137, 0.00027453008806332946, 0.00028544594533741474, 0.0002963618026115, 0.0003072776598855853, 0.0003181935171596706, 0.00032910940353758633, 0.0003400252608116716, 0.0003509411180857569, 0.00036185700446367264, 0.0003727728617377579, 0.0003836887190118432, 0.00039460460538975894, 0.00040552046266384423, 0.00041643634904175997, 0.00042735220631584525, 0.00043826806358993053, 0.0004491839208640158, 0.00046009980724193156, 0.00047101566451601684, 0.0004819315508939326, 0.0004928474081680179, 0.0005037632654421031, 0.0005146791227161884, 0.0005255950381979346, 0.0005365108954720199, 0.0005474267527461052, 0.0005583426100201905, 0.0005692584672942758]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 11.0, 7.0, 14.0, 22.0, 22.0, 22.0, 17.0, 22.0, 24.0, 24.0, 35.0, 43.0, 31.0, 36.0, 51.0, 53.0, 47.0, 31.0, 45.0, 28.0, 41.0, 35.0, 48.0, 29.0, 33.0, 30.0, 42.0, 21.0, 14.0, 22.0, 19.0, 21.0, 8.0, 8.0, 4.0, 6.0, 1.0, 7.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017070770263671875, -0.00016574375331401825, -0.00016077980399131775, -0.00015581585466861725, -0.00015085190534591675, -0.00014588795602321625, -0.00014092400670051575, -0.00013596005737781525, -0.00013099610805511475, -0.00012603215873241425, -0.00012106820940971375, -0.00011610426008701324, -0.00011114031076431274, -0.00010617636144161224, -0.00010121241211891174, -9.624846279621124e-05, -9.128451347351074e-05, -8.632056415081024e-05, -8.135661482810974e-05, -7.639266550540924e-05, -7.142871618270874e-05, -6.646476686000824e-05, -6.150081753730774e-05, -5.653686821460724e-05, -5.157291889190674e-05, -4.660896956920624e-05, -4.164502024650574e-05, -3.668107092380524e-05, -3.1717121601104736e-05, -2.6753172278404236e-05, -2.1789222955703735e-05, -1.6825273633003235e-05, -1.1861324310302734e-05, -6.897374987602234e-06, -1.9334256649017334e-06, 3.030523657798767e-06, 7.994472980499268e-06, 1.2958422303199768e-05, 1.792237162590027e-05, 2.288632094860077e-05, 2.785027027130127e-05, 3.281421959400177e-05, 3.777816891670227e-05, 4.274211823940277e-05, 4.770606756210327e-05, 5.267001688480377e-05, 5.763396620750427e-05, 6.259791553020477e-05, 6.756186485290527e-05, 7.252581417560577e-05, 7.748976349830627e-05, 8.245371282100677e-05, 8.741766214370728e-05, 9.238161146640778e-05, 9.734556078910828e-05, 0.00010230951011180878, 0.00010727345943450928, 0.00011223740875720978, 0.00011720135807991028, 0.00012216530740261078, 0.00012712925672531128, 0.00013209320604801178, 0.00013705715537071228, 0.00014202110469341278, 0.00014698505401611328]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 12.0, 10.0, 16.0, 21.0, 11.0, 21.0, 34.0, 28.0, 24.0, 34.0, 39.0, 27.0, 36.0, 42.0, 36.0, 37.0, 40.0, 38.0, 46.0, 35.0, 32.0, 34.0, 35.0, 38.0, 24.0, 36.0, 21.0, 21.0, 29.0, 15.0, 15.0, 17.0, 13.0, 8.0, 3.0, 8.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-2.05859375, -1.99981689453125, -1.9410400390625, -1.88226318359375, -1.823486328125, -1.76470947265625, -1.7059326171875, -1.64715576171875, -1.58837890625, -1.52960205078125, -1.4708251953125, -1.41204833984375, -1.353271484375, -1.29449462890625, -1.2357177734375, -1.17694091796875, -1.1181640625, -1.05938720703125, -1.0006103515625, -0.94183349609375, -0.883056640625, -0.82427978515625, -0.7655029296875, -0.70672607421875, -0.64794921875, -0.58917236328125, -0.5303955078125, -0.47161865234375, -0.412841796875, -0.35406494140625, -0.2952880859375, -0.23651123046875, -0.177734375, -0.11895751953125, -0.0601806640625, -0.00140380859375, 0.057373046875, 0.11614990234375, 0.1749267578125, 0.23370361328125, 0.29248046875, 0.35125732421875, 0.4100341796875, 0.46881103515625, 0.527587890625, 0.58636474609375, 0.6451416015625, 0.70391845703125, 0.7626953125, 0.82147216796875, 0.8802490234375, 0.93902587890625, 0.997802734375, 1.05657958984375, 1.1153564453125, 1.17413330078125, 1.23291015625, 1.29168701171875, 1.3504638671875, 1.40924072265625, 1.468017578125, 1.52679443359375, 1.5855712890625, 1.64434814453125, 1.703125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 12.0, 6.0, 13.0, 17.0, 18.0, 34.0, 34.0, 40.0, 76.0, 100.0, 92.0, 178.0, 203.0, 308.0, 383.0, 508.0, 779.0, 1022.0, 1590.0, 2285.0, 3571.0, 6127.0, 11608.0, 30470.0, 256039.0, 638337.0, 57605.0, 15852.0, 7805.0, 4511.0, 2798.0, 1735.0, 1229.0, 857.0, 611.0, 455.0, 309.0, 253.0, 164.0, 141.0, 87.0, 67.0, 62.0, 43.0, 29.0, 20.0, 21.0, 15.0, 12.0, 11.0, 5.0, 8.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.6038818359375, -9.285888671875, -8.9678955078125, -8.64990234375, -8.3319091796875, -8.013916015625, -7.6959228515625, -7.3779296875, -7.0599365234375, -6.741943359375, -6.4239501953125, -6.10595703125, -5.7879638671875, -5.469970703125, -5.1519775390625, -4.833984375, -4.5159912109375, -4.197998046875, -3.8800048828125, -3.56201171875, -3.2440185546875, -2.926025390625, -2.6080322265625, -2.2900390625, -1.9720458984375, -1.654052734375, -1.3360595703125, -1.01806640625, -0.7000732421875, -0.382080078125, -0.0640869140625, 0.25390625, 0.5718994140625, 0.889892578125, 1.2078857421875, 1.52587890625, 1.8438720703125, 2.161865234375, 2.4798583984375, 2.7978515625, 3.1158447265625, 3.433837890625, 3.7518310546875, 4.06982421875, 4.3878173828125, 4.705810546875, 5.0238037109375, 5.341796875, 5.6597900390625, 5.977783203125, 6.2957763671875, 6.61376953125, 6.9317626953125, 7.249755859375, 7.5677490234375, 7.8857421875, 8.2037353515625, 8.521728515625, 8.8397216796875, 9.15771484375, 9.4757080078125, 9.793701171875, 10.1116943359375, 10.4296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 4.0, 9.0, 9.0, 12.0, 9.0, 14.0, 15.0, 18.0, 18.0, 24.0, 27.0, 26.0, 27.0, 30.0, 37.0, 45.0, 69.0, 57.0, 110.0, 237.0, 1364.0, 244.0, 138.0, 73.0, 53.0, 44.0, 41.0, 43.0, 30.0, 30.0, 33.0, 24.0, 19.0, 18.0, 17.0, 14.0, 10.0, 5.0, 9.0, 8.0, 7.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.1015625, -4.93524169921875, -4.7689208984375, -4.60260009765625, -4.436279296875, -4.26995849609375, -4.1036376953125, -3.93731689453125, -3.77099609375, -3.60467529296875, -3.4383544921875, -3.27203369140625, -3.105712890625, -2.93939208984375, -2.7730712890625, -2.60675048828125, -2.4404296875, -2.27410888671875, -2.1077880859375, -1.94146728515625, -1.775146484375, -1.60882568359375, -1.4425048828125, -1.27618408203125, -1.10986328125, -0.94354248046875, -0.7772216796875, -0.61090087890625, -0.444580078125, -0.27825927734375, -0.1119384765625, 0.05438232421875, 0.220703125, 0.38702392578125, 0.5533447265625, 0.71966552734375, 0.885986328125, 1.05230712890625, 1.2186279296875, 1.38494873046875, 1.55126953125, 1.71759033203125, 1.8839111328125, 2.05023193359375, 2.216552734375, 2.38287353515625, 2.5491943359375, 2.71551513671875, 2.8818359375, 3.04815673828125, 3.2144775390625, 3.38079833984375, 3.547119140625, 3.71343994140625, 3.8797607421875, 4.04608154296875, 4.21240234375, 4.37872314453125, 4.5450439453125, 4.71136474609375, 4.877685546875, 5.04400634765625, 5.2103271484375, 5.37664794921875, 5.54296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 3.0, 4.0, 5.0, 10.0, 14.0, 14.0, 12.0, 14.0, 16.0, 14.0, 26.0, 38.0, 37.0, 47.0, 71.0, 100.0, 214.0, 483.0, 1904.0, 74589.0, 3056935.0, 9117.0, 1103.0, 364.0, 157.0, 101.0, 47.0, 46.0, 33.0, 25.0, 20.0, 23.0, 13.0, 17.0, 16.0, 10.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.40625, -23.695068359375, -22.98388671875, -22.272705078125, -21.5615234375, -20.850341796875, -20.13916015625, -19.427978515625, -18.716796875, -18.005615234375, -17.29443359375, -16.583251953125, -15.8720703125, -15.160888671875, -14.44970703125, -13.738525390625, -13.02734375, -12.316162109375, -11.60498046875, -10.893798828125, -10.1826171875, -9.471435546875, -8.76025390625, -8.049072265625, -7.337890625, -6.626708984375, -5.91552734375, -5.204345703125, -4.4931640625, -3.781982421875, -3.07080078125, -2.359619140625, -1.6484375, -0.937255859375, -0.22607421875, 0.485107421875, 1.1962890625, 1.907470703125, 2.61865234375, 3.329833984375, 4.041015625, 4.752197265625, 5.46337890625, 6.174560546875, 6.8857421875, 7.596923828125, 8.30810546875, 9.019287109375, 9.73046875, 10.441650390625, 11.15283203125, 11.864013671875, 12.5751953125, 13.286376953125, 13.99755859375, 14.708740234375, 15.419921875, 16.131103515625, 16.84228515625, 17.553466796875, 18.2646484375, 18.975830078125, 19.68701171875, 20.398193359375, 21.109375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 47.0, 963.0, 5.0, 4.0, 1.0, 1.0], "bins": [-219.2111053466797, -215.51856994628906, -211.82603454589844, -208.13348388671875, -204.44094848632812, -200.7484130859375, -197.05587768554688, -193.36334228515625, -189.67079162597656, -185.97825622558594, -182.2857208251953, -178.59317016601562, -174.900634765625, -171.20809936523438, -167.51556396484375, -163.82302856445312, -160.1304931640625, -156.43795776367188, -152.74542236328125, -149.05287170410156, -145.36033630371094, -141.6678009033203, -137.9752655029297, -134.28271484375, -130.59017944335938, -126.89764404296875, -123.2051010131836, -119.51256561279297, -115.82002258300781, -112.12748718261719, -108.43495178222656, -104.7424087524414, -101.04986572265625, -97.35733032226562, -93.66478729248047, -89.97225189208984, -86.27970886230469, -82.58717346191406, -78.89463806152344, -75.20209503173828, -71.50955200195312, -67.8170166015625, -64.12447357177734, -60.43193817138672, -56.73939514160156, -53.04685974121094, -49.35432052612305, -45.661781311035156, -41.969242095947266, -38.276702880859375, -34.584163665771484, -30.891626358032227, -27.199087142944336, -23.506547927856445, -19.814010620117188, -16.121471405029297, -12.428932189941406, -8.736392974853516, -5.043854713439941, -1.3513164520263672, 2.3412227630615234, 6.033761978149414, 9.726299285888672, 13.418838500976562, 17.111377716064453]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 3.0, 7.0, 9.0, 9.0, 14.0, 6.0, 15.0, 18.0, 19.0, 17.0, 30.0, 27.0, 32.0, 29.0, 35.0, 36.0, 40.0, 47.0, 39.0, 48.0, 32.0, 41.0, 39.0, 39.0, 51.0, 32.0, 35.0, 37.0, 28.0, 29.0, 19.0, 23.0, 21.0, 17.0, 16.0, 14.0, 14.0, 4.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.64004135131836, -20.046937942504883, -19.453834533691406, -18.860729217529297, -18.26762580871582, -17.674522399902344, -17.081418991088867, -16.48831558227539, -15.895210266113281, -15.302106857299805, -14.709002494812012, -14.115899085998535, -13.522794723510742, -12.929691314697266, -12.336587905883789, -11.743483543395996, -11.15038013458252, -10.557276725769043, -9.96417236328125, -9.371068954467773, -8.77796459197998, -8.184861183166504, -7.591757297515869, -6.998653411865234, -6.4055495262146, -5.812445640563965, -5.21934175491333, -4.626237869262695, -4.033134460449219, -3.440030336380005, -2.846926689147949, -2.2538228034973145, -1.6607189178466797, -1.067615032196045, -0.4745112657546997, 0.11859250068664551, 0.7116963863372803, 1.304800271987915, 1.8979039192199707, 2.4910078048706055, 3.0841116905212402, 3.677215576171875, 4.27031946182251, 4.8634233474731445, 5.456526756286621, 6.049631118774414, 6.642734527587891, 7.235838413238525, 7.82894229888916, 8.422045707702637, 9.01515007019043, 9.608253479003906, 10.2013578414917, 10.794461250305176, 11.387565612792969, 11.980669021606445, 12.573772430419922, 13.166875839233398, 13.759980201721191, 14.353083610534668, 14.946187973022461, 15.539291381835938, 16.132394790649414, 16.72549819946289, 17.318603515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 3.0, 7.0, 5.0, 9.0, 14.0, 13.0, 13.0, 15.0, 19.0, 16.0, 24.0, 19.0, 35.0, 28.0, 32.0, 23.0, 35.0, 47.0, 27.0, 45.0, 45.0, 42.0, 32.0, 45.0, 30.0, 38.0, 39.0, 29.0, 35.0, 27.0, 32.0, 30.0, 26.0, 16.0, 23.0, 11.0, 18.0, 16.0, 6.0, 7.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 5.0], "bins": [-2.314453125, -2.2505950927734375, -2.186737060546875, -2.1228790283203125, -2.05902099609375, -1.9951629638671875, -1.931304931640625, -1.8674468994140625, -1.8035888671875, -1.7397308349609375, -1.675872802734375, -1.6120147705078125, -1.54815673828125, -1.4842987060546875, -1.420440673828125, -1.3565826416015625, -1.292724609375, -1.2288665771484375, -1.165008544921875, -1.1011505126953125, -1.03729248046875, -0.9734344482421875, -0.909576416015625, -0.8457183837890625, -0.7818603515625, -0.7180023193359375, -0.654144287109375, -0.5902862548828125, -0.52642822265625, -0.4625701904296875, -0.398712158203125, -0.3348541259765625, -0.27099609375, -0.2071380615234375, -0.143280029296875, -0.0794219970703125, -0.01556396484375, 0.0482940673828125, 0.112152099609375, 0.1760101318359375, 0.2398681640625, 0.3037261962890625, 0.367584228515625, 0.4314422607421875, 0.49530029296875, 0.5591583251953125, 0.623016357421875, 0.6868743896484375, 0.750732421875, 0.8145904541015625, 0.878448486328125, 0.9423065185546875, 1.00616455078125, 1.0700225830078125, 1.133880615234375, 1.1977386474609375, 1.2615966796875, 1.3254547119140625, 1.389312744140625, 1.4531707763671875, 1.51702880859375, 1.5808868408203125, 1.644744873046875, 1.7086029052734375, 1.7724609375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 10.0, 15.0, 19.0, 22.0, 34.0, 42.0, 58.0, 85.0, 112.0, 166.0, 271.0, 403.0, 715.0, 1244.0, 2303.0, 4733.0, 10777.0, 29396.0, 152462.0, 2597760.0, 1273820.0, 82225.0, 20830.0, 8201.0, 3842.0, 1949.0, 1070.0, 630.0, 342.0, 229.0, 136.0, 96.0, 82.0, 44.0, 47.0, 26.0, 16.0, 14.0, 10.0, 7.0, 5.0, 2.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.140625, -9.8319091796875, -9.523193359375, -9.2144775390625, -8.90576171875, -8.5970458984375, -8.288330078125, -7.9796142578125, -7.6708984375, -7.3621826171875, -7.053466796875, -6.7447509765625, -6.43603515625, -6.1273193359375, -5.818603515625, -5.5098876953125, -5.201171875, -4.8924560546875, -4.583740234375, -4.2750244140625, -3.96630859375, -3.6575927734375, -3.348876953125, -3.0401611328125, -2.7314453125, -2.4227294921875, -2.114013671875, -1.8052978515625, -1.49658203125, -1.1878662109375, -0.879150390625, -0.5704345703125, -0.26171875, 0.0469970703125, 0.355712890625, 0.6644287109375, 0.97314453125, 1.2818603515625, 1.590576171875, 1.8992919921875, 2.2080078125, 2.5167236328125, 2.825439453125, 3.1341552734375, 3.44287109375, 3.7515869140625, 4.060302734375, 4.3690185546875, 4.677734375, 4.9864501953125, 5.295166015625, 5.6038818359375, 5.91259765625, 6.2213134765625, 6.530029296875, 6.8387451171875, 7.1474609375, 7.4561767578125, 7.764892578125, 8.0736083984375, 8.38232421875, 8.6910400390625, 8.999755859375, 9.3084716796875, 9.6171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 7.0, 21.0, 17.0, 28.0, 51.0, 66.0, 109.0, 166.0, 287.0, 453.0, 669.0, 723.0, 559.0, 346.0, 205.0, 127.0, 82.0, 47.0, 35.0, 21.0, 20.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.046875, -16.65234375, -16.2578125, -15.86328125, -15.46875, -15.07421875, -14.6796875, -14.28515625, -13.890625, -13.49609375, -13.1015625, -12.70703125, -12.3125, -11.91796875, -11.5234375, -11.12890625, -10.734375, -10.33984375, -9.9453125, -9.55078125, -9.15625, -8.76171875, -8.3671875, -7.97265625, -7.578125, -7.18359375, -6.7890625, -6.39453125, -6.0, -5.60546875, -5.2109375, -4.81640625, -4.421875, -4.02734375, -3.6328125, -3.23828125, -2.84375, -2.44921875, -2.0546875, -1.66015625, -1.265625, -0.87109375, -0.4765625, -0.08203125, 0.3125, 0.70703125, 1.1015625, 1.49609375, 1.890625, 2.28515625, 2.6796875, 3.07421875, 3.46875, 3.86328125, 4.2578125, 4.65234375, 5.046875, 5.44140625, 5.8359375, 6.23046875, 6.625, 7.01953125, 7.4140625, 7.80859375, 8.203125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 7.0, 11.0, 11.0, 18.0, 23.0, 38.0, 45.0, 71.0, 135.0, 198.0, 337.0, 767.0, 3103.0, 427449.0, 3752607.0, 7209.0, 1041.0, 448.0, 268.0, 122.0, 106.0, 72.0, 48.0, 41.0, 18.0, 21.0, 14.0, 9.0, 7.0, 10.0, 6.0, 0.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.53125, -35.27880859375, -34.0263671875, -32.77392578125, -31.521484375, -30.26904296875, -29.0166015625, -27.76416015625, -26.51171875, -25.25927734375, -24.0068359375, -22.75439453125, -21.501953125, -20.24951171875, -18.9970703125, -17.74462890625, -16.4921875, -15.23974609375, -13.9873046875, -12.73486328125, -11.482421875, -10.22998046875, -8.9775390625, -7.72509765625, -6.47265625, -5.22021484375, -3.9677734375, -2.71533203125, -1.462890625, -0.21044921875, 1.0419921875, 2.29443359375, 3.546875, 4.79931640625, 6.0517578125, 7.30419921875, 8.556640625, 9.80908203125, 11.0615234375, 12.31396484375, 13.56640625, 14.81884765625, 16.0712890625, 17.32373046875, 18.576171875, 19.82861328125, 21.0810546875, 22.33349609375, 23.5859375, 24.83837890625, 26.0908203125, 27.34326171875, 28.595703125, 29.84814453125, 31.1005859375, 32.35302734375, 33.60546875, 34.85791015625, 36.1103515625, 37.36279296875, 38.615234375, 39.86767578125, 41.1201171875, 42.37255859375, 43.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 11.0, 464.0, 523.0, 20.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.7997131347656, -285.41876220703125, -280.03778076171875, -274.6568298339844, -269.27587890625, -263.8949279785156, -258.51397705078125, -253.13299560546875, -247.75204467773438, -242.37109375, -236.99012756347656, -231.60916137695312, -226.22821044921875, -220.84725952148438, -215.46629333496094, -210.0853271484375, -204.70437622070312, -199.32342529296875, -193.9424591064453, -188.56149291992188, -183.1805419921875, -177.79959106445312, -172.4186248779297, -167.03765869140625, -161.65670776367188, -156.2757568359375, -150.89479064941406, -145.51382446289062, -140.13287353515625, -134.75192260742188, -129.37095642089844, -123.98999786376953, -118.60903930664062, -113.22808074951172, -107.84712219238281, -102.4661636352539, -97.085205078125, -91.7042465209961, -86.32328796386719, -80.94232940673828, -75.56137084960938, -70.18041229248047, -64.79945373535156, -59.418495178222656, -54.03753662109375, -48.656578063964844, -43.27561950683594, -37.89466094970703, -32.51370620727539, -27.132747650146484, -21.751789093017578, -16.370830535888672, -10.989871978759766, -5.608913421630859, -0.22795486450195312, 5.153003692626953, 10.53396224975586, 15.914920806884766, 21.295879364013672, 26.676837921142578, 32.057796478271484, 37.43875503540039, 42.8197135925293, 48.2006721496582, 53.58163070678711]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 11.0, 11.0, 9.0, 13.0, 17.0, 20.0, 27.0, 21.0, 24.0, 24.0, 35.0, 33.0, 39.0, 36.0, 37.0, 41.0, 28.0, 28.0, 40.0, 42.0, 36.0, 45.0, 31.0, 31.0, 39.0, 34.0, 33.0, 26.0, 31.0, 23.0, 23.0, 17.0, 20.0, 5.0, 20.0, 3.0, 6.0, 5.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.058658599853516, -26.214746475219727, -25.370832443237305, -24.526920318603516, -23.683006286621094, -22.839094161987305, -21.995182037353516, -21.151268005371094, -20.307353973388672, -19.463441848754883, -18.61952781677246, -17.775615692138672, -16.93170166015625, -16.08778953552246, -15.243876457214355, -14.39996337890625, -13.556051254272461, -12.712138175964355, -11.86822509765625, -11.024312973022461, -10.180398941040039, -9.33648681640625, -8.492573738098145, -7.648660659790039, -6.804747581481934, -5.960834503173828, -5.116921424865723, -4.273008823394775, -3.42909574508667, -2.5851826667785645, -1.7412700653076172, -0.8973569869995117, -0.05344200134277344, 0.7904709577560425, 1.6343839168548584, 2.4782967567443848, 3.3222098350524902, 4.166122913360596, 5.010035514831543, 5.853948593139648, 6.697861671447754, 7.541774749755859, 8.385687828063965, 9.22960090637207, 10.07351303100586, 10.917427062988281, 11.76133918762207, 12.605252265930176, 13.449165344238281, 14.293078422546387, 15.136991500854492, 15.980903625488281, 16.824817657470703, 17.668729782104492, 18.51264190673828, 19.356555938720703, 20.200469970703125, 21.044382095336914, 21.888296127319336, 22.732208251953125, 23.576122283935547, 24.420034408569336, 25.263946533203125, 26.107860565185547, 26.951772689819336]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 2.0, 4.0, 5.0, 11.0, 10.0, 5.0, 10.0, 12.0, 17.0, 17.0, 17.0, 22.0, 20.0, 24.0, 28.0, 29.0, 42.0, 34.0, 34.0, 41.0, 42.0, 34.0, 47.0, 37.0, 52.0, 34.0, 37.0, 36.0, 31.0, 28.0, 30.0, 30.0, 26.0, 25.0, 24.0, 18.0, 19.0, 13.0, 11.0, 10.0, 5.0, 8.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.24609375, -2.181304931640625, -2.11651611328125, -2.051727294921875, -1.9869384765625, -1.922149658203125, -1.85736083984375, -1.792572021484375, -1.727783203125, -1.662994384765625, -1.59820556640625, -1.533416748046875, -1.4686279296875, -1.403839111328125, -1.33905029296875, -1.274261474609375, -1.20947265625, -1.144683837890625, -1.07989501953125, -1.015106201171875, -0.9503173828125, -0.885528564453125, -0.82073974609375, -0.755950927734375, -0.691162109375, -0.626373291015625, -0.56158447265625, -0.496795654296875, -0.4320068359375, -0.367218017578125, -0.30242919921875, -0.237640380859375, -0.1728515625, -0.108062744140625, -0.04327392578125, 0.021514892578125, 0.0863037109375, 0.151092529296875, 0.21588134765625, 0.280670166015625, 0.345458984375, 0.410247802734375, 0.47503662109375, 0.539825439453125, 0.6046142578125, 0.669403076171875, 0.73419189453125, 0.798980712890625, 0.86376953125, 0.928558349609375, 0.99334716796875, 1.058135986328125, 1.1229248046875, 1.187713623046875, 1.25250244140625, 1.317291259765625, 1.382080078125, 1.446868896484375, 1.51165771484375, 1.576446533203125, 1.6412353515625, 1.706024169921875, 1.77081298828125, 1.835601806640625, 1.900390625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 3.0, 6.0, 9.0, 14.0, 13.0, 22.0, 63.0, 69.0, 102.0, 132.0, 226.0, 271.0, 447.0, 662.0, 912.0, 1372.0, 1982.0, 2945.0, 4372.0, 6579.0, 9531.0, 14358.0, 21764.0, 33290.0, 52876.0, 88529.0, 175046.0, 311703.0, 125894.0, 69565.0, 42643.0, 27583.0, 18408.0, 12008.0, 8117.0, 5503.0, 3718.0, 2518.0, 1712.0, 1150.0, 784.0, 524.0, 368.0, 236.0, 189.0, 122.0, 84.0, 42.0, 34.0, 23.0, 12.0, 17.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4677734375, -0.45281982421875, -0.4378662109375, -0.42291259765625, -0.407958984375, -0.39300537109375, -0.3780517578125, -0.36309814453125, -0.34814453125, -0.33319091796875, -0.3182373046875, -0.30328369140625, -0.288330078125, -0.27337646484375, -0.2584228515625, -0.24346923828125, -0.228515625, -0.21356201171875, -0.1986083984375, -0.18365478515625, -0.168701171875, -0.15374755859375, -0.1387939453125, -0.12384033203125, -0.10888671875, -0.09393310546875, -0.0789794921875, -0.06402587890625, -0.049072265625, -0.03411865234375, -0.0191650390625, -0.00421142578125, 0.0107421875, 0.02569580078125, 0.0406494140625, 0.05560302734375, 0.070556640625, 0.08551025390625, 0.1004638671875, 0.11541748046875, 0.13037109375, 0.14532470703125, 0.1602783203125, 0.17523193359375, 0.190185546875, 0.20513916015625, 0.2200927734375, 0.23504638671875, 0.25, 0.26495361328125, 0.2799072265625, 0.29486083984375, 0.309814453125, 0.32476806640625, 0.3397216796875, 0.35467529296875, 0.36962890625, 0.38458251953125, 0.3995361328125, 0.41448974609375, 0.429443359375, 0.44439697265625, 0.4593505859375, 0.47430419921875, 0.4892578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 6.0, 5.0, 7.0, 4.0, 8.0, 5.0, 7.0, 15.0, 22.0, 19.0, 15.0, 14.0, 16.0, 17.0, 32.0, 27.0, 39.0, 29.0, 26.0, 35.0, 42.0, 31.0, 32.0, 44.0, 1063.0, 28.0, 35.0, 28.0, 30.0, 36.0, 33.0, 36.0, 25.0, 22.0, 27.0, 28.0, 22.0, 14.0, 20.0, 10.0, 13.0, 8.0, 13.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0], "bins": [-1.2431640625, -1.206146240234375, -1.16912841796875, -1.132110595703125, -1.0950927734375, -1.058074951171875, -1.02105712890625, -0.984039306640625, -0.947021484375, -0.910003662109375, -0.87298583984375, -0.835968017578125, -0.7989501953125, -0.761932373046875, -0.72491455078125, -0.687896728515625, -0.65087890625, -0.613861083984375, -0.57684326171875, -0.539825439453125, -0.5028076171875, -0.465789794921875, -0.42877197265625, -0.391754150390625, -0.354736328125, -0.317718505859375, -0.28070068359375, -0.243682861328125, -0.2066650390625, -0.169647216796875, -0.13262939453125, -0.095611572265625, -0.05859375, -0.021575927734375, 0.01544189453125, 0.052459716796875, 0.0894775390625, 0.126495361328125, 0.16351318359375, 0.200531005859375, 0.237548828125, 0.274566650390625, 0.31158447265625, 0.348602294921875, 0.3856201171875, 0.422637939453125, 0.45965576171875, 0.496673583984375, 0.53369140625, 0.570709228515625, 0.60772705078125, 0.644744873046875, 0.6817626953125, 0.718780517578125, 0.75579833984375, 0.792816162109375, 0.829833984375, 0.866851806640625, 0.90386962890625, 0.940887451171875, 0.9779052734375, 1.014923095703125, 1.05194091796875, 1.088958740234375, 1.1259765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 6.0, 12.0, 20.0, 29.0, 30.0, 63.0, 77.0, 93.0, 147.0, 194.0, 359.0, 525.0, 789.0, 1124.0, 1755.0, 2523.0, 4083.0, 6355.0, 9453.0, 15274.0, 24430.0, 40491.0, 68891.0, 125947.0, 1382406.0, 184782.0, 90943.0, 52180.0, 31306.0, 18981.0, 11890.0, 7520.0, 4814.0, 3105.0, 2102.0, 1384.0, 919.0, 692.0, 467.0, 291.0, 204.0, 142.0, 107.0, 63.0, 44.0, 34.0, 30.0, 14.0, 14.0, 13.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.466064453125, -0.4509010314941406, -0.43573760986328125, -0.4205741882324219, -0.4054107666015625, -0.3902473449707031, -0.37508392333984375, -0.3599205017089844, -0.344757080078125, -0.3295936584472656, -0.31443023681640625, -0.2992668151855469, -0.2841033935546875, -0.2689399719238281, -0.25377655029296875, -0.23861312866210938, -0.22344970703125, -0.20828628540039062, -0.19312286376953125, -0.17795944213867188, -0.1627960205078125, -0.14763259887695312, -0.13246917724609375, -0.11730575561523438, -0.102142333984375, -0.08697891235351562, -0.07181549072265625, -0.056652069091796875, -0.0414886474609375, -0.026325225830078125, -0.01116180419921875, 0.004001617431640625, 0.0191650390625, 0.034328460693359375, 0.04949188232421875, 0.06465530395507812, 0.0798187255859375, 0.09498214721679688, 0.11014556884765625, 0.12530899047851562, 0.140472412109375, 0.15563583374023438, 0.17079925537109375, 0.18596267700195312, 0.2011260986328125, 0.21628952026367188, 0.23145294189453125, 0.24661636352539062, 0.26177978515625, 0.2769432067871094, 0.29210662841796875, 0.3072700500488281, 0.3224334716796875, 0.3375968933105469, 0.35276031494140625, 0.3679237365722656, 0.383087158203125, 0.3982505798339844, 0.41341400146484375, 0.4285774230957031, 0.4437408447265625, 0.4589042663574219, 0.47406768798828125, 0.4892311096191406, 0.50439453125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 5.0, 14.0, 21.0, 24.0, 24.0, 42.0, 63.0, 69.0, 79.0, 108.0, 99.0, 90.0, 73.0, 63.0, 57.0, 30.0, 35.0, 25.0, 17.0, 12.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005121231079101562, -0.0004980526864528656, -0.00048398226499557495, -0.0004699118435382843, -0.00045584142208099365, -0.000441771000623703, -0.00042770057916641235, -0.0004136301577091217, -0.00039955973625183105, -0.0003854893147945404, -0.00037141889333724976, -0.0003573484718799591, -0.00034327805042266846, -0.0003292076289653778, -0.00031513720750808716, -0.0003010667860507965, -0.00028699636459350586, -0.0002729259431362152, -0.00025885552167892456, -0.0002447851002216339, -0.00023071467876434326, -0.0002166442573070526, -0.00020257383584976196, -0.0001885034143924713, -0.00017443299293518066, -0.00016036257147789001, -0.00014629215002059937, -0.00013222172856330872, -0.00011815130710601807, -0.00010408088564872742, -9.001046419143677e-05, -7.594004273414612e-05, -6.186962127685547e-05, -4.779919981956482e-05, -3.372877836227417e-05, -1.965835690498352e-05, -5.587935447692871e-06, 8.482486009597778e-06, 2.2552907466888428e-05, 3.662332892417908e-05, 5.0693750381469727e-05, 6.476417183876038e-05, 7.883459329605103e-05, 9.290501475334167e-05, 0.00010697543621063232, 0.00012104585766792297, 0.00013511627912521362, 0.00014918670058250427, 0.00016325712203979492, 0.00017732754349708557, 0.00019139796495437622, 0.00020546838641166687, 0.00021953880786895752, 0.00023360922932624817, 0.0002476796507835388, 0.00026175007224082947, 0.0002758204936981201, 0.00028989091515541077, 0.0003039613366127014, 0.00031803175806999207, 0.0003321021795272827, 0.00034617260098457336, 0.000360243022441864, 0.00037431344389915466, 0.0003883838653564453]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 14.0, 18.0, 40.0, 53.0, 78.0, 107.0, 143.0, 267.0, 709.0, 249744.0, 795750.0, 751.0, 321.0, 173.0, 119.0, 64.0, 38.0, 45.0, 27.0, 18.0, 15.0, 11.0, 11.0, 5.0, 4.0, 4.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009918212890625, -0.009608626365661621, -0.009299039840698242, -0.008989453315734863, -0.008679866790771484, -0.008370280265808105, -0.008060693740844727, -0.007751107215881348, -0.007441520690917969, -0.00713193416595459, -0.006822347640991211, -0.006512761116027832, -0.006203174591064453, -0.005893588066101074, -0.005584001541137695, -0.005274415016174316, -0.0049648284912109375, -0.004655241966247559, -0.00434565544128418, -0.004036068916320801, -0.003726482391357422, -0.003416895866394043, -0.003107309341430664, -0.002797722816467285, -0.0024881362915039062, -0.0021785497665405273, -0.0018689632415771484, -0.0015593767166137695, -0.0012497901916503906, -0.0009402036666870117, -0.0006306171417236328, -0.0003210306167602539, -1.1444091796875e-05, 0.0002981424331665039, 0.0006077289581298828, 0.0009173154830932617, 0.0012269020080566406, 0.0015364885330200195, 0.0018460750579833984, 0.0021556615829467773, 0.0024652481079101562, 0.002774834632873535, 0.003084421157836914, 0.003394007682800293, 0.003703594207763672, 0.004013180732727051, 0.00432276725769043, 0.004632353782653809, 0.0049419403076171875, 0.005251526832580566, 0.005561113357543945, 0.005870699882507324, 0.006180286407470703, 0.006489872932434082, 0.006799459457397461, 0.00710904598236084, 0.007418632507324219, 0.007728219032287598, 0.008037805557250977, 0.008347392082214355, 0.008656978607177734, 0.008966565132141113, 0.009276151657104492, 0.009585738182067871, 0.00989532470703125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 22.0, 94.0, 296.0, 387.0, 170.0, 38.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006656274199485779, -0.0006498635630123317, -0.0006340997642837465, -0.0006183359073475003, -0.0006025721086189151, -0.0005868082516826689, -0.0005710444529540837, -0.0005552805960178375, -0.0005395167972892523, -0.0005237529403530061, -0.0005079891416244209, -0.0004922252846881747, -0.0004764614859595895, -0.0004606976290233433, -0.0004449338011909276, -0.0004291699733585119, -0.00041340611642226577, -0.00039764228858985007, -0.00038187846075743437, -0.00036611463292501867, -0.00035035080509260297, -0.0003345869481563568, -0.0003188231203239411, -0.0003030592924915254, -0.0002872954646591097, -0.000271531636826694, -0.0002557678089942783, -0.00024000396660994738, -0.00022424013877753168, -0.00020847631094511598, -0.00019271246856078506, -0.00017694864072836936, -0.0001611847837921232, -0.0001454209559597075, -0.0001296571281272918, -0.00011389328574296087, -9.812945791054517e-05, -8.236563007812947e-05, -6.660179496975616e-05, -5.083795986138284e-05, -3.507413202896714e-05, -1.9310300558572635e-05, -3.546469088178128e-06, 1.2217362382216379e-05, 2.7981193852610886e-05, 4.3745021685026586e-05, 5.95088567933999e-05, 7.527269190177321e-05, 9.103651973418891e-05, 0.00010680034756660461, 0.00012256417539902031, 0.00013832801778335124, 0.00015409184561576694, 0.00016985567344818264, 0.00018561951583251357, 0.00020138334366492927, 0.00021714717149734497, 0.00023291099932976067, 0.00024867482716217637, 0.00026443865499459207, 0.00028020248282700777, 0.00029596633976325393, 0.00031173016759566963, 0.00032749399542808533, 0.00034325782326050103]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 14.0, 13.0, 14.0, 23.0, 29.0, 40.0, 24.0, 32.0, 31.0, 33.0, 35.0, 41.0, 44.0, 39.0, 52.0, 47.0, 43.0, 37.0, 48.0, 42.0, 41.0, 45.0, 33.0, 24.0, 25.0, 17.0, 21.0, 19.0, 17.0, 15.0, 18.0, 6.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019800662994384766, -0.00019209552556276321, -0.00018618442118167877, -0.00018027331680059433, -0.0001743622124195099, -0.00016845110803842545, -0.000162540003657341, -0.00015662889927625656, -0.00015071779489517212, -0.00014480669051408768, -0.00013889558613300323, -0.0001329844817519188, -0.00012707337737083435, -0.00012116227298974991, -0.00011525116860866547, -0.00010934006422758102, -0.00010342895984649658, -9.751785546541214e-05, -9.16067510843277e-05, -8.569564670324326e-05, -7.978454232215881e-05, -7.387343794107437e-05, -6.796233355998993e-05, -6.205122917890549e-05, -5.6140124797821045e-05, -5.02290204167366e-05, -4.431791603565216e-05, -3.840681165456772e-05, -3.2495707273483276e-05, -2.6584602892398834e-05, -2.0673498511314392e-05, -1.476239413022995e-05, -8.851289749145508e-06, -2.9401853680610657e-06, 2.9709190130233765e-06, 8.882023394107819e-06, 1.479312777519226e-05, 2.0704232156276703e-05, 2.6615336537361145e-05, 3.252644091844559e-05, 3.843754529953003e-05, 4.434864968061447e-05, 5.0259754061698914e-05, 5.6170858442783356e-05, 6.20819628238678e-05, 6.799306720495224e-05, 7.390417158603668e-05, 7.981527596712112e-05, 8.572638034820557e-05, 9.163748472929001e-05, 9.754858911037445e-05, 0.00010345969349145889, 0.00010937079787254333, 0.00011528190225362778, 0.00012119300663471222, 0.00012710411101579666, 0.0001330152153968811, 0.00013892631977796555, 0.00014483742415905, 0.00015074852854013443, 0.00015665963292121887, 0.00016257073730230331, 0.00016848184168338776, 0.0001743929460644722, 0.00018030405044555664]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 2.0, 4.0, 5.0, 11.0, 10.0, 5.0, 10.0, 12.0, 17.0, 17.0, 17.0, 22.0, 20.0, 24.0, 28.0, 29.0, 42.0, 34.0, 34.0, 41.0, 42.0, 34.0, 47.0, 37.0, 52.0, 34.0, 37.0, 36.0, 31.0, 28.0, 30.0, 30.0, 26.0, 25.0, 24.0, 18.0, 19.0, 13.0, 11.0, 10.0, 5.0, 8.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.24609375, -2.181304931640625, -2.11651611328125, -2.051727294921875, -1.9869384765625, -1.922149658203125, -1.85736083984375, -1.792572021484375, -1.727783203125, -1.662994384765625, -1.59820556640625, -1.533416748046875, -1.4686279296875, -1.403839111328125, -1.33905029296875, -1.274261474609375, -1.20947265625, -1.144683837890625, -1.07989501953125, -1.015106201171875, -0.9503173828125, -0.885528564453125, -0.82073974609375, -0.755950927734375, -0.691162109375, -0.626373291015625, -0.56158447265625, -0.496795654296875, -0.4320068359375, -0.367218017578125, -0.30242919921875, -0.237640380859375, -0.1728515625, -0.108062744140625, -0.04327392578125, 0.021514892578125, 0.0863037109375, 0.151092529296875, 0.21588134765625, 0.280670166015625, 0.345458984375, 0.410247802734375, 0.47503662109375, 0.539825439453125, 0.6046142578125, 0.669403076171875, 0.73419189453125, 0.798980712890625, 0.86376953125, 0.928558349609375, 0.99334716796875, 1.058135986328125, 1.1229248046875, 1.187713623046875, 1.25250244140625, 1.317291259765625, 1.382080078125, 1.446868896484375, 1.51165771484375, 1.576446533203125, 1.6412353515625, 1.706024169921875, 1.77081298828125, 1.835601806640625, 1.900390625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 11.0, 8.0, 8.0, 16.0, 22.0, 26.0, 28.0, 57.0, 77.0, 91.0, 152.0, 196.0, 300.0, 491.0, 735.0, 1340.0, 2391.0, 4972.0, 10795.0, 26071.0, 67104.0, 180994.0, 358462.0, 240334.0, 91825.0, 34587.0, 14164.0, 6149.0, 2951.0, 1621.0, 924.0, 545.0, 337.0, 237.0, 170.0, 116.0, 61.0, 49.0, 47.0, 26.0, 19.0, 11.0, 21.0, 8.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.427734375, -2.348541259765625, -2.26934814453125, -2.190155029296875, -2.1109619140625, -2.031768798828125, -1.95257568359375, -1.873382568359375, -1.794189453125, -1.714996337890625, -1.63580322265625, -1.556610107421875, -1.4774169921875, -1.398223876953125, -1.31903076171875, -1.239837646484375, -1.16064453125, -1.081451416015625, -1.00225830078125, -0.923065185546875, -0.8438720703125, -0.764678955078125, -0.68548583984375, -0.606292724609375, -0.527099609375, -0.447906494140625, -0.36871337890625, -0.289520263671875, -0.2103271484375, -0.131134033203125, -0.05194091796875, 0.027252197265625, 0.1064453125, 0.185638427734375, 0.26483154296875, 0.344024658203125, 0.4232177734375, 0.502410888671875, 0.58160400390625, 0.660797119140625, 0.739990234375, 0.819183349609375, 0.89837646484375, 0.977569580078125, 1.0567626953125, 1.135955810546875, 1.21514892578125, 1.294342041015625, 1.37353515625, 1.452728271484375, 1.53192138671875, 1.611114501953125, 1.6903076171875, 1.769500732421875, 1.84869384765625, 1.927886962890625, 2.007080078125, 2.086273193359375, 2.16546630859375, 2.244659423828125, 2.3238525390625, 2.403045654296875, 2.48223876953125, 2.561431884765625, 2.640625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 10.0, 11.0, 5.0, 15.0, 11.0, 11.0, 15.0, 8.0, 22.0, 21.0, 23.0, 32.0, 30.0, 40.0, 36.0, 34.0, 47.0, 44.0, 81.0, 191.0, 1484.0, 290.0, 122.0, 72.0, 50.0, 36.0, 31.0, 31.0, 32.0, 27.0, 24.0, 24.0, 27.0, 17.0, 16.0, 12.0, 12.0, 7.0, 13.0, 8.0, 8.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-7.12890625, -6.91741943359375, -6.7059326171875, -6.49444580078125, -6.282958984375, -6.07147216796875, -5.8599853515625, -5.64849853515625, -5.43701171875, -5.22552490234375, -5.0140380859375, -4.80255126953125, -4.591064453125, -4.37957763671875, -4.1680908203125, -3.95660400390625, -3.7451171875, -3.53363037109375, -3.3221435546875, -3.11065673828125, -2.899169921875, -2.68768310546875, -2.4761962890625, -2.26470947265625, -2.05322265625, -1.84173583984375, -1.6302490234375, -1.41876220703125, -1.207275390625, -0.99578857421875, -0.7843017578125, -0.57281494140625, -0.361328125, -0.14984130859375, 0.0616455078125, 0.27313232421875, 0.484619140625, 0.69610595703125, 0.9075927734375, 1.11907958984375, 1.33056640625, 1.54205322265625, 1.7535400390625, 1.96502685546875, 2.176513671875, 2.38800048828125, 2.5994873046875, 2.81097412109375, 3.0224609375, 3.23394775390625, 3.4454345703125, 3.65692138671875, 3.868408203125, 4.07989501953125, 4.2913818359375, 4.50286865234375, 4.71435546875, 4.92584228515625, 5.1373291015625, 5.34881591796875, 5.560302734375, 5.77178955078125, 5.9832763671875, 6.19476318359375, 6.40625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 4.0, 5.0, 10.0, 16.0, 13.0, 11.0, 22.0, 13.0, 26.0, 30.0, 30.0, 43.0, 59.0, 87.0, 116.0, 226.0, 434.0, 1501.0, 18089.0, 2853192.0, 266078.0, 3944.0, 809.0, 303.0, 181.0, 105.0, 63.0, 60.0, 43.0, 33.0, 24.0, 23.0, 9.0, 16.0, 16.0, 16.0, 9.0, 7.0, 7.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-13.9765625, -13.5069580078125, -13.037353515625, -12.5677490234375, -12.09814453125, -11.6285400390625, -11.158935546875, -10.6893310546875, -10.2197265625, -9.7501220703125, -9.280517578125, -8.8109130859375, -8.34130859375, -7.8717041015625, -7.402099609375, -6.9324951171875, -6.462890625, -5.9932861328125, -5.523681640625, -5.0540771484375, -4.58447265625, -4.1148681640625, -3.645263671875, -3.1756591796875, -2.7060546875, -2.2364501953125, -1.766845703125, -1.2972412109375, -0.82763671875, -0.3580322265625, 0.111572265625, 0.5811767578125, 1.05078125, 1.5203857421875, 1.989990234375, 2.4595947265625, 2.92919921875, 3.3988037109375, 3.868408203125, 4.3380126953125, 4.8076171875, 5.2772216796875, 5.746826171875, 6.2164306640625, 6.68603515625, 7.1556396484375, 7.625244140625, 8.0948486328125, 8.564453125, 9.0340576171875, 9.503662109375, 9.9732666015625, 10.44287109375, 10.9124755859375, 11.382080078125, 11.8516845703125, 12.3212890625, 12.7908935546875, 13.260498046875, 13.7301025390625, 14.19970703125, 14.6693115234375, 15.138916015625, 15.6085205078125, 16.078125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 58.0, 509.0, 403.0, 40.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.01401901245117, -45.538883209228516, -44.06374740600586, -42.58860778808594, -41.11347198486328, -39.638336181640625, -38.16320037841797, -36.68806457519531, -35.212928771972656, -33.73779296875, -32.262657165527344, -30.787519454956055, -29.3123836517334, -27.83724594116211, -26.362110137939453, -24.886974334716797, -23.411836624145508, -21.93670082092285, -20.461563110351562, -18.986427307128906, -17.51129150390625, -16.036155700683594, -14.561017990112305, -13.085882186889648, -11.610745429992676, -10.135608673095703, -8.660472869873047, -7.185336112976074, -5.71019983291626, -4.235063552856445, -2.7599267959594727, -1.2847909927368164, 0.19034576416015625, 1.6654821634292603, 3.1406185626983643, 4.615755081176758, 6.090891361236572, 7.566027641296387, 9.04116439819336, 10.516300201416016, 11.991436958312988, 13.466573715209961, 14.941709518432617, 16.416847229003906, 17.891983032226562, 19.36711883544922, 20.842254638671875, 22.31739044189453, 23.79252815246582, 25.267663955688477, 26.742801666259766, 28.217937469482422, 29.693073272705078, 31.168209075927734, 32.643348693847656, 34.11848449707031, 35.59362030029297, 37.068756103515625, 38.54389190673828, 40.01902770996094, 41.49416732788086, 42.969303131103516, 44.44443893432617, 45.91957473754883, 47.394710540771484]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 4.0, 7.0, 16.0, 15.0, 20.0, 11.0, 22.0, 15.0, 24.0, 24.0, 28.0, 43.0, 38.0, 35.0, 39.0, 40.0, 33.0, 57.0, 38.0, 48.0, 30.0, 32.0, 50.0, 34.0, 39.0, 33.0, 21.0, 31.0, 18.0, 21.0, 22.0, 15.0, 14.0, 13.0, 9.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.036022186279297, -19.33404541015625, -18.632070541381836, -17.93009376525879, -17.228116989135742, -16.526142120361328, -15.824165344238281, -15.12218952178955, -14.42021369934082, -13.71823787689209, -13.016261100769043, -12.314285278320312, -11.612309455871582, -10.910333633422852, -10.208356857299805, -9.506381034851074, -8.804404258728027, -8.102428436279297, -7.400452136993408, -6.6984758377075195, -5.996500015258789, -5.2945237159729, -4.592547416687012, -3.8905715942382812, -3.1885952949523926, -2.486619234085083, -1.7846430540084839, -1.0826668739318848, -0.3806908130645752, 0.3212852478027344, 1.023261547088623, 1.7252373695373535, 2.427213668823242, 3.1291897296905518, 3.8311657905578613, 4.53314208984375, 5.2351179122924805, 5.937094211578369, 6.639070510864258, 7.341046333312988, 8.043022155761719, 8.74499797821045, 9.446974754333496, 10.148950576782227, 10.850926399230957, 11.552902221679688, 12.254878997802734, 12.956854820251465, 13.658831596374512, 14.360807418823242, 15.062784194946289, 15.76476001739502, 16.46673583984375, 17.168712615966797, 17.870689392089844, 18.572664260864258, 19.274641036987305, 19.97661781311035, 20.678592681884766, 21.380569458007812, 22.08254623413086, 22.784521102905273, 23.48649787902832, 24.188472747802734, 24.89044952392578]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 7.0, 7.0, 9.0, 7.0, 7.0, 10.0, 24.0, 20.0, 16.0, 27.0, 21.0, 17.0, 32.0, 38.0, 35.0, 27.0, 42.0, 45.0, 36.0, 51.0, 40.0, 43.0, 33.0, 42.0, 30.0, 43.0, 23.0, 30.0, 37.0, 29.0, 23.0, 36.0, 16.0, 12.0, 18.0, 9.0, 14.0, 11.0, 3.0, 4.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.287109375, -2.218719482421875, -2.15032958984375, -2.081939697265625, -2.0135498046875, -1.945159912109375, -1.87677001953125, -1.808380126953125, -1.739990234375, -1.671600341796875, -1.60321044921875, -1.534820556640625, -1.4664306640625, -1.398040771484375, -1.32965087890625, -1.261260986328125, -1.19287109375, -1.124481201171875, -1.05609130859375, -0.987701416015625, -0.9193115234375, -0.850921630859375, -0.78253173828125, -0.714141845703125, -0.645751953125, -0.577362060546875, -0.50897216796875, -0.440582275390625, -0.3721923828125, -0.303802490234375, -0.23541259765625, -0.167022705078125, -0.0986328125, -0.030242919921875, 0.03814697265625, 0.106536865234375, 0.1749267578125, 0.243316650390625, 0.31170654296875, 0.380096435546875, 0.448486328125, 0.516876220703125, 0.58526611328125, 0.653656005859375, 0.7220458984375, 0.790435791015625, 0.85882568359375, 0.927215576171875, 0.99560546875, 1.063995361328125, 1.13238525390625, 1.200775146484375, 1.2691650390625, 1.337554931640625, 1.40594482421875, 1.474334716796875, 1.542724609375, 1.611114501953125, 1.67950439453125, 1.747894287109375, 1.8162841796875, 1.884674072265625, 1.95306396484375, 2.021453857421875, 2.08984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 9.0, 6.0, 10.0, 17.0, 15.0, 20.0, 32.0, 33.0, 58.0, 70.0, 101.0, 171.0, 299.0, 550.0, 1208.0, 4214.0, 23852.0, 268217.0, 2564993.0, 1231429.0, 84415.0, 10376.0, 2254.0, 813.0, 437.0, 199.0, 129.0, 86.0, 62.0, 42.0, 36.0, 30.0, 12.0, 12.0, 14.0, 14.0, 7.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3359375, -7.1187744140625, -6.901611328125, -6.6844482421875, -6.46728515625, -6.2501220703125, -6.032958984375, -5.8157958984375, -5.5986328125, -5.3814697265625, -5.164306640625, -4.9471435546875, -4.72998046875, -4.5128173828125, -4.295654296875, -4.0784912109375, -3.861328125, -3.6441650390625, -3.427001953125, -3.2098388671875, -2.99267578125, -2.7755126953125, -2.558349609375, -2.3411865234375, -2.1240234375, -1.9068603515625, -1.689697265625, -1.4725341796875, -1.25537109375, -1.0382080078125, -0.821044921875, -0.6038818359375, -0.38671875, -0.1695556640625, 0.047607421875, 0.2647705078125, 0.48193359375, 0.6990966796875, 0.916259765625, 1.1334228515625, 1.3505859375, 1.5677490234375, 1.784912109375, 2.0020751953125, 2.21923828125, 2.4364013671875, 2.653564453125, 2.8707275390625, 3.087890625, 3.3050537109375, 3.522216796875, 3.7393798828125, 3.95654296875, 4.1737060546875, 4.390869140625, 4.6080322265625, 4.8251953125, 5.0423583984375, 5.259521484375, 5.4766845703125, 5.69384765625, 5.9110107421875, 6.128173828125, 6.3453369140625, 6.5625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 15.0, 16.0, 25.0, 32.0, 49.0, 69.0, 122.0, 164.0, 241.0, 307.0, 419.0, 507.0, 547.0, 443.0, 307.0, 250.0, 149.0, 114.0, 95.0, 54.0, 52.0, 27.0, 19.0, 14.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.390625, -11.11346435546875, -10.8363037109375, -10.55914306640625, -10.281982421875, -10.00482177734375, -9.7276611328125, -9.45050048828125, -9.17333984375, -8.89617919921875, -8.6190185546875, -8.34185791015625, -8.064697265625, -7.78753662109375, -7.5103759765625, -7.23321533203125, -6.9560546875, -6.67889404296875, -6.4017333984375, -6.12457275390625, -5.847412109375, -5.57025146484375, -5.2930908203125, -5.01593017578125, -4.73876953125, -4.46160888671875, -4.1844482421875, -3.90728759765625, -3.630126953125, -3.35296630859375, -3.0758056640625, -2.79864501953125, -2.521484375, -2.24432373046875, -1.9671630859375, -1.69000244140625, -1.412841796875, -1.13568115234375, -0.8585205078125, -0.58135986328125, -0.30419921875, -0.02703857421875, 0.2501220703125, 0.52728271484375, 0.804443359375, 1.08160400390625, 1.3587646484375, 1.63592529296875, 1.9130859375, 2.19024658203125, 2.4674072265625, 2.74456787109375, 3.021728515625, 3.29888916015625, 3.5760498046875, 3.85321044921875, 4.13037109375, 4.40753173828125, 4.6846923828125, 4.96185302734375, 5.239013671875, 5.51617431640625, 5.7933349609375, 6.07049560546875, 6.34765625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 7.0, 8.0, 15.0, 29.0, 25.0, 28.0, 56.0, 79.0, 117.0, 196.0, 353.0, 856.0, 4504.0, 241963.0, 3889173.0, 53028.0, 2395.0, 630.0, 262.0, 177.0, 120.0, 74.0, 55.0, 40.0, 24.0, 26.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.674560546875, -14.86474609375, -14.054931640625, -13.2451171875, -12.435302734375, -11.62548828125, -10.815673828125, -10.005859375, -9.196044921875, -8.38623046875, -7.576416015625, -6.7666015625, -5.956787109375, -5.14697265625, -4.337158203125, -3.52734375, -2.717529296875, -1.90771484375, -1.097900390625, -0.2880859375, 0.521728515625, 1.33154296875, 2.141357421875, 2.951171875, 3.760986328125, 4.57080078125, 5.380615234375, 6.1904296875, 7.000244140625, 7.81005859375, 8.619873046875, 9.4296875, 10.239501953125, 11.04931640625, 11.859130859375, 12.6689453125, 13.478759765625, 14.28857421875, 15.098388671875, 15.908203125, 16.718017578125, 17.52783203125, 18.337646484375, 19.1474609375, 19.957275390625, 20.76708984375, 21.576904296875, 22.38671875, 23.196533203125, 24.00634765625, 24.816162109375, 25.6259765625, 26.435791015625, 27.24560546875, 28.055419921875, 28.865234375, 29.675048828125, 30.48486328125, 31.294677734375, 32.1044921875, 32.914306640625, 33.72412109375, 34.533935546875, 35.34375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 30.0, 85.0, 171.0, 259.0, 232.0, 139.0, 60.0, 20.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.64305114746094, -80.0042495727539, -78.36544799804688, -76.72663879394531, -75.08783721923828, -73.44903564453125, -71.81023406982422, -70.17143249511719, -68.53262329101562, -66.8938217163086, -65.25502014160156, -63.616214752197266, -61.97740936279297, -60.33860778808594, -58.699806213378906, -57.061004638671875, -55.422203063964844, -53.78340148925781, -52.144596099853516, -50.505794525146484, -48.86698913574219, -47.228187561035156, -45.589385986328125, -43.950584411621094, -42.3117790222168, -40.672977447509766, -39.03417205810547, -37.39537048339844, -35.756568908691406, -34.11776351928711, -32.47896194458008, -30.840158462524414, -29.201351165771484, -27.56254768371582, -25.923744201660156, -24.284942626953125, -22.64613914489746, -21.007335662841797, -19.368534088134766, -17.7297306060791, -16.090927124023438, -14.452123641967773, -12.813321113586426, -11.174518585205078, -9.535715103149414, -7.89691162109375, -6.258109092712402, -4.619306564331055, -2.9805030822753906, -1.3417000770568848, 0.2971029281616211, 1.935905933380127, 3.574708938598633, 5.213512420654297, 6.8523149490356445, 8.491117477416992, 10.129920959472656, 11.76872444152832, 13.407526969909668, 15.046329498291016, 16.68513298034668, 18.323936462402344, 19.962738037109375, 21.60154151916504, 23.240345001220703]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 12.0, 14.0, 12.0, 18.0, 17.0, 15.0, 15.0, 25.0, 34.0, 26.0, 36.0, 45.0, 39.0, 38.0, 34.0, 41.0, 39.0, 52.0, 29.0, 51.0, 38.0, 34.0, 38.0, 27.0, 35.0, 23.0, 30.0, 23.0, 24.0, 17.0, 18.0, 11.0, 19.0, 17.0, 17.0, 8.0, 2.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.884597778320312, -25.114299774169922, -24.34400177001953, -23.57370376586914, -22.803407669067383, -22.033109664916992, -21.2628116607666, -20.49251365661621, -19.722217559814453, -18.951919555664062, -18.181621551513672, -17.41132354736328, -16.641027450561523, -15.870729446411133, -15.100431442260742, -14.330133438110352, -13.559835433959961, -12.78953742980957, -12.019240379333496, -11.248942375183105, -10.478645324707031, -9.70834732055664, -8.93804931640625, -8.16775131225586, -7.397454261779785, -6.627156734466553, -5.85685920715332, -5.08656120300293, -4.316263675689697, -3.545966148376465, -2.775668144226074, -2.005370616912842, -1.2350730895996094, -0.4647754430770874, 0.30552220344543457, 1.075819969177246, 1.8461174964904785, 2.616415023803711, 3.3867130279541016, 4.157010555267334, 4.927308082580566, 5.697605609893799, 6.467903137207031, 7.238201141357422, 8.008499145507812, 8.778796195983887, 9.549094200134277, 10.319391250610352, 11.089689254760742, 11.859987258911133, 12.630284309387207, 13.400582313537598, 14.170879364013672, 14.941177368164062, 15.711475372314453, 16.481773376464844, 17.252071380615234, 18.022369384765625, 18.792667388916016, 19.562965393066406, 20.333261489868164, 21.103559494018555, 21.873857498168945, 22.644155502319336, 23.414451599121094]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 11.0, 18.0, 17.0, 16.0, 26.0, 17.0, 29.0, 27.0, 30.0, 26.0, 32.0, 25.0, 31.0, 32.0, 35.0, 52.0, 45.0, 38.0, 46.0, 29.0, 28.0, 38.0, 35.0, 26.0, 37.0, 25.0, 22.0, 16.0, 23.0, 23.0, 19.0, 14.0, 12.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.142578125, -2.0771484375, -2.01171875, -1.9462890625, -1.880859375, -1.8154296875, -1.75, -1.6845703125, -1.619140625, -1.5537109375, -1.48828125, -1.4228515625, -1.357421875, -1.2919921875, -1.2265625, -1.1611328125, -1.095703125, -1.0302734375, -0.96484375, -0.8994140625, -0.833984375, -0.7685546875, -0.703125, -0.6376953125, -0.572265625, -0.5068359375, -0.44140625, -0.3759765625, -0.310546875, -0.2451171875, -0.1796875, -0.1142578125, -0.048828125, 0.0166015625, 0.08203125, 0.1474609375, 0.212890625, 0.2783203125, 0.34375, 0.4091796875, 0.474609375, 0.5400390625, 0.60546875, 0.6708984375, 0.736328125, 0.8017578125, 0.8671875, 0.9326171875, 0.998046875, 1.0634765625, 1.12890625, 1.1943359375, 1.259765625, 1.3251953125, 1.390625, 1.4560546875, 1.521484375, 1.5869140625, 1.65234375, 1.7177734375, 1.783203125, 1.8486328125, 1.9140625, 1.9794921875, 2.044921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 0.0, 8.0, 8.0, 12.0, 28.0, 43.0, 52.0, 78.0, 67.0, 149.0, 214.0, 303.0, 449.0, 602.0, 918.0, 1290.0, 1835.0, 2572.0, 3776.0, 5451.0, 7865.0, 11103.0, 16003.0, 22976.0, 33099.0, 48983.0, 74074.0, 122274.0, 275982.0, 154242.0, 85526.0, 55614.0, 37714.0, 25923.0, 18035.0, 12540.0, 8620.0, 6081.0, 4283.0, 2990.0, 2037.0, 1488.0, 1006.0, 626.0, 486.0, 373.0, 252.0, 158.0, 123.0, 73.0, 56.0, 35.0, 26.0, 15.0, 15.0, 3.0, 4.0, 2.0, 2.0, 4.0], "bins": [-0.43408203125, -0.4207916259765625, -0.407501220703125, -0.3942108154296875, -0.38092041015625, -0.3676300048828125, -0.354339599609375, -0.3410491943359375, -0.3277587890625, -0.3144683837890625, -0.301177978515625, -0.2878875732421875, -0.27459716796875, -0.2613067626953125, -0.248016357421875, -0.2347259521484375, -0.221435546875, -0.2081451416015625, -0.194854736328125, -0.1815643310546875, -0.16827392578125, -0.1549835205078125, -0.141693115234375, -0.1284027099609375, -0.1151123046875, -0.1018218994140625, -0.088531494140625, -0.0752410888671875, -0.06195068359375, -0.0486602783203125, -0.035369873046875, -0.0220794677734375, -0.0087890625, 0.0045013427734375, 0.017791748046875, 0.0310821533203125, 0.04437255859375, 0.0576629638671875, 0.070953369140625, 0.0842437744140625, 0.0975341796875, 0.1108245849609375, 0.124114990234375, 0.1374053955078125, 0.15069580078125, 0.1639862060546875, 0.177276611328125, 0.1905670166015625, 0.203857421875, 0.2171478271484375, 0.230438232421875, 0.2437286376953125, 0.25701904296875, 0.2703094482421875, 0.283599853515625, 0.2968902587890625, 0.3101806640625, 0.3234710693359375, 0.336761474609375, 0.3500518798828125, 0.36334228515625, 0.3766326904296875, 0.389923095703125, 0.4032135009765625, 0.41650390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 10.0, 17.0, 17.0, 10.0, 17.0, 20.0, 15.0, 29.0, 37.0, 32.0, 39.0, 40.0, 46.0, 50.0, 42.0, 50.0, 1066.0, 44.0, 52.0, 38.0, 41.0, 41.0, 33.0, 40.0, 29.0, 28.0, 26.0, 12.0, 17.0, 8.0, 16.0, 15.0, 8.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5205078125, -1.4700469970703125, -1.419586181640625, -1.3691253662109375, -1.31866455078125, -1.2682037353515625, -1.217742919921875, -1.1672821044921875, -1.1168212890625, -1.0663604736328125, -1.015899658203125, -0.9654388427734375, -0.91497802734375, -0.8645172119140625, -0.814056396484375, -0.7635955810546875, -0.713134765625, -0.6626739501953125, -0.612213134765625, -0.5617523193359375, -0.51129150390625, -0.4608306884765625, -0.410369873046875, -0.3599090576171875, -0.3094482421875, -0.2589874267578125, -0.208526611328125, -0.1580657958984375, -0.10760498046875, -0.0571441650390625, -0.006683349609375, 0.0437774658203125, 0.09423828125, 0.1446990966796875, 0.195159912109375, 0.2456207275390625, 0.29608154296875, 0.3465423583984375, 0.397003173828125, 0.4474639892578125, 0.4979248046875, 0.5483856201171875, 0.598846435546875, 0.6493072509765625, 0.69976806640625, 0.7502288818359375, 0.800689697265625, 0.8511505126953125, 0.901611328125, 0.9520721435546875, 1.002532958984375, 1.0529937744140625, 1.10345458984375, 1.1539154052734375, 1.204376220703125, 1.2548370361328125, 1.3052978515625, 1.3557586669921875, 1.406219482421875, 1.4566802978515625, 1.50714111328125, 1.5576019287109375, 1.608062744140625, 1.6585235595703125, 1.708984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 10.0, 8.0, 23.0, 31.0, 47.0, 69.0, 135.0, 161.0, 260.0, 436.0, 705.0, 1048.0, 1789.0, 2989.0, 5023.0, 8514.0, 14697.0, 26479.0, 49534.0, 99318.0, 256068.0, 1390665.0, 113411.0, 56340.0, 29762.0, 16383.0, 9382.0, 5355.0, 3346.0, 1882.0, 1207.0, 713.0, 501.0, 269.0, 180.0, 141.0, 72.0, 57.0, 42.0, 21.0, 16.0, 13.0, 9.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6962890625, -0.6758651733398438, -0.6554412841796875, -0.6350173950195312, -0.614593505859375, -0.5941696166992188, -0.5737457275390625, -0.5533218383789062, -0.53289794921875, -0.5124740600585938, -0.4920501708984375, -0.47162628173828125, -0.451202392578125, -0.43077850341796875, -0.4103546142578125, -0.38993072509765625, -0.3695068359375, -0.34908294677734375, -0.3286590576171875, -0.30823516845703125, -0.287811279296875, -0.26738739013671875, -0.2469635009765625, -0.22653961181640625, -0.20611572265625, -0.18569183349609375, -0.1652679443359375, -0.14484405517578125, -0.124420166015625, -0.10399627685546875, -0.0835723876953125, -0.06314849853515625, -0.042724609375, -0.02230072021484375, -0.0018768310546875, 0.01854705810546875, 0.038970947265625, 0.05939483642578125, 0.0798187255859375, 0.10024261474609375, 0.12066650390625, 0.14109039306640625, 0.1615142822265625, 0.18193817138671875, 0.202362060546875, 0.22278594970703125, 0.2432098388671875, 0.26363372802734375, 0.2840576171875, 0.30448150634765625, 0.3249053955078125, 0.34532928466796875, 0.365753173828125, 0.38617706298828125, 0.4066009521484375, 0.42702484130859375, 0.44744873046875, 0.46787261962890625, 0.4882965087890625, 0.5087203979492188, 0.529144287109375, 0.5495681762695312, 0.5699920654296875, 0.5904159545898438, 0.61083984375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 11.0, 10.0, 13.0, 20.0, 28.0, 27.0, 39.0, 41.0, 57.0, 65.0, 74.0, 89.0, 95.0, 87.0, 70.0, 39.0, 40.0, 25.0, 29.0, 16.0, 23.0, 16.0, 9.0, 12.0, 7.0, 13.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0003712177276611328, -0.00035952404141426086, -0.0003478303551673889, -0.00033613666892051697, -0.000324442982673645, -0.00031274929642677307, -0.0003010556101799011, -0.0002893619239330292, -0.0002776682376861572, -0.0002659745514392853, -0.00025428086519241333, -0.00024258717894554138, -0.00023089349269866943, -0.00021919980645179749, -0.00020750612020492554, -0.0001958124339580536, -0.00018411874771118164, -0.0001724250614643097, -0.00016073137521743774, -0.0001490376889705658, -0.00013734400272369385, -0.0001256503164768219, -0.00011395663022994995, -0.000102262943983078, -9.056925773620605e-05, -7.88755714893341e-05, -6.718188524246216e-05, -5.548819899559021e-05, -4.379451274871826e-05, -3.2100826501846313e-05, -2.0407140254974365e-05, -8.713454008102417e-06, 2.9802322387695312e-06, 1.467391848564148e-05, 2.6367604732513428e-05, 3.8061290979385376e-05, 4.9754977226257324e-05, 6.144866347312927e-05, 7.314234972000122e-05, 8.483603596687317e-05, 9.652972221374512e-05, 0.00010822340846061707, 0.00011991709470748901, 0.00013161078095436096, 0.0001433044672012329, 0.00015499815344810486, 0.0001666918396949768, 0.00017838552594184875, 0.0001900792121887207, 0.00020177289843559265, 0.0002134665846824646, 0.00022516027092933655, 0.0002368539571762085, 0.00024854764342308044, 0.0002602413296699524, 0.00027193501591682434, 0.0002836287021636963, 0.00029532238841056824, 0.0003070160746574402, 0.00031870976090431213, 0.0003304034471511841, 0.00034209713339805603, 0.000353790819644928, 0.0003654845058917999, 0.0003771781921386719]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 6.0, 11.0, 9.0, 28.0, 27.0, 35.0, 42.0, 46.0, 76.0, 112.0, 148.0, 269.0, 580.0, 4417.0, 1032769.0, 8476.0, 562.0, 312.0, 190.0, 101.0, 81.0, 47.0, 49.0, 35.0, 31.0, 22.0, 11.0, 9.0, 9.0, 6.0, 7.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00824737548828125, -0.00799405574798584, -0.00774073600769043, -0.0074874162673950195, -0.007234096527099609, -0.006980776786804199, -0.006727457046508789, -0.006474137306213379, -0.006220817565917969, -0.005967497825622559, -0.0057141780853271484, -0.005460858345031738, -0.005207538604736328, -0.004954218864440918, -0.004700899124145508, -0.004447579383850098, -0.0041942596435546875, -0.003940939903259277, -0.003687620162963867, -0.003434300422668457, -0.003180980682373047, -0.0029276609420776367, -0.0026743412017822266, -0.0024210214614868164, -0.0021677017211914062, -0.001914381980895996, -0.001661062240600586, -0.0014077425003051758, -0.0011544227600097656, -0.0009011030197143555, -0.0006477832794189453, -0.00039446353912353516, -0.000141143798828125, 0.00011217594146728516, 0.0003654956817626953, 0.0006188154220581055, 0.0008721351623535156, 0.0011254549026489258, 0.001378774642944336, 0.001632094383239746, 0.0018854141235351562, 0.0021387338638305664, 0.0023920536041259766, 0.0026453733444213867, 0.002898693084716797, 0.003152012825012207, 0.003405332565307617, 0.0036586523056030273, 0.0039119720458984375, 0.004165291786193848, 0.004418611526489258, 0.004671931266784668, 0.004925251007080078, 0.005178570747375488, 0.0054318904876708984, 0.005685210227966309, 0.005938529968261719, 0.006191849708557129, 0.006445169448852539, 0.006698489189147949, 0.006951808929443359, 0.0072051286697387695, 0.00745844841003418, 0.00771176815032959, 0.007965087890625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 10.0, 158.0, 583.0, 241.0, 21.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011593077797442675, -0.0011284862412139773, -0.0010976645862683654, -0.0010668430477380753, -0.0010360213927924633, -0.0010051998542621732, -0.0009743782575242221, -0.0009435566607862711, -0.0009127350640483201, -0.000881913467310369, -0.000851091870572418, -0.0008202702738344669, -0.0007894487353041768, -0.0007586270803585649, -0.0007278055418282747, -0.0006969839450903237, -0.0006661623483523726, -0.0006353407516144216, -0.0006045191548764706, -0.0005736975581385195, -0.0005428759614005685, -0.0005120544228702784, -0.0004812328261323273, -0.0004504112293943763, -0.00041958963265642524, -0.0003887680359184742, -0.00035794643918052316, -0.0003271248715464026, -0.00029630327480845153, -0.0002654816780705005, -0.00023466009588446468, -0.00020383851369842887, -0.00017301685875281692, -0.00014219526201486588, -0.00011137367982883006, -8.055209036683664e-05, -4.973050090484321e-05, -1.890890416689217e-05, 1.1912678019143641e-05, 4.273426020517945e-05, 7.355585694313049e-05, 0.00010437744640512392, 0.00013519903586711735, 0.00016602061805315316, 0.0001968422147911042, 0.00022766381152905524, 0.0002584853791631758, 0.00028930697590112686, 0.0003201285726390779, 0.00035095016937702894, 0.00038177176611498, 0.00041259333374910057, 0.0004434149304870516, 0.00047423652722500265, 0.0005050580948591232, 0.0005358796915970743, 0.0005667012883350253, 0.0005975228850729764, 0.0006283444818109274, 0.0006591660785488784, 0.0006899876752868295, 0.0007208092138171196, 0.0007516308105550706, 0.0007824524072930217, 0.0008132740040309727]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 7.0, 5.0, 6.0, 7.0, 18.0, 13.0, 13.0, 20.0, 12.0, 25.0, 16.0, 27.0, 32.0, 36.0, 30.0, 28.0, 28.0, 42.0, 28.0, 41.0, 36.0, 32.0, 34.0, 31.0, 39.0, 37.0, 30.0, 28.0, 42.0, 26.0, 27.0, 17.0, 34.0, 22.0, 16.0, 16.0, 9.0, 14.0, 17.0, 13.0, 12.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00016307830810546875, -0.00015824567526578903, -0.00015341304242610931, -0.0001485804095864296, -0.00014374777674674988, -0.00013891514390707016, -0.00013408251106739044, -0.00012924987822771072, -0.000124417245388031, -0.00011958461254835129, -0.00011475197970867157, -0.00010991934686899185, -0.00010508671402931213, -0.00010025408118963242, -9.54214483499527e-05, -9.058881551027298e-05, -8.575618267059326e-05, -8.092354983091354e-05, -7.609091699123383e-05, -7.125828415155411e-05, -6.642565131187439e-05, -6.159301847219467e-05, -5.6760385632514954e-05, -5.1927752792835236e-05, -4.709511995315552e-05, -4.22624871134758e-05, -3.742985427379608e-05, -3.2597221434116364e-05, -2.7764588594436646e-05, -2.2931955754756927e-05, -1.809932291507721e-05, -1.3266690075397491e-05, -8.434057235717773e-06, -3.6014243960380554e-06, 1.2312084436416626e-06, 6.063841283321381e-06, 1.0896474123001099e-05, 1.5729106962680817e-05, 2.0561739802360535e-05, 2.5394372642040253e-05, 3.022700548171997e-05, 3.505963832139969e-05, 3.989227116107941e-05, 4.4724904000759125e-05, 4.955753684043884e-05, 5.439016968011856e-05, 5.922280251979828e-05, 6.4055435359478e-05, 6.888806819915771e-05, 7.372070103883743e-05, 7.855333387851715e-05, 8.338596671819687e-05, 8.821859955787659e-05, 9.30512323975563e-05, 9.788386523723602e-05, 0.00010271649807691574, 0.00010754913091659546, 0.00011238176375627518, 0.0001172143965959549, 0.00012204702943563461, 0.00012687966227531433, 0.00013171229511499405, 0.00013654492795467377, 0.00014137756079435349, 0.0001462101936340332]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 11.0, 18.0, 17.0, 16.0, 26.0, 17.0, 29.0, 27.0, 30.0, 26.0, 32.0, 25.0, 31.0, 32.0, 35.0, 52.0, 45.0, 38.0, 46.0, 29.0, 28.0, 38.0, 35.0, 26.0, 37.0, 25.0, 22.0, 16.0, 23.0, 23.0, 19.0, 14.0, 12.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.142578125, -2.0771484375, -2.01171875, -1.9462890625, -1.880859375, -1.8154296875, -1.75, -1.6845703125, -1.619140625, -1.5537109375, -1.48828125, -1.4228515625, -1.357421875, -1.2919921875, -1.2265625, -1.1611328125, -1.095703125, -1.0302734375, -0.96484375, -0.8994140625, -0.833984375, -0.7685546875, -0.703125, -0.6376953125, -0.572265625, -0.5068359375, -0.44140625, -0.3759765625, -0.310546875, -0.2451171875, -0.1796875, -0.1142578125, -0.048828125, 0.0166015625, 0.08203125, 0.1474609375, 0.212890625, 0.2783203125, 0.34375, 0.4091796875, 0.474609375, 0.5400390625, 0.60546875, 0.6708984375, 0.736328125, 0.8017578125, 0.8671875, 0.9326171875, 0.998046875, 1.0634765625, 1.12890625, 1.1943359375, 1.259765625, 1.3251953125, 1.390625, 1.4560546875, 1.521484375, 1.5869140625, 1.65234375, 1.7177734375, 1.783203125, 1.8486328125, 1.9140625, 1.9794921875, 2.044921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 12.0, 11.0, 11.0, 19.0, 24.0, 31.0, 51.0, 61.0, 69.0, 101.0, 154.0, 230.0, 317.0, 465.0, 827.0, 1326.0, 2415.0, 4772.0, 9359.0, 20803.0, 51395.0, 152519.0, 423922.0, 246403.0, 77311.0, 29198.0, 12910.0, 6183.0, 3048.0, 1653.0, 998.0, 658.0, 376.0, 277.0, 200.0, 120.0, 106.0, 60.0, 38.0, 36.0, 22.0, 26.0, 14.0, 5.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.474609375, -2.39654541015625, -2.3184814453125, -2.24041748046875, -2.162353515625, -2.08428955078125, -2.0062255859375, -1.92816162109375, -1.85009765625, -1.77203369140625, -1.6939697265625, -1.61590576171875, -1.537841796875, -1.45977783203125, -1.3817138671875, -1.30364990234375, -1.2255859375, -1.14752197265625, -1.0694580078125, -0.99139404296875, -0.913330078125, -0.83526611328125, -0.7572021484375, -0.67913818359375, -0.60107421875, -0.52301025390625, -0.4449462890625, -0.36688232421875, -0.288818359375, -0.21075439453125, -0.1326904296875, -0.05462646484375, 0.0234375, 0.10150146484375, 0.1795654296875, 0.25762939453125, 0.335693359375, 0.41375732421875, 0.4918212890625, 0.56988525390625, 0.64794921875, 0.72601318359375, 0.8040771484375, 0.88214111328125, 0.960205078125, 1.03826904296875, 1.1163330078125, 1.19439697265625, 1.2724609375, 1.35052490234375, 1.4285888671875, 1.50665283203125, 1.584716796875, 1.66278076171875, 1.7408447265625, 1.81890869140625, 1.89697265625, 1.97503662109375, 2.0531005859375, 2.13116455078125, 2.209228515625, 2.28729248046875, 2.3653564453125, 2.44342041015625, 2.521484375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 3.0, 3.0, 9.0, 6.0, 10.0, 13.0, 17.0, 19.0, 28.0, 24.0, 32.0, 35.0, 55.0, 44.0, 59.0, 54.0, 114.0, 432.0, 1519.0, 123.0, 50.0, 55.0, 53.0, 50.0, 38.0, 33.0, 29.0, 31.0, 28.0, 26.0, 8.0, 8.0, 9.0, 10.0, 3.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.7147216796875, -7.429443359375, -7.1441650390625, -6.85888671875, -6.5736083984375, -6.288330078125, -6.0030517578125, -5.7177734375, -5.4324951171875, -5.147216796875, -4.8619384765625, -4.57666015625, -4.2913818359375, -4.006103515625, -3.7208251953125, -3.435546875, -3.1502685546875, -2.864990234375, -2.5797119140625, -2.29443359375, -2.0091552734375, -1.723876953125, -1.4385986328125, -1.1533203125, -0.8680419921875, -0.582763671875, -0.2974853515625, -0.01220703125, 0.2730712890625, 0.558349609375, 0.8436279296875, 1.12890625, 1.4141845703125, 1.699462890625, 1.9847412109375, 2.27001953125, 2.5552978515625, 2.840576171875, 3.1258544921875, 3.4111328125, 3.6964111328125, 3.981689453125, 4.2669677734375, 4.55224609375, 4.8375244140625, 5.122802734375, 5.4080810546875, 5.693359375, 5.9786376953125, 6.263916015625, 6.5491943359375, 6.83447265625, 7.1197509765625, 7.405029296875, 7.6903076171875, 7.9755859375, 8.2608642578125, 8.546142578125, 8.8314208984375, 9.11669921875, 9.4019775390625, 9.687255859375, 9.9725341796875, 10.2578125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 18.0, 12.0, 8.0, 12.0, 23.0, 32.0, 41.0, 57.0, 55.0, 79.0, 117.0, 191.0, 348.0, 1101.0, 11049.0, 2046745.0, 1075322.0, 8569.0, 948.0, 378.0, 171.0, 109.0, 65.0, 59.0, 44.0, 36.0, 21.0, 21.0, 12.0, 10.0, 10.0, 17.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.6875, -16.210205078125, -15.73291015625, -15.255615234375, -14.7783203125, -14.301025390625, -13.82373046875, -13.346435546875, -12.869140625, -12.391845703125, -11.91455078125, -11.437255859375, -10.9599609375, -10.482666015625, -10.00537109375, -9.528076171875, -9.05078125, -8.573486328125, -8.09619140625, -7.618896484375, -7.1416015625, -6.664306640625, -6.18701171875, -5.709716796875, -5.232421875, -4.755126953125, -4.27783203125, -3.800537109375, -3.3232421875, -2.845947265625, -2.36865234375, -1.891357421875, -1.4140625, -0.936767578125, -0.45947265625, 0.017822265625, 0.4951171875, 0.972412109375, 1.44970703125, 1.927001953125, 2.404296875, 2.881591796875, 3.35888671875, 3.836181640625, 4.3134765625, 4.790771484375, 5.26806640625, 5.745361328125, 6.22265625, 6.699951171875, 7.17724609375, 7.654541015625, 8.1318359375, 8.609130859375, 9.08642578125, 9.563720703125, 10.041015625, 10.518310546875, 10.99560546875, 11.472900390625, 11.9501953125, 12.427490234375, 12.90478515625, 13.382080078125, 13.859375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 37.0, 138.0, 324.0, 339.0, 140.0, 26.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.88785934448242, -42.930809020996094, -41.97376251220703, -41.0167121887207, -40.059661865234375, -39.10261154174805, -38.14556121826172, -37.188514709472656, -36.23146438598633, -35.2744140625, -34.31736755371094, -33.36031723022461, -32.40326690673828, -31.446216583251953, -30.489168167114258, -29.532119750976562, -28.575069427490234, -27.618019104003906, -26.66097068786621, -25.703922271728516, -24.746871948242188, -23.78982162475586, -22.832773208618164, -21.87572479248047, -20.91867446899414, -19.961624145507812, -19.004575729370117, -18.047527313232422, -17.090476989746094, -16.133426666259766, -15.17637825012207, -14.219328880310059, -13.262277603149414, -12.305228233337402, -11.34817886352539, -10.391129493713379, -9.434080123901367, -8.477030754089355, -7.519981384277344, -6.562932014465332, -5.60588264465332, -4.648833274841309, -3.691783905029297, -2.734734535217285, -1.7776851654052734, -0.8206357955932617, 0.13641357421875, 1.0934629440307617, 2.0505123138427734, 3.007561683654785, 3.964611053466797, 4.921660423278809, 5.87870979309082, 6.835759162902832, 7.792808532714844, 8.749857902526855, 9.706907272338867, 10.663956642150879, 11.62100601196289, 12.578055381774902, 13.535104751586914, 14.492154121398926, 15.449203491210938, 16.406253814697266, 17.36330223083496]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 13.0, 8.0, 16.0, 15.0, 12.0, 17.0, 13.0, 20.0, 22.0, 32.0, 28.0, 31.0, 36.0, 35.0, 35.0, 41.0, 43.0, 45.0, 39.0, 35.0, 30.0, 45.0, 32.0, 45.0, 26.0, 33.0, 32.0, 23.0, 34.0, 22.0, 17.0, 17.0, 13.0, 16.0, 12.0, 14.0, 3.0, 9.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-27.39957618713379, -26.6306209564209, -25.86166763305664, -25.09271240234375, -24.32375717163086, -23.5548038482666, -22.78584861755371, -22.016895294189453, -21.247940063476562, -20.478984832763672, -19.710031509399414, -18.941076278686523, -18.172122955322266, -17.403167724609375, -16.634212493896484, -15.86525821685791, -15.096303939819336, -14.327349662780762, -13.558395385742188, -12.789440155029297, -12.020485877990723, -11.251531600952148, -10.482576370239258, -9.713622093200684, -8.94466781616211, -8.175713539123535, -7.406758785247803, -6.63780403137207, -5.868849754333496, -5.099895477294922, -4.3309407234191895, -3.561985969543457, -2.7930335998535156, -2.0240790843963623, -1.255124568939209, -0.48617005348205566, 0.28278446197509766, 1.051738977432251, 1.8206934928894043, 2.5896482467651367, 3.358602523803711, 4.127556800842285, 4.896511554718018, 5.66546630859375, 6.434420585632324, 7.203374862670898, 7.972329616546631, 8.741284370422363, 9.510238647460938, 10.279192924499512, 11.048147201538086, 11.817102432250977, 12.58605670928955, 13.355010986328125, 14.123966217041016, 14.89292049407959, 15.661874771118164, 16.430830001831055, 17.199783325195312, 17.968738555908203, 18.737693786621094, 19.50664710998535, 20.275602340698242, 21.0445556640625, 21.81351089477539]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 3.0, 2.0, 5.0, 2.0, 7.0, 8.0, 12.0, 16.0, 15.0, 15.0, 22.0, 21.0, 18.0, 22.0, 23.0, 31.0, 25.0, 29.0, 25.0, 41.0, 32.0, 33.0, 44.0, 31.0, 51.0, 42.0, 34.0, 37.0, 39.0, 34.0, 35.0, 19.0, 19.0, 34.0, 15.0, 19.0, 19.0, 26.0, 11.0, 18.0, 15.0, 12.0, 10.0, 3.0, 7.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1640625, -2.096588134765625, -2.02911376953125, -1.961639404296875, -1.8941650390625, -1.826690673828125, -1.75921630859375, -1.691741943359375, -1.624267578125, -1.556793212890625, -1.48931884765625, -1.421844482421875, -1.3543701171875, -1.286895751953125, -1.21942138671875, -1.151947021484375, -1.08447265625, -1.016998291015625, -0.94952392578125, -0.882049560546875, -0.8145751953125, -0.747100830078125, -0.67962646484375, -0.612152099609375, -0.544677734375, -0.477203369140625, -0.40972900390625, -0.342254638671875, -0.2747802734375, -0.207305908203125, -0.13983154296875, -0.072357177734375, -0.0048828125, 0.062591552734375, 0.13006591796875, 0.197540283203125, 0.2650146484375, 0.332489013671875, 0.39996337890625, 0.467437744140625, 0.534912109375, 0.602386474609375, 0.66986083984375, 0.737335205078125, 0.8048095703125, 0.872283935546875, 0.93975830078125, 1.007232666015625, 1.07470703125, 1.142181396484375, 1.20965576171875, 1.277130126953125, 1.3446044921875, 1.412078857421875, 1.47955322265625, 1.547027587890625, 1.614501953125, 1.681976318359375, 1.74945068359375, 1.816925048828125, 1.8843994140625, 1.951873779296875, 2.01934814453125, 2.086822509765625, 2.154296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 8.0, 10.0, 10.0, 12.0, 12.0, 13.0, 12.0, 15.0, 23.0, 28.0, 19.0, 16.0, 26.0, 31.0, 37.0, 60.0, 148.0, 468.0, 2428.0, 42806.0, 2771058.0, 1356148.0, 18638.0, 1502.0, 310.0, 113.0, 56.0, 44.0, 26.0, 27.0, 17.0, 15.0, 12.0, 20.0, 20.0, 20.0, 17.0, 11.0, 12.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.430419921875, -12.04052734375, -11.650634765625, -11.2607421875, -10.870849609375, -10.48095703125, -10.091064453125, -9.701171875, -9.311279296875, -8.92138671875, -8.531494140625, -8.1416015625, -7.751708984375, -7.36181640625, -6.971923828125, -6.58203125, -6.192138671875, -5.80224609375, -5.412353515625, -5.0224609375, -4.632568359375, -4.24267578125, -3.852783203125, -3.462890625, -3.072998046875, -2.68310546875, -2.293212890625, -1.9033203125, -1.513427734375, -1.12353515625, -0.733642578125, -0.34375, 0.046142578125, 0.43603515625, 0.825927734375, 1.2158203125, 1.605712890625, 1.99560546875, 2.385498046875, 2.775390625, 3.165283203125, 3.55517578125, 3.945068359375, 4.3349609375, 4.724853515625, 5.11474609375, 5.504638671875, 5.89453125, 6.284423828125, 6.67431640625, 7.064208984375, 7.4541015625, 7.843994140625, 8.23388671875, 8.623779296875, 9.013671875, 9.403564453125, 9.79345703125, 10.183349609375, 10.5732421875, 10.963134765625, 11.35302734375, 11.742919921875, 12.1328125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 8.0, 6.0, 6.0, 6.0, 15.0, 21.0, 22.0, 30.0, 48.0, 60.0, 70.0, 102.0, 128.0, 201.0, 250.0, 271.0, 419.0, 415.0, 403.0, 348.0, 334.0, 266.0, 157.0, 127.0, 107.0, 65.0, 27.0, 27.0, 39.0, 25.0, 19.0, 18.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.08026123046875, -6.8714599609375, -6.66265869140625, -6.453857421875, -6.24505615234375, -6.0362548828125, -5.82745361328125, -5.61865234375, -5.40985107421875, -5.2010498046875, -4.99224853515625, -4.783447265625, -4.57464599609375, -4.3658447265625, -4.15704345703125, -3.9482421875, -3.73944091796875, -3.5306396484375, -3.32183837890625, -3.113037109375, -2.90423583984375, -2.6954345703125, -2.48663330078125, -2.27783203125, -2.06903076171875, -1.8602294921875, -1.65142822265625, -1.442626953125, -1.23382568359375, -1.0250244140625, -0.81622314453125, -0.607421875, -0.39862060546875, -0.1898193359375, 0.01898193359375, 0.227783203125, 0.43658447265625, 0.6453857421875, 0.85418701171875, 1.06298828125, 1.27178955078125, 1.4805908203125, 1.68939208984375, 1.898193359375, 2.10699462890625, 2.3157958984375, 2.52459716796875, 2.7333984375, 2.94219970703125, 3.1510009765625, 3.35980224609375, 3.568603515625, 3.77740478515625, 3.9862060546875, 4.19500732421875, 4.40380859375, 4.61260986328125, 4.8214111328125, 5.03021240234375, 5.239013671875, 5.44781494140625, 5.6566162109375, 5.86541748046875, 6.07421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 21.0, 20.0, 34.0, 37.0, 58.0, 122.0, 139.0, 240.0, 508.0, 2925.0, 361250.0, 3812626.0, 14491.0, 883.0, 362.0, 184.0, 110.0, 107.0, 56.0, 31.0, 22.0, 15.0, 11.0, 8.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.171875, -26.135986328125, -25.10009765625, -24.064208984375, -23.0283203125, -21.992431640625, -20.95654296875, -19.920654296875, -18.884765625, -17.848876953125, -16.81298828125, -15.777099609375, -14.7412109375, -13.705322265625, -12.66943359375, -11.633544921875, -10.59765625, -9.561767578125, -8.52587890625, -7.489990234375, -6.4541015625, -5.418212890625, -4.38232421875, -3.346435546875, -2.310546875, -1.274658203125, -0.23876953125, 0.797119140625, 1.8330078125, 2.868896484375, 3.90478515625, 4.940673828125, 5.9765625, 7.012451171875, 8.04833984375, 9.084228515625, 10.1201171875, 11.156005859375, 12.19189453125, 13.227783203125, 14.263671875, 15.299560546875, 16.33544921875, 17.371337890625, 18.4072265625, 19.443115234375, 20.47900390625, 21.514892578125, 22.55078125, 23.586669921875, 24.62255859375, 25.658447265625, 26.6943359375, 27.730224609375, 28.76611328125, 29.802001953125, 30.837890625, 31.873779296875, 32.90966796875, 33.945556640625, 34.9814453125, 36.017333984375, 37.05322265625, 38.089111328125, 39.125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 30.0, 165.0, 378.0, 330.0, 100.0, 10.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-170.1788787841797, -167.13201904296875, -164.0851593017578, -161.03829956054688, -157.99143981933594, -154.944580078125, -151.89773559570312, -148.8508758544922, -145.80401611328125, -142.7571563720703, -139.71029663085938, -136.66343688964844, -133.6165771484375, -130.56973266601562, -127.52286529541016, -124.47600555419922, -121.42914581298828, -118.38228607177734, -115.3354263305664, -112.28857421875, -109.24171447753906, -106.19485473632812, -103.14799499511719, -100.10113525390625, -97.05427551269531, -94.00741577148438, -90.96055603027344, -87.9136962890625, -84.8668441772461, -81.81998443603516, -78.77312469482422, -75.72626495361328, -72.6794204711914, -69.63256072998047, -66.58570098876953, -63.53884506225586, -60.49198913574219, -57.44512939453125, -54.39826965332031, -51.351409912109375, -48.3045539855957, -45.257694244384766, -42.210838317871094, -39.163978576660156, -36.11711883544922, -33.07026290893555, -30.02340316772461, -26.976545333862305, -23.9296875, -20.882829666137695, -17.83597183227539, -14.789112091064453, -11.742254257202148, -8.695396423339844, -5.648536682128906, -2.6016788482666016, 0.4451789855957031, 3.492037296295166, 6.538895606994629, 9.58575439453125, 12.632612228393555, 15.67947006225586, 18.726329803466797, 21.7731876373291, 24.820045471191406]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 9.0, 8.0, 10.0, 9.0, 9.0, 10.0, 17.0, 19.0, 17.0, 20.0, 23.0, 27.0, 32.0, 23.0, 25.0, 41.0, 27.0, 50.0, 34.0, 34.0, 49.0, 39.0, 44.0, 40.0, 40.0, 39.0, 37.0, 23.0, 24.0, 25.0, 30.0, 19.0, 19.0, 17.0, 13.0, 15.0, 11.0, 15.0, 8.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.906139373779297, -19.24754524230957, -18.58894920349121, -17.930355072021484, -17.271759033203125, -16.6131649017334, -15.954569816589355, -15.295974731445312, -14.63737964630127, -13.978784561157227, -13.320189476013184, -12.66159439086914, -12.003000259399414, -11.344404220581055, -10.685810089111328, -10.027215003967285, -9.368619918823242, -8.7100248336792, -8.051429748535156, -7.3928351402282715, -6.7342400550842285, -6.0756449699401855, -5.417050361633301, -4.758455276489258, -4.099860191345215, -3.441265106201172, -2.782670259475708, -2.124075412750244, -1.4654803276062012, -0.8068852424621582, -0.14829039573669434, 0.5103044509887695, 1.1689014434814453, 1.8274964094161987, 2.486091375350952, 3.144686222076416, 3.803281307220459, 4.461876392364502, 5.120471000671387, 5.77906608581543, 6.437661170959473, 7.096256256103516, 7.754851341247559, 8.413446426391602, 9.072040557861328, 9.730636596679688, 10.389230728149414, 11.047825813293457, 11.7064208984375, 12.365015983581543, 13.023611068725586, 13.682206153869629, 14.340801239013672, 14.999395370483398, 15.657990455627441, 16.316585540771484, 16.975181579589844, 17.63377571105957, 18.29237174987793, 18.950965881347656, 19.609561920166016, 20.268156051635742, 20.9267520904541, 21.585346221923828, 22.243940353393555]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 10.0, 5.0, 7.0, 10.0, 7.0, 12.0, 14.0, 14.0, 22.0, 20.0, 21.0, 14.0, 23.0, 29.0, 40.0, 32.0, 37.0, 32.0, 46.0, 22.0, 37.0, 28.0, 50.0, 41.0, 48.0, 36.0, 40.0, 29.0, 33.0, 24.0, 18.0, 23.0, 20.0, 17.0, 26.0, 21.0, 21.0, 17.0, 12.0, 7.0, 12.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.177734375, -2.107421875, -2.037109375, -1.966796875, -1.896484375, -1.826171875, -1.755859375, -1.685546875, -1.615234375, -1.544921875, -1.474609375, -1.404296875, -1.333984375, -1.263671875, -1.193359375, -1.123046875, -1.052734375, -0.982421875, -0.912109375, -0.841796875, -0.771484375, -0.701171875, -0.630859375, -0.560546875, -0.490234375, -0.419921875, -0.349609375, -0.279296875, -0.208984375, -0.138671875, -0.068359375, 0.001953125, 0.072265625, 0.142578125, 0.212890625, 0.283203125, 0.353515625, 0.423828125, 0.494140625, 0.564453125, 0.634765625, 0.705078125, 0.775390625, 0.845703125, 0.916015625, 0.986328125, 1.056640625, 1.126953125, 1.197265625, 1.267578125, 1.337890625, 1.408203125, 1.478515625, 1.548828125, 1.619140625, 1.689453125, 1.759765625, 1.830078125, 1.900390625, 1.970703125, 2.041015625, 2.111328125, 2.181640625, 2.251953125, 2.322265625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 8.0, 8.0, 11.0, 13.0, 24.0, 38.0, 58.0, 66.0, 111.0, 162.0, 226.0, 338.0, 482.0, 700.0, 983.0, 1449.0, 2053.0, 2925.0, 4291.0, 6130.0, 8811.0, 12756.0, 18585.0, 27513.0, 41772.0, 67127.0, 116498.0, 297536.0, 182195.0, 91381.0, 54424.0, 34814.0, 23245.0, 15891.0, 10958.0, 7680.0, 5327.0, 3673.0, 2565.0, 1770.0, 1204.0, 864.0, 583.0, 396.0, 272.0, 189.0, 151.0, 98.0, 60.0, 53.0, 32.0, 20.0, 14.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.4853515625, -0.4695892333984375, -0.453826904296875, -0.4380645751953125, -0.42230224609375, -0.4065399169921875, -0.390777587890625, -0.3750152587890625, -0.3592529296875, -0.3434906005859375, -0.327728271484375, -0.3119659423828125, -0.29620361328125, -0.2804412841796875, -0.264678955078125, -0.2489166259765625, -0.233154296875, -0.2173919677734375, -0.201629638671875, -0.1858673095703125, -0.17010498046875, -0.1543426513671875, -0.138580322265625, -0.1228179931640625, -0.1070556640625, -0.0912933349609375, -0.075531005859375, -0.0597686767578125, -0.04400634765625, -0.0282440185546875, -0.012481689453125, 0.0032806396484375, 0.01904296875, 0.0348052978515625, 0.050567626953125, 0.0663299560546875, 0.08209228515625, 0.0978546142578125, 0.113616943359375, 0.1293792724609375, 0.1451416015625, 0.1609039306640625, 0.176666259765625, 0.1924285888671875, 0.20819091796875, 0.2239532470703125, 0.239715576171875, 0.2554779052734375, 0.271240234375, 0.2870025634765625, 0.302764892578125, 0.3185272216796875, 0.33428955078125, 0.3500518798828125, 0.365814208984375, 0.3815765380859375, 0.3973388671875, 0.4131011962890625, 0.428863525390625, 0.4446258544921875, 0.46038818359375, 0.4761505126953125, 0.491912841796875, 0.5076751708984375, 0.5234375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0, 9.0, 12.0, 8.0, 9.0, 20.0, 20.0, 13.0, 27.0, 20.0, 30.0, 35.0, 42.0, 46.0, 43.0, 32.0, 42.0, 40.0, 47.0, 1063.0, 37.0, 32.0, 39.0, 27.0, 34.0, 50.0, 21.0, 30.0, 33.0, 32.0, 24.0, 13.0, 17.0, 9.0, 16.0, 7.0, 12.0, 6.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.3717498779296875, -1.323577880859375, -1.2754058837890625, -1.22723388671875, -1.1790618896484375, -1.130889892578125, -1.0827178955078125, -1.0345458984375, -0.9863739013671875, -0.938201904296875, -0.8900299072265625, -0.84185791015625, -0.7936859130859375, -0.745513916015625, -0.6973419189453125, -0.649169921875, -0.6009979248046875, -0.552825927734375, -0.5046539306640625, -0.45648193359375, -0.4083099365234375, -0.360137939453125, -0.3119659423828125, -0.2637939453125, -0.2156219482421875, -0.167449951171875, -0.1192779541015625, -0.07110595703125, -0.0229339599609375, 0.025238037109375, 0.0734100341796875, 0.12158203125, 0.1697540283203125, 0.217926025390625, 0.2660980224609375, 0.31427001953125, 0.3624420166015625, 0.410614013671875, 0.4587860107421875, 0.5069580078125, 0.5551300048828125, 0.603302001953125, 0.6514739990234375, 0.69964599609375, 0.7478179931640625, 0.795989990234375, 0.8441619873046875, 0.892333984375, 0.9405059814453125, 0.988677978515625, 1.0368499755859375, 1.08502197265625, 1.1331939697265625, 1.181365966796875, 1.2295379638671875, 1.2777099609375, 1.3258819580078125, 1.374053955078125, 1.4222259521484375, 1.47039794921875, 1.5185699462890625, 1.566741943359375, 1.6149139404296875, 1.6630859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 4.0, 5.0, 8.0, 9.0, 20.0, 27.0, 27.0, 44.0, 82.0, 79.0, 133.0, 223.0, 304.0, 459.0, 620.0, 1146.0, 1572.0, 2649.0, 4330.0, 7165.0, 11838.0, 20521.0, 36493.0, 66515.0, 125244.0, 1387818.0, 209345.0, 97256.0, 52282.0, 28964.0, 16537.0, 9608.0, 5846.0, 3539.0, 2363.0, 1440.0, 872.0, 607.0, 393.0, 267.0, 145.0, 119.0, 78.0, 41.0, 28.0, 27.0, 15.0, 8.0, 10.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.6494140625, -0.6302032470703125, -0.610992431640625, -0.5917816162109375, -0.57257080078125, -0.5533599853515625, -0.534149169921875, -0.5149383544921875, -0.4957275390625, -0.4765167236328125, -0.457305908203125, -0.4380950927734375, -0.41888427734375, -0.3996734619140625, -0.380462646484375, -0.3612518310546875, -0.342041015625, -0.3228302001953125, -0.303619384765625, -0.2844085693359375, -0.26519775390625, -0.2459869384765625, -0.226776123046875, -0.2075653076171875, -0.1883544921875, -0.1691436767578125, -0.149932861328125, -0.1307220458984375, -0.11151123046875, -0.0923004150390625, -0.073089599609375, -0.0538787841796875, -0.03466796875, -0.0154571533203125, 0.003753662109375, 0.0229644775390625, 0.04217529296875, 0.0613861083984375, 0.080596923828125, 0.0998077392578125, 0.1190185546875, 0.1382293701171875, 0.157440185546875, 0.1766510009765625, 0.19586181640625, 0.2150726318359375, 0.234283447265625, 0.2534942626953125, 0.272705078125, 0.2919158935546875, 0.311126708984375, 0.3303375244140625, 0.34954833984375, 0.3687591552734375, 0.387969970703125, 0.4071807861328125, 0.4263916015625, 0.4456024169921875, 0.464813232421875, 0.4840240478515625, 0.50323486328125, 0.5224456787109375, 0.541656494140625, 0.5608673095703125, 0.580078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 10.0, 18.0, 17.0, 21.0, 18.0, 25.0, 41.0, 67.0, 73.0, 78.0, 116.0, 88.0, 84.0, 66.0, 51.0, 38.0, 30.0, 26.0, 12.0, 21.0, 12.0, 21.0, 8.0, 9.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0005950927734375, -0.000578068196773529, -0.0005610436201095581, -0.0005440190434455872, -0.0005269944667816162, -0.0005099698901176453, -0.0004929453134536743, -0.00047592073678970337, -0.0004588961601257324, -0.0004418715834617615, -0.00042484700679779053, -0.0004078224301338196, -0.00039079785346984863, -0.0003737732768058777, -0.00035674870014190674, -0.0003397241234779358, -0.00032269954681396484, -0.0003056749701499939, -0.00028865039348602295, -0.000271625816822052, -0.00025460124015808105, -0.0002375766634941101, -0.00022055208683013916, -0.0002035275101661682, -0.00018650293350219727, -0.00016947835683822632, -0.00015245378017425537, -0.00013542920351028442, -0.00011840462684631348, -0.00010138005018234253, -8.435547351837158e-05, -6.733089685440063e-05, -5.030632019042969e-05, -3.328174352645874e-05, -1.6257166862487793e-05, 7.674098014831543e-07, 1.77919864654541e-05, 3.481656312942505e-05, 5.1841139793395996e-05, 6.886571645736694e-05, 8.589029312133789e-05, 0.00010291486978530884, 0.00011993944644927979, 0.00013696402311325073, 0.00015398859977722168, 0.00017101317644119263, 0.00018803775310516357, 0.00020506232976913452, 0.00022208690643310547, 0.00023911148309707642, 0.00025613605976104736, 0.0002731606364250183, 0.00029018521308898926, 0.0003072097897529602, 0.00032423436641693115, 0.0003412589430809021, 0.00035828351974487305, 0.000375308096408844, 0.00039233267307281494, 0.0004093572497367859, 0.00042638182640075684, 0.0004434064030647278, 0.00046043097972869873, 0.0004774555563926697, 0.0004944801330566406]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 2.0, 6.0, 1.0, 3.0, 9.0, 9.0, 13.0, 12.0, 19.0, 24.0, 40.0, 30.0, 44.0, 63.0, 109.0, 112.0, 221.0, 457.0, 2615.0, 1028139.0, 15160.0, 595.0, 262.0, 187.0, 118.0, 67.0, 54.0, 40.0, 28.0, 20.0, 21.0, 9.0, 16.0, 18.0, 9.0, 6.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00975799560546875, -0.009428858757019043, -0.009099721908569336, -0.008770585060119629, -0.008441448211669922, -0.008112311363220215, -0.007783174514770508, -0.007454037666320801, -0.007124900817871094, -0.006795763969421387, -0.00646662712097168, -0.006137490272521973, -0.005808353424072266, -0.005479216575622559, -0.0051500797271728516, -0.0048209428787231445, -0.0044918060302734375, -0.0041626691818237305, -0.0038335323333740234, -0.0035043954849243164, -0.0031752586364746094, -0.0028461217880249023, -0.0025169849395751953, -0.0021878480911254883, -0.0018587112426757812, -0.0015295743942260742, -0.0012004375457763672, -0.0008713006973266602, -0.0005421638488769531, -0.0002130270004272461, 0.00011610984802246094, 0.00044524669647216797, 0.000774383544921875, 0.001103520393371582, 0.001432657241821289, 0.001761794090270996, 0.002090930938720703, 0.00242006778717041, 0.002749204635620117, 0.0030783414840698242, 0.0034074783325195312, 0.0037366151809692383, 0.004065752029418945, 0.004394888877868652, 0.004724025726318359, 0.005053162574768066, 0.0053822994232177734, 0.0057114362716674805, 0.0060405731201171875, 0.0063697099685668945, 0.0066988468170166016, 0.007027983665466309, 0.007357120513916016, 0.007686257362365723, 0.00801539421081543, 0.008344531059265137, 0.008673667907714844, 0.00900280475616455, 0.009331941604614258, 0.009661078453063965, 0.009990215301513672, 0.010319352149963379, 0.010648488998413086, 0.010977625846862793, 0.0113067626953125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 63.0, 688.0, 259.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002278360305353999, -0.002217974280938506, -0.0021575884893536568, -0.0020972024649381638, -0.0020368166733533144, -0.0019764306489378214, -0.0019160447409376502, -0.001855658832937479, -0.0017952729249373078, -0.0017348870169371367, -0.0016745011089369655, -0.0016141152009367943, -0.0015537291765213013, -0.001493343384936452, -0.001432957360520959, -0.0013725714525207877, -0.0013121855445206165, -0.0012517996365204453, -0.0011914137285202742, -0.001131027820520103, -0.0010706419125199318, -0.0010102558881044388, -0.0009498699801042676, -0.0008894840721040964, -0.0008290981641039252, -0.000768712256103754, -0.0007083263481035829, -0.0006479403818957508, -0.0005875544738955796, -0.0005271685658954084, -0.00046678262879140675, -0.0004063966916874051, -0.0003460106672719121, -0.0002856247592717409, -0.00022523882216773927, -0.00016485289961565286, -0.00010446697706356645, -4.408106906339526e-05, 1.630486804060638e-05, 7.669080514460802e-05, 0.0001370767131447792, 0.00019746263569686562, 0.00025784855824895203, 0.00031823449535295367, 0.00037862040335312486, 0.00043900631135329604, 0.0004993922775611281, 0.0005597781855612993, 0.0006201640935614705, 0.0006805500015616417, 0.0007409359095618129, 0.000801321875769645, 0.0008617077837698162, 0.0009220936917699873, 0.0009824796579778194, 0.0010428655659779906, 0.0011032514739781618, 0.001163637381978333, 0.0012240232899785042, 0.0012844091979786754, 0.0013447951059788465, 0.0014051811303943396, 0.0014655670383945107, 0.001525952946394682, 0.0015863388543948531]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 13.0, 10.0, 15.0, 15.0, 23.0, 16.0, 38.0, 23.0, 28.0, 35.0, 30.0, 38.0, 37.0, 48.0, 55.0, 54.0, 38.0, 51.0, 44.0, 42.0, 38.0, 33.0, 40.0, 38.0, 29.0, 30.0, 18.0, 25.0, 6.0, 15.0, 12.0, 11.0, 13.0, 8.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000260770320892334, -0.0002523651346564293, -0.0002439599484205246, -0.0002355547621846199, -0.0002271495759487152, -0.00021874438971281052, -0.00021033920347690582, -0.00020193401724100113, -0.00019352883100509644, -0.00018512364476919174, -0.00017671845853328705, -0.00016831327229738235, -0.00015990808606147766, -0.00015150289982557297, -0.00014309771358966827, -0.00013469252735376358, -0.0001262873411178589, -0.00011788215488195419, -0.0001094769686460495, -0.0001010717824101448, -9.266659617424011e-05, -8.426140993833542e-05, -7.585622370243073e-05, -6.745103746652603e-05, -5.904585123062134e-05, -5.0640664994716644e-05, -4.223547875881195e-05, -3.383029252290726e-05, -2.5425106287002563e-05, -1.701992005109787e-05, -8.614733815193176e-06, -2.0954757928848267e-07, 8.195638656616211e-06, 1.6600824892520905e-05, 2.5006011128425598e-05, 3.341119736433029e-05, 4.1816383600234985e-05, 5.022156983613968e-05, 5.862675607204437e-05, 6.703194230794907e-05, 7.543712854385376e-05, 8.384231477975845e-05, 9.224750101566315e-05, 0.00010065268725156784, 0.00010905787348747253, 0.00011746305972337723, 0.00012586824595928192, 0.00013427343219518661, 0.0001426786184310913, 0.000151083804666996, 0.0001594889909029007, 0.0001678941771388054, 0.00017629936337471008, 0.00018470454961061478, 0.00019310973584651947, 0.00020151492208242416, 0.00020992010831832886, 0.00021832529455423355, 0.00022673048079013824, 0.00023513566702604294, 0.00024354085326194763, 0.0002519460394978523, 0.000260351225733757, 0.0002687564119696617, 0.0002771615982055664]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 10.0, 5.0, 7.0, 10.0, 7.0, 12.0, 14.0, 14.0, 22.0, 20.0, 21.0, 14.0, 23.0, 29.0, 40.0, 32.0, 37.0, 32.0, 46.0, 22.0, 37.0, 27.0, 51.0, 41.0, 48.0, 36.0, 40.0, 29.0, 33.0, 24.0, 18.0, 23.0, 20.0, 17.0, 26.0, 21.0, 21.0, 17.0, 12.0, 7.0, 12.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.177734375, -2.107421875, -2.037109375, -1.966796875, -1.896484375, -1.826171875, -1.755859375, -1.685546875, -1.615234375, -1.544921875, -1.474609375, -1.404296875, -1.333984375, -1.263671875, -1.193359375, -1.123046875, -1.052734375, -0.982421875, -0.912109375, -0.841796875, -0.771484375, -0.701171875, -0.630859375, -0.560546875, -0.490234375, -0.419921875, -0.349609375, -0.279296875, -0.208984375, -0.138671875, -0.068359375, 0.001953125, 0.072265625, 0.142578125, 0.212890625, 0.283203125, 0.353515625, 0.423828125, 0.494140625, 0.564453125, 0.634765625, 0.705078125, 0.775390625, 0.845703125, 0.916015625, 0.986328125, 1.056640625, 1.126953125, 1.197265625, 1.267578125, 1.337890625, 1.408203125, 1.478515625, 1.548828125, 1.619140625, 1.689453125, 1.759765625, 1.830078125, 1.900390625, 1.970703125, 2.041015625, 2.111328125, 2.181640625, 2.251953125, 2.322265625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 6.0, 10.0, 13.0, 25.0, 22.0, 28.0, 24.0, 52.0, 62.0, 69.0, 106.0, 141.0, 229.0, 323.0, 570.0, 963.0, 1591.0, 2944.0, 6830.0, 17918.0, 54860.0, 198112.0, 453141.0, 216716.0, 59894.0, 19076.0, 7280.0, 3293.0, 1563.0, 948.0, 538.0, 334.0, 253.0, 156.0, 109.0, 88.0, 63.0, 58.0, 32.0, 31.0, 16.0, 13.0, 16.0, 12.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.407806396484375, -2.32342529296875, -2.239044189453125, -2.1546630859375, -2.070281982421875, -1.98590087890625, -1.901519775390625, -1.817138671875, -1.732757568359375, -1.64837646484375, -1.563995361328125, -1.4796142578125, -1.395233154296875, -1.31085205078125, -1.226470947265625, -1.14208984375, -1.057708740234375, -0.97332763671875, -0.888946533203125, -0.8045654296875, -0.720184326171875, -0.63580322265625, -0.551422119140625, -0.467041015625, -0.382659912109375, -0.29827880859375, -0.213897705078125, -0.1295166015625, -0.045135498046875, 0.03924560546875, 0.123626708984375, 0.2080078125, 0.292388916015625, 0.37677001953125, 0.461151123046875, 0.5455322265625, 0.629913330078125, 0.71429443359375, 0.798675537109375, 0.883056640625, 0.967437744140625, 1.05181884765625, 1.136199951171875, 1.2205810546875, 1.304962158203125, 1.38934326171875, 1.473724365234375, 1.55810546875, 1.642486572265625, 1.72686767578125, 1.811248779296875, 1.8956298828125, 1.980010986328125, 2.06439208984375, 2.148773193359375, 2.233154296875, 2.317535400390625, 2.40191650390625, 2.486297607421875, 2.5706787109375, 2.655059814453125, 2.73944091796875, 2.823822021484375, 2.908203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 7.0, 9.0, 12.0, 13.0, 10.0, 16.0, 29.0, 27.0, 41.0, 38.0, 27.0, 42.0, 58.0, 63.0, 117.0, 425.0, 1526.0, 119.0, 71.0, 35.0, 49.0, 45.0, 33.0, 41.0, 41.0, 28.0, 24.0, 16.0, 10.0, 17.0, 12.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.09375, -9.7974853515625, -9.501220703125, -9.2049560546875, -8.90869140625, -8.6124267578125, -8.316162109375, -8.0198974609375, -7.7236328125, -7.4273681640625, -7.131103515625, -6.8348388671875, -6.53857421875, -6.2423095703125, -5.946044921875, -5.6497802734375, -5.353515625, -5.0572509765625, -4.760986328125, -4.4647216796875, -4.16845703125, -3.8721923828125, -3.575927734375, -3.2796630859375, -2.9833984375, -2.6871337890625, -2.390869140625, -2.0946044921875, -1.79833984375, -1.5020751953125, -1.205810546875, -0.9095458984375, -0.61328125, -0.3170166015625, -0.020751953125, 0.2755126953125, 0.57177734375, 0.8680419921875, 1.164306640625, 1.4605712890625, 1.7568359375, 2.0531005859375, 2.349365234375, 2.6456298828125, 2.94189453125, 3.2381591796875, 3.534423828125, 3.8306884765625, 4.126953125, 4.4232177734375, 4.719482421875, 5.0157470703125, 5.31201171875, 5.6082763671875, 5.904541015625, 6.2008056640625, 6.4970703125, 6.7933349609375, 7.089599609375, 7.3858642578125, 7.68212890625, 7.9783935546875, 8.274658203125, 8.5709228515625, 8.8671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 7.0, 15.0, 14.0, 20.0, 18.0, 26.0, 39.0, 51.0, 51.0, 80.0, 109.0, 193.0, 386.0, 968.0, 7059.0, 782772.0, 2341593.0, 9991.0, 1243.0, 441.0, 178.0, 100.0, 78.0, 57.0, 54.0, 42.0, 16.0, 17.0, 15.0, 13.0, 12.0, 10.0, 6.0, 7.0, 4.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.921875, -15.42529296875, -14.9287109375, -14.43212890625, -13.935546875, -13.43896484375, -12.9423828125, -12.44580078125, -11.94921875, -11.45263671875, -10.9560546875, -10.45947265625, -9.962890625, -9.46630859375, -8.9697265625, -8.47314453125, -7.9765625, -7.47998046875, -6.9833984375, -6.48681640625, -5.990234375, -5.49365234375, -4.9970703125, -4.50048828125, -4.00390625, -3.50732421875, -3.0107421875, -2.51416015625, -2.017578125, -1.52099609375, -1.0244140625, -0.52783203125, -0.03125, 0.46533203125, 0.9619140625, 1.45849609375, 1.955078125, 2.45166015625, 2.9482421875, 3.44482421875, 3.94140625, 4.43798828125, 4.9345703125, 5.43115234375, 5.927734375, 6.42431640625, 6.9208984375, 7.41748046875, 7.9140625, 8.41064453125, 8.9072265625, 9.40380859375, 9.900390625, 10.39697265625, 10.8935546875, 11.39013671875, 11.88671875, 12.38330078125, 12.8798828125, 13.37646484375, 13.873046875, 14.36962890625, 14.8662109375, 15.36279296875, 15.859375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [24.0, 989.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.454665184020996, -2.6199545860290527, 3.2147560119628906, 9.049466133117676, 14.884177207946777, 20.718887329101562, 26.55359649658203, 32.388309478759766, 38.223018646240234, 44.0577278137207, 49.89244079589844, 55.727149963378906, 61.561859130859375, 67.39657592773438, 73.23127746582031, 79.06599426269531, 84.90070343017578, 90.73541259765625, 96.57012176513672, 102.40483093261719, 108.23954772949219, 114.07425689697266, 119.90896606445312, 125.74368286132812, 131.57838439941406, 137.41310119628906, 143.247802734375, 149.08251953125, 154.91722106933594, 160.75193786621094, 166.58663940429688, 172.42135620117188, 178.25608825683594, 184.09080505371094, 189.92550659179688, 195.76022338867188, 201.5949249267578, 207.4296417236328, 213.26434326171875, 219.09906005859375, 224.93377685546875, 230.76849365234375, 236.6031951904297, 242.4379119873047, 248.27261352539062, 254.10733032226562, 259.9420471191406, 265.7767639160156, 271.6114501953125, 277.4461669921875, 283.2808837890625, 289.1155700683594, 294.9502868652344, 300.7850036621094, 306.6197204589844, 312.4544372558594, 318.2891540527344, 324.1238708496094, 329.9585876464844, 335.79327392578125, 341.62799072265625, 347.46270751953125, 353.29742431640625, 359.13214111328125, 364.9668273925781]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 6.0, 13.0, 9.0, 15.0, 15.0, 21.0, 18.0, 23.0, 30.0, 30.0, 27.0, 38.0, 40.0, 39.0, 44.0, 39.0, 38.0, 33.0, 47.0, 33.0, 49.0, 41.0, 41.0, 38.0, 38.0, 30.0, 31.0, 28.0, 19.0, 19.0, 19.0, 14.0, 12.0, 11.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.91810417175293, -28.028846740722656, -27.139589309692383, -26.250329971313477, -25.361072540283203, -24.47181510925293, -23.582557678222656, -22.69329833984375, -21.804040908813477, -20.914783477783203, -20.02552604675293, -19.136266708374023, -18.24700927734375, -17.357751846313477, -16.468494415283203, -15.579236030578613, -14.68997859954834, -13.800721168518066, -12.911462783813477, -12.022205352783203, -11.132946968078613, -10.24368953704834, -9.35443115234375, -8.465173721313477, -7.575915813446045, -6.686657905578613, -5.797399997711182, -4.90814208984375, -4.018884658813477, -3.129626750946045, -2.2403688430786133, -1.3511109352111816, -0.46185302734375, 0.42740482091903687, 1.3166626691818237, 2.205920457839966, 3.0951783657073975, 3.98443603515625, 4.873693943023682, 5.762951850891113, 6.652209758758545, 7.541467666625977, 8.43072509765625, 9.31998348236084, 10.209240913391113, 11.098499298095703, 11.987756729125977, 12.87701416015625, 13.76627254486084, 14.655529975891113, 15.544788360595703, 16.434045791625977, 17.32330322265625, 18.212562561035156, 19.10181999206543, 19.991077423095703, 20.880334854125977, 21.76959228515625, 22.658849716186523, 23.54810905456543, 24.437366485595703, 25.326623916625977, 26.21588134765625, 27.105140686035156, 27.99439811706543]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 4.0, 5.0, 7.0, 7.0, 12.0, 8.0, 13.0, 16.0, 21.0, 18.0, 19.0, 21.0, 22.0, 19.0, 30.0, 35.0, 44.0, 44.0, 39.0, 33.0, 38.0, 46.0, 32.0, 37.0, 37.0, 51.0, 43.0, 37.0, 23.0, 18.0, 24.0, 18.0, 23.0, 21.0, 17.0, 23.0, 23.0, 21.0, 15.0, 6.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.244140625, -2.169219970703125, -2.09429931640625, -2.019378662109375, -1.9444580078125, -1.869537353515625, -1.79461669921875, -1.719696044921875, -1.644775390625, -1.569854736328125, -1.49493408203125, -1.420013427734375, -1.3450927734375, -1.270172119140625, -1.19525146484375, -1.120330810546875, -1.04541015625, -0.970489501953125, -0.89556884765625, -0.820648193359375, -0.7457275390625, -0.670806884765625, -0.59588623046875, -0.520965576171875, -0.446044921875, -0.371124267578125, -0.29620361328125, -0.221282958984375, -0.1463623046875, -0.071441650390625, 0.00347900390625, 0.078399658203125, 0.1533203125, 0.228240966796875, 0.30316162109375, 0.378082275390625, 0.4530029296875, 0.527923583984375, 0.60284423828125, 0.677764892578125, 0.752685546875, 0.827606201171875, 0.90252685546875, 0.977447509765625, 1.0523681640625, 1.127288818359375, 1.20220947265625, 1.277130126953125, 1.35205078125, 1.426971435546875, 1.50189208984375, 1.576812744140625, 1.6517333984375, 1.726654052734375, 1.80157470703125, 1.876495361328125, 1.951416015625, 2.026336669921875, 2.10125732421875, 2.176177978515625, 2.2510986328125, 2.326019287109375, 2.40093994140625, 2.475860595703125, 2.55078125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 4.0, 8.0, 17.0, 20.0, 22.0, 20.0, 35.0, 60.0, 66.0, 111.0, 168.0, 360.0, 643.0, 1495.0, 4384.0, 15122.0, 68867.0, 431227.0, 1808287.0, 1498927.0, 296845.0, 49883.0, 11635.0, 3447.0, 1253.0, 511.0, 284.0, 184.0, 105.0, 68.0, 48.0, 30.0, 24.0, 24.0, 15.0, 12.0, 10.0, 18.0, 8.0, 3.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.44921875, -4.3004150390625, -4.151611328125, -4.0028076171875, -3.85400390625, -3.7052001953125, -3.556396484375, -3.4075927734375, -3.2587890625, -3.1099853515625, -2.961181640625, -2.8123779296875, -2.66357421875, -2.5147705078125, -2.365966796875, -2.2171630859375, -2.068359375, -1.9195556640625, -1.770751953125, -1.6219482421875, -1.47314453125, -1.3243408203125, -1.175537109375, -1.0267333984375, -0.8779296875, -0.7291259765625, -0.580322265625, -0.4315185546875, -0.28271484375, -0.1339111328125, 0.014892578125, 0.1636962890625, 0.3125, 0.4613037109375, 0.610107421875, 0.7589111328125, 0.90771484375, 1.0565185546875, 1.205322265625, 1.3541259765625, 1.5029296875, 1.6517333984375, 1.800537109375, 1.9493408203125, 2.09814453125, 2.2469482421875, 2.395751953125, 2.5445556640625, 2.693359375, 2.8421630859375, 2.990966796875, 3.1397705078125, 3.28857421875, 3.4373779296875, 3.586181640625, 3.7349853515625, 3.8837890625, 4.0325927734375, 4.181396484375, 4.3302001953125, 4.47900390625, 4.6278076171875, 4.776611328125, 4.9254150390625, 5.07421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 9.0, 12.0, 15.0, 20.0, 32.0, 44.0, 62.0, 98.0, 125.0, 176.0, 240.0, 317.0, 403.0, 474.0, 452.0, 411.0, 319.0, 223.0, 151.0, 131.0, 74.0, 73.0, 43.0, 41.0, 36.0, 21.0, 10.0, 14.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.8203125, -8.5938720703125, -8.367431640625, -8.1409912109375, -7.91455078125, -7.6881103515625, -7.461669921875, -7.2352294921875, -7.0087890625, -6.7823486328125, -6.555908203125, -6.3294677734375, -6.10302734375, -5.8765869140625, -5.650146484375, -5.4237060546875, -5.197265625, -4.9708251953125, -4.744384765625, -4.5179443359375, -4.29150390625, -4.0650634765625, -3.838623046875, -3.6121826171875, -3.3857421875, -3.1593017578125, -2.932861328125, -2.7064208984375, -2.47998046875, -2.2535400390625, -2.027099609375, -1.8006591796875, -1.57421875, -1.3477783203125, -1.121337890625, -0.8948974609375, -0.66845703125, -0.4420166015625, -0.215576171875, 0.0108642578125, 0.2373046875, 0.4637451171875, 0.690185546875, 0.9166259765625, 1.14306640625, 1.3695068359375, 1.595947265625, 1.8223876953125, 2.048828125, 2.2752685546875, 2.501708984375, 2.7281494140625, 2.95458984375, 3.1810302734375, 3.407470703125, 3.6339111328125, 3.8603515625, 4.0867919921875, 4.313232421875, 4.5396728515625, 4.76611328125, 4.9925537109375, 5.218994140625, 5.4454345703125, 5.671875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 5.0, 10.0, 10.0, 18.0, 17.0, 25.0, 44.0, 53.0, 82.0, 136.0, 215.0, 515.0, 2429.0, 99322.0, 4010479.0, 77596.0, 2136.0, 538.0, 232.0, 141.0, 64.0, 60.0, 46.0, 38.0, 17.0, 16.0, 4.0, 10.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.125, -23.2138671875, -22.302734375, -21.3916015625, -20.48046875, -19.5693359375, -18.658203125, -17.7470703125, -16.8359375, -15.9248046875, -15.013671875, -14.1025390625, -13.19140625, -12.2802734375, -11.369140625, -10.4580078125, -9.546875, -8.6357421875, -7.724609375, -6.8134765625, -5.90234375, -4.9912109375, -4.080078125, -3.1689453125, -2.2578125, -1.3466796875, -0.435546875, 0.4755859375, 1.38671875, 2.2978515625, 3.208984375, 4.1201171875, 5.03125, 5.9423828125, 6.853515625, 7.7646484375, 8.67578125, 9.5869140625, 10.498046875, 11.4091796875, 12.3203125, 13.2314453125, 14.142578125, 15.0537109375, 15.96484375, 16.8759765625, 17.787109375, 18.6982421875, 19.609375, 20.5205078125, 21.431640625, 22.3427734375, 23.25390625, 24.1650390625, 25.076171875, 25.9873046875, 26.8984375, 27.8095703125, 28.720703125, 29.6318359375, 30.54296875, 31.4541015625, 32.365234375, 33.2763671875, 34.1875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 10.0, 38.0, 158.0, 330.0, 303.0, 137.0, 29.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.01701354980469, -117.21588897705078, -114.41476440429688, -111.61363983154297, -108.81251525878906, -106.01139068603516, -103.21026611328125, -100.40913391113281, -97.60801696777344, -94.80689239501953, -92.00576782226562, -89.20464324951172, -86.40351867675781, -83.6023941040039, -80.80126953125, -78.00013732910156, -75.19901275634766, -72.39788818359375, -69.59676361083984, -66.79563903808594, -63.99451446533203, -61.193389892578125, -58.39226150512695, -55.59113693237305, -52.79001235961914, -49.988887786865234, -47.18776321411133, -44.386634826660156, -41.58551025390625, -38.784385681152344, -35.98326110839844, -33.18213653564453, -30.38100814819336, -27.579883575439453, -24.778759002685547, -21.977632522583008, -19.1765079498291, -16.375383377075195, -13.574256896972656, -10.77313232421875, -7.972007751464844, -5.170882701873779, -2.369757652282715, 0.4313678741455078, 3.232492446899414, 6.03361701965332, 8.83474349975586, 11.635868072509766, 14.436992645263672, 17.238117218017578, 20.039241790771484, 22.840368270874023, 25.64149284362793, 28.442617416381836, 31.243743896484375, 34.04486846923828, 36.84599304199219, 39.647117614746094, 42.4482421875, 45.249366760253906, 48.05049133300781, 50.85161590576172, 53.65274429321289, 56.4538688659668, 59.2549934387207]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 8.0, 5.0, 9.0, 16.0, 19.0, 19.0, 22.0, 23.0, 24.0, 22.0, 41.0, 31.0, 26.0, 43.0, 29.0, 35.0, 47.0, 39.0, 43.0, 46.0, 48.0, 44.0, 37.0, 34.0, 27.0, 40.0, 25.0, 32.0, 31.0, 25.0, 15.0, 18.0, 12.0, 10.0, 13.0, 6.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-27.347843170166016, -26.58557891845703, -25.823314666748047, -25.061052322387695, -24.29878807067871, -23.536523818969727, -22.774261474609375, -22.01199722290039, -21.249732971191406, -20.487468719482422, -19.725204467773438, -18.962942123413086, -18.2006778717041, -17.438413619995117, -16.676151275634766, -15.913887023925781, -15.151622772216797, -14.389358520507812, -13.627095222473145, -12.864831924438477, -12.102567672729492, -11.340303421020508, -10.57804012298584, -9.815776824951172, -9.053512573242188, -8.291248321533203, -7.528985023498535, -6.766721248626709, -6.004457473754883, -5.242193698883057, -4.4799299240112305, -3.7176661491394043, -2.955402374267578, -2.193138599395752, -1.4308748245239258, -0.6686110496520996, 0.09365272521972656, 0.8559165000915527, 1.618180274963379, 2.380444049835205, 3.1427078247070312, 3.9049715995788574, 4.667235374450684, 5.42949914932251, 6.191762924194336, 6.954026699066162, 7.716290473937988, 8.478553771972656, 9.24081802368164, 10.003082275390625, 10.765345573425293, 11.527608871459961, 12.289873123168945, 13.05213737487793, 13.814400672912598, 14.576663970947266, 15.33892822265625, 16.101192474365234, 16.86345672607422, 17.62571907043457, 18.387983322143555, 19.15024757385254, 19.91250991821289, 20.674774169921875, 21.43703842163086]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 8.0, 13.0, 15.0, 13.0, 22.0, 16.0, 15.0, 22.0, 19.0, 24.0, 28.0, 39.0, 44.0, 24.0, 39.0, 52.0, 37.0, 62.0, 39.0, 37.0, 40.0, 37.0, 30.0, 32.0, 32.0, 22.0, 32.0, 30.0, 23.0, 27.0, 17.0, 21.0, 16.0, 19.0, 11.0, 6.0, 7.0, 9.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.57421875, -2.492279052734375, -2.41033935546875, -2.328399658203125, -2.2464599609375, -2.164520263671875, -2.08258056640625, -2.000640869140625, -1.918701171875, -1.836761474609375, -1.75482177734375, -1.672882080078125, -1.5909423828125, -1.509002685546875, -1.42706298828125, -1.345123291015625, -1.26318359375, -1.181243896484375, -1.09930419921875, -1.017364501953125, -0.9354248046875, -0.853485107421875, -0.77154541015625, -0.689605712890625, -0.607666015625, -0.525726318359375, -0.44378662109375, -0.361846923828125, -0.2799072265625, -0.197967529296875, -0.11602783203125, -0.034088134765625, 0.0478515625, 0.129791259765625, 0.21173095703125, 0.293670654296875, 0.3756103515625, 0.457550048828125, 0.53948974609375, 0.621429443359375, 0.703369140625, 0.785308837890625, 0.86724853515625, 0.949188232421875, 1.0311279296875, 1.113067626953125, 1.19500732421875, 1.276947021484375, 1.35888671875, 1.440826416015625, 1.52276611328125, 1.604705810546875, 1.6866455078125, 1.768585205078125, 1.85052490234375, 1.932464599609375, 2.014404296875, 2.096343994140625, 2.17828369140625, 2.260223388671875, 2.3421630859375, 2.424102783203125, 2.50604248046875, 2.587982177734375, 2.669921875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 8.0, 6.0, 9.0, 11.0, 10.0, 22.0, 36.0, 44.0, 76.0, 118.0, 181.0, 263.0, 413.0, 658.0, 1027.0, 1787.0, 2888.0, 4695.0, 7815.0, 12633.0, 21279.0, 35889.0, 64296.0, 123412.0, 342531.0, 211705.0, 92916.0, 50724.0, 28870.0, 17336.0, 10398.0, 6428.0, 3917.0, 2336.0, 1399.0, 825.0, 559.0, 370.0, 228.0, 140.0, 101.0, 67.0, 48.0, 27.0, 18.0, 14.0, 9.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7216796875, -0.699676513671875, -0.67767333984375, -0.655670166015625, -0.6336669921875, -0.611663818359375, -0.58966064453125, -0.567657470703125, -0.545654296875, -0.523651123046875, -0.50164794921875, -0.479644775390625, -0.4576416015625, -0.435638427734375, -0.41363525390625, -0.391632080078125, -0.36962890625, -0.347625732421875, -0.32562255859375, -0.303619384765625, -0.2816162109375, -0.259613037109375, -0.23760986328125, -0.215606689453125, -0.193603515625, -0.171600341796875, -0.14959716796875, -0.127593994140625, -0.1055908203125, -0.083587646484375, -0.06158447265625, -0.039581298828125, -0.017578125, 0.004425048828125, 0.02642822265625, 0.048431396484375, 0.0704345703125, 0.092437744140625, 0.11444091796875, 0.136444091796875, 0.158447265625, 0.180450439453125, 0.20245361328125, 0.224456787109375, 0.2464599609375, 0.268463134765625, 0.29046630859375, 0.312469482421875, 0.33447265625, 0.356475830078125, 0.37847900390625, 0.400482177734375, 0.4224853515625, 0.444488525390625, 0.46649169921875, 0.488494873046875, 0.510498046875, 0.532501220703125, 0.55450439453125, 0.576507568359375, 0.5985107421875, 0.620513916015625, 0.64251708984375, 0.664520263671875, 0.6865234375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 5.0, 2.0, 9.0, 7.0, 10.0, 7.0, 19.0, 19.0, 20.0, 20.0, 28.0, 28.0, 37.0, 43.0, 45.0, 49.0, 39.0, 47.0, 39.0, 1072.0, 41.0, 50.0, 53.0, 40.0, 39.0, 35.0, 34.0, 24.0, 31.0, 19.0, 23.0, 13.0, 12.0, 16.0, 11.0, 8.0, 7.0, 4.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.8671875, -1.810211181640625, -1.75323486328125, -1.696258544921875, -1.6392822265625, -1.582305908203125, -1.52532958984375, -1.468353271484375, -1.411376953125, -1.354400634765625, -1.29742431640625, -1.240447998046875, -1.1834716796875, -1.126495361328125, -1.06951904296875, -1.012542724609375, -0.95556640625, -0.898590087890625, -0.84161376953125, -0.784637451171875, -0.7276611328125, -0.670684814453125, -0.61370849609375, -0.556732177734375, -0.499755859375, -0.442779541015625, -0.38580322265625, -0.328826904296875, -0.2718505859375, -0.214874267578125, -0.15789794921875, -0.100921630859375, -0.0439453125, 0.013031005859375, 0.07000732421875, 0.126983642578125, 0.1839599609375, 0.240936279296875, 0.29791259765625, 0.354888916015625, 0.411865234375, 0.468841552734375, 0.52581787109375, 0.582794189453125, 0.6397705078125, 0.696746826171875, 0.75372314453125, 0.810699462890625, 0.86767578125, 0.924652099609375, 0.98162841796875, 1.038604736328125, 1.0955810546875, 1.152557373046875, 1.20953369140625, 1.266510009765625, 1.323486328125, 1.380462646484375, 1.43743896484375, 1.494415283203125, 1.5513916015625, 1.608367919921875, 1.66534423828125, 1.722320556640625, 1.779296875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 10.0, 18.0, 15.0, 49.0, 43.0, 76.0, 87.0, 156.0, 242.0, 314.0, 612.0, 891.0, 1368.0, 2287.0, 3767.0, 6253.0, 10932.0, 19404.0, 35962.0, 70084.0, 149346.0, 1455715.0, 172565.0, 77228.0, 39165.0, 21001.0, 11738.0, 6950.0, 4102.0, 2496.0, 1559.0, 943.0, 640.0, 390.0, 241.0, 173.0, 107.0, 67.0, 42.0, 29.0, 20.0, 9.0, 9.0, 10.0, 7.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7134780883789062, -0.6901397705078125, -0.6668014526367188, -0.643463134765625, -0.6201248168945312, -0.5967864990234375, -0.5734481811523438, -0.55010986328125, -0.5267715454101562, -0.5034332275390625, -0.48009490966796875, -0.456756591796875, -0.43341827392578125, -0.4100799560546875, -0.38674163818359375, -0.3634033203125, -0.34006500244140625, -0.3167266845703125, -0.29338836669921875, -0.270050048828125, -0.24671173095703125, -0.2233734130859375, -0.20003509521484375, -0.17669677734375, -0.15335845947265625, -0.1300201416015625, -0.10668182373046875, -0.083343505859375, -0.06000518798828125, -0.0366668701171875, -0.01332855224609375, 0.010009765625, 0.03334808349609375, 0.0566864013671875, 0.08002471923828125, 0.103363037109375, 0.12670135498046875, 0.1500396728515625, 0.17337799072265625, 0.19671630859375, 0.22005462646484375, 0.2433929443359375, 0.26673126220703125, 0.290069580078125, 0.31340789794921875, 0.3367462158203125, 0.36008453369140625, 0.3834228515625, 0.40676116943359375, 0.4300994873046875, 0.45343780517578125, 0.476776123046875, 0.5001144409179688, 0.5234527587890625, 0.5467910766601562, 0.57012939453125, 0.5934677124023438, 0.6168060302734375, 0.6401443481445312, 0.663482666015625, 0.6868209838867188, 0.7101593017578125, 0.7334976196289062, 0.7568359375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 2.0, 5.0, 7.0, 8.0, 15.0, 23.0, 23.0, 17.0, 35.0, 34.0, 49.0, 79.0, 105.0, 119.0, 109.0, 87.0, 54.0, 47.0, 28.0, 27.0, 22.0, 17.0, 8.0, 11.0, 5.0, 6.0, 6.0, 8.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005049705505371094, -0.0004903040826320648, -0.00047563761472702026, -0.0004609711468219757, -0.00044630467891693115, -0.0004316382110118866, -0.00041697174310684204, -0.0004023052752017975, -0.00038763880729675293, -0.0003729723393917084, -0.0003583058714866638, -0.00034363940358161926, -0.0003289729356765747, -0.00031430646777153015, -0.0002996399998664856, -0.00028497353196144104, -0.0002703070640563965, -0.00025564059615135193, -0.00024097412824630737, -0.00022630766034126282, -0.00021164119243621826, -0.0001969747245311737, -0.00018230825662612915, -0.0001676417887210846, -0.00015297532081604004, -0.00013830885291099548, -0.00012364238500595093, -0.00010897591710090637, -9.430944919586182e-05, -7.964298129081726e-05, -6.49765133857727e-05, -5.031004548072815e-05, -3.5643577575683594e-05, -2.0977109670639038e-05, -6.310641765594482e-06, 8.355826139450073e-06, 2.302229404449463e-05, 3.7688761949539185e-05, 5.235522985458374e-05, 6.70216977596283e-05, 8.168816566467285e-05, 9.635463356971741e-05, 0.00011102110147476196, 0.00012568756937980652, 0.00014035403728485107, 0.00015502050518989563, 0.00016968697309494019, 0.00018435344099998474, 0.0001990199089050293, 0.00021368637681007385, 0.0002283528447151184, 0.00024301931262016296, 0.0002576857805252075, 0.0002723522484302521, 0.00028701871633529663, 0.0003016851842403412, 0.00031635165214538574, 0.0003310181200504303, 0.00034568458795547485, 0.0003603510558605194, 0.00037501752376556396, 0.0003896839916706085, 0.0004043504595756531, 0.00041901692748069763, 0.0004336833953857422]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 10.0, 13.0, 18.0, 29.0, 40.0, 53.0, 63.0, 78.0, 140.0, 262.0, 517.0, 5001.0, 1024641.0, 16185.0, 663.0, 288.0, 160.0, 96.0, 58.0, 40.0, 27.0, 32.0, 27.0, 10.0, 6.0, 12.0, 7.0, 12.0, 7.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01016998291015625, -0.009867310523986816, -0.009564638137817383, -0.00926196575164795, -0.008959293365478516, -0.008656620979309082, -0.008353948593139648, -0.008051276206970215, -0.007748603820800781, -0.007445931434631348, -0.007143259048461914, -0.0068405866622924805, -0.006537914276123047, -0.006235241889953613, -0.00593256950378418, -0.005629897117614746, -0.0053272247314453125, -0.005024552345275879, -0.004721879959106445, -0.004419207572937012, -0.004116535186767578, -0.0038138628005981445, -0.003511190414428711, -0.0032085180282592773, -0.0029058456420898438, -0.00260317325592041, -0.0023005008697509766, -0.001997828483581543, -0.0016951560974121094, -0.0013924837112426758, -0.0010898113250732422, -0.0007871389389038086, -0.000484466552734375, -0.0001817941665649414, 0.00012087821960449219, 0.0004235506057739258, 0.0007262229919433594, 0.001028895378112793, 0.0013315677642822266, 0.0016342401504516602, 0.0019369125366210938, 0.0022395849227905273, 0.002542257308959961, 0.0028449296951293945, 0.003147602081298828, 0.0034502744674682617, 0.0037529468536376953, 0.004055619239807129, 0.0043582916259765625, 0.004660964012145996, 0.00496363639831543, 0.005266308784484863, 0.005568981170654297, 0.0058716535568237305, 0.006174325942993164, 0.006476998329162598, 0.006779670715332031, 0.007082343101501465, 0.0073850154876708984, 0.007687687873840332, 0.007990360260009766, 0.0082930326461792, 0.008595705032348633, 0.008898377418518066, 0.0092010498046875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 26.0, 64.0, 167.0, 242.0, 266.0, 124.0, 71.0, 31.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007197977975010872, -0.0007022435311228037, -0.0006846892647445202, -0.0006671349983662367, -0.0006495807319879532, -0.0006320265238173306, -0.0006144722574390471, -0.0005969179910607636, -0.0005793637246824801, -0.0005618094583041966, -0.0005442551919259131, -0.0005267009255476296, -0.000509146717377007, -0.0004915924509987235, -0.00047403818462044, -0.0004564839182421565, -0.000438929651863873, -0.0004213753854855895, -0.000403821119107306, -0.00038626688183285296, -0.00036871261545456946, -0.00035115834907628596, -0.0003336041118018329, -0.0003160498454235494, -0.0002984955790452659, -0.0002809413126669824, -0.0002633870462886989, -0.00024583280901424587, -0.00022827854263596237, -0.00021072427625767887, -0.0001931700244313106, -0.00017561577260494232, -0.0001580614480189979, -0.0001405071816407144, -0.00012295292981434613, -0.00010539867071202025, -8.784441160969436e-05, -7.029015250736848e-05, -5.273589340504259e-05, -3.5181641578674316e-05, -1.7627375200390816e-05, -7.311609806492925e-08, 1.7481143004260957e-05, 3.5035402106586844e-05, 5.258966120891273e-05, 7.014392031123862e-05, 8.76981794135645e-05, 0.00010525243123993278, 0.00012280669761821628, 0.00014036096399649978, 0.00015791521582286805, 0.00017546946764923632, 0.00019302373402751982, 0.00021057800040580332, 0.0002281322522321716, 0.00024568650405853987, 0.00026324077043682337, 0.00028079503681510687, 0.00029834930319339037, 0.0003159035404678434, 0.0003334578068461269, 0.0003510120732244104, 0.00036856631049886346, 0.00038612057687714696, 0.00040367484325543046]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 3.0, 11.0, 4.0, 12.0, 11.0, 9.0, 18.0, 16.0, 23.0, 24.0, 22.0, 23.0, 25.0, 32.0, 40.0, 33.0, 29.0, 30.0, 35.0, 39.0, 42.0, 48.0, 42.0, 29.0, 38.0, 26.0, 38.0, 36.0, 39.0, 20.0, 19.0, 22.0, 22.0, 15.0, 20.0, 15.0, 10.0, 10.0, 13.0, 6.0, 3.0, 10.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0], "bins": [-0.00020509958267211914, -0.0001990078017115593, -0.00019291602075099945, -0.0001868242397904396, -0.00018073245882987976, -0.00017464067786931992, -0.00016854889690876007, -0.00016245711594820023, -0.00015636533498764038, -0.00015027355402708054, -0.0001441817730665207, -0.00013808999210596085, -0.000131998211145401, -0.00012590643018484116, -0.00011981464922428131, -0.00011372286826372147, -0.00010763108730316162, -0.00010153930634260178, -9.544752538204193e-05, -8.935574442148209e-05, -8.326396346092224e-05, -7.71721825003624e-05, -7.108040153980255e-05, -6.49886205792427e-05, -5.889683961868286e-05, -5.2805058658123016e-05, -4.671327769756317e-05, -4.0621496737003326e-05, -3.452971577644348e-05, -2.8437934815883636e-05, -2.234615385532379e-05, -1.6254372894763947e-05, -1.0162591934204102e-05, -4.070810973644257e-06, 2.0209699869155884e-06, 8.112750947475433e-06, 1.4204531908035278e-05, 2.0296312868595123e-05, 2.6388093829154968e-05, 3.247987478971481e-05, 3.857165575027466e-05, 4.46634367108345e-05, 5.075521767139435e-05, 5.684699863195419e-05, 6.293877959251404e-05, 6.903056055307388e-05, 7.512234151363373e-05, 8.121412247419357e-05, 8.730590343475342e-05, 9.339768439531326e-05, 9.948946535587311e-05, 0.00010558124631643295, 0.0001116730272769928, 0.00011776480823755264, 0.0001238565891981125, 0.00012994837015867233, 0.00013604015111923218, 0.00014213193207979202, 0.00014822371304035187, 0.0001543154940009117, 0.00016040727496147156, 0.0001664990559220314, 0.00017259083688259125, 0.0001786826178431511, 0.00018477439880371094]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 8.0, 13.0, 15.0, 13.0, 22.0, 16.0, 15.0, 22.0, 19.0, 24.0, 28.0, 39.0, 44.0, 24.0, 39.0, 52.0, 37.0, 62.0, 39.0, 37.0, 40.0, 37.0, 30.0, 32.0, 32.0, 22.0, 32.0, 30.0, 23.0, 27.0, 17.0, 21.0, 16.0, 19.0, 11.0, 6.0, 7.0, 9.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.57421875, -2.492279052734375, -2.41033935546875, -2.328399658203125, -2.2464599609375, -2.164520263671875, -2.08258056640625, -2.000640869140625, -1.918701171875, -1.836761474609375, -1.75482177734375, -1.672882080078125, -1.5909423828125, -1.509002685546875, -1.42706298828125, -1.345123291015625, -1.26318359375, -1.181243896484375, -1.09930419921875, -1.017364501953125, -0.9354248046875, -0.853485107421875, -0.77154541015625, -0.689605712890625, -0.607666015625, -0.525726318359375, -0.44378662109375, -0.361846923828125, -0.2799072265625, -0.197967529296875, -0.11602783203125, -0.034088134765625, 0.0478515625, 0.129791259765625, 0.21173095703125, 0.293670654296875, 0.3756103515625, 0.457550048828125, 0.53948974609375, 0.621429443359375, 0.703369140625, 0.785308837890625, 0.86724853515625, 0.949188232421875, 1.0311279296875, 1.113067626953125, 1.19500732421875, 1.276947021484375, 1.35888671875, 1.440826416015625, 1.52276611328125, 1.604705810546875, 1.6866455078125, 1.768585205078125, 1.85052490234375, 1.932464599609375, 2.014404296875, 2.096343994140625, 2.17828369140625, 2.260223388671875, 2.3421630859375, 2.424102783203125, 2.50604248046875, 2.587982177734375, 2.669921875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 12.0, 8.0, 14.0, 25.0, 44.0, 40.0, 78.0, 90.0, 158.0, 264.0, 407.0, 648.0, 1192.0, 2021.0, 3733.0, 6698.0, 13118.0, 26176.0, 55939.0, 119129.0, 228575.0, 271230.0, 165755.0, 78258.0, 36960.0, 17842.0, 8890.0, 4875.0, 2695.0, 1492.0, 881.0, 466.0, 300.0, 178.0, 137.0, 66.0, 39.0, 43.0, 25.0, 17.0, 11.0, 9.0, 3.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7216796875, -1.6647186279296875, -1.607757568359375, -1.5507965087890625, -1.49383544921875, -1.4368743896484375, -1.379913330078125, -1.3229522705078125, -1.2659912109375, -1.2090301513671875, -1.152069091796875, -1.0951080322265625, -1.03814697265625, -0.9811859130859375, -0.924224853515625, -0.8672637939453125, -0.810302734375, -0.7533416748046875, -0.696380615234375, -0.6394195556640625, -0.58245849609375, -0.5254974365234375, -0.468536376953125, -0.4115753173828125, -0.3546142578125, -0.2976531982421875, -0.240692138671875, -0.1837310791015625, -0.12677001953125, -0.0698089599609375, -0.012847900390625, 0.0441131591796875, 0.10107421875, 0.1580352783203125, 0.214996337890625, 0.2719573974609375, 0.32891845703125, 0.3858795166015625, 0.442840576171875, 0.4998016357421875, 0.5567626953125, 0.6137237548828125, 0.670684814453125, 0.7276458740234375, 0.78460693359375, 0.8415679931640625, 0.898529052734375, 0.9554901123046875, 1.012451171875, 1.0694122314453125, 1.126373291015625, 1.1833343505859375, 1.24029541015625, 1.2972564697265625, 1.354217529296875, 1.4111785888671875, 1.4681396484375, 1.5251007080078125, 1.582061767578125, 1.6390228271484375, 1.69598388671875, 1.7529449462890625, 1.809906005859375, 1.8668670654296875, 1.923828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 2.0, 5.0, 2.0, 6.0, 4.0, 14.0, 17.0, 18.0, 21.0, 28.0, 28.0, 30.0, 33.0, 47.0, 46.0, 42.0, 68.0, 82.0, 216.0, 1511.0, 260.0, 122.0, 70.0, 49.0, 43.0, 31.0, 26.0, 30.0, 38.0, 27.0, 19.0, 15.0, 13.0, 8.0, 13.0, 9.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.0, -8.715576171875, -8.43115234375, -8.146728515625, -7.8623046875, -7.577880859375, -7.29345703125, -7.009033203125, -6.724609375, -6.440185546875, -6.15576171875, -5.871337890625, -5.5869140625, -5.302490234375, -5.01806640625, -4.733642578125, -4.44921875, -4.164794921875, -3.88037109375, -3.595947265625, -3.3115234375, -3.027099609375, -2.74267578125, -2.458251953125, -2.173828125, -1.889404296875, -1.60498046875, -1.320556640625, -1.0361328125, -0.751708984375, -0.46728515625, -0.182861328125, 0.1015625, 0.385986328125, 0.67041015625, 0.954833984375, 1.2392578125, 1.523681640625, 1.80810546875, 2.092529296875, 2.376953125, 2.661376953125, 2.94580078125, 3.230224609375, 3.5146484375, 3.799072265625, 4.08349609375, 4.367919921875, 4.65234375, 4.936767578125, 5.22119140625, 5.505615234375, 5.7900390625, 6.074462890625, 6.35888671875, 6.643310546875, 6.927734375, 7.212158203125, 7.49658203125, 7.781005859375, 8.0654296875, 8.349853515625, 8.63427734375, 8.918701171875, 9.203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 11.0, 6.0, 11.0, 21.0, 13.0, 18.0, 21.0, 21.0, 28.0, 44.0, 78.0, 89.0, 133.0, 207.0, 379.0, 988.0, 7812.0, 1425322.0, 1700015.0, 8370.0, 1045.0, 373.0, 202.0, 144.0, 81.0, 78.0, 45.0, 35.0, 35.0, 17.0, 10.0, 8.0, 9.0, 4.0, 6.0, 9.0, 7.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-20.078125, -19.53564453125, -18.9931640625, -18.45068359375, -17.908203125, -17.36572265625, -16.8232421875, -16.28076171875, -15.73828125, -15.19580078125, -14.6533203125, -14.11083984375, -13.568359375, -13.02587890625, -12.4833984375, -11.94091796875, -11.3984375, -10.85595703125, -10.3134765625, -9.77099609375, -9.228515625, -8.68603515625, -8.1435546875, -7.60107421875, -7.05859375, -6.51611328125, -5.9736328125, -5.43115234375, -4.888671875, -4.34619140625, -3.8037109375, -3.26123046875, -2.71875, -2.17626953125, -1.6337890625, -1.09130859375, -0.548828125, -0.00634765625, 0.5361328125, 1.07861328125, 1.62109375, 2.16357421875, 2.7060546875, 3.24853515625, 3.791015625, 4.33349609375, 4.8759765625, 5.41845703125, 5.9609375, 6.50341796875, 7.0458984375, 7.58837890625, 8.130859375, 8.67333984375, 9.2158203125, 9.75830078125, 10.30078125, 10.84326171875, 11.3857421875, 11.92822265625, 12.470703125, 13.01318359375, 13.5556640625, 14.09814453125, 14.640625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 61.0, 572.0, 366.0, 15.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.350950241088867, -14.81060791015625, -12.270264625549316, -9.729921340942383, -7.189579010009766, -4.649236679077148, -2.108893394470215, 0.43144989013671875, 2.971792221069336, 5.512135028839111, 8.052477836608887, 10.59282112121582, 13.133163452148438, 15.673505783081055, 18.213848114013672, 20.754192352294922, 23.29453468322754, 25.834877014160156, 28.375221252441406, 30.915563583374023, 33.45590591430664, 35.996246337890625, 38.536590576171875, 41.076934814453125, 43.617279052734375, 46.157623291015625, 48.69796371459961, 51.23830795288086, 53.778648376464844, 56.318992614746094, 58.859336853027344, 61.399681091308594, 63.94001770019531, 66.48036193847656, 69.02070617675781, 71.56104278564453, 74.10138702392578, 76.64173126220703, 79.18207550048828, 81.72241973876953, 84.26275634765625, 86.8031005859375, 89.34344482421875, 91.88378143310547, 94.42412567138672, 96.96446990966797, 99.50481414794922, 102.04515838623047, 104.58550262451172, 107.12584686279297, 109.66619110107422, 112.20652770996094, 114.74687194824219, 117.28721618652344, 119.82756042480469, 122.36790466308594, 124.90824890136719, 127.44859313964844, 129.9889373779297, 132.52928161621094, 135.0696258544922, 137.60995483398438, 140.15029907226562, 142.69064331054688, 145.23098754882812]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 12.0, 6.0, 12.0, 12.0, 16.0, 15.0, 13.0, 19.0, 35.0, 27.0, 23.0, 44.0, 33.0, 35.0, 44.0, 40.0, 48.0, 41.0, 38.0, 38.0, 38.0, 47.0, 39.0, 28.0, 34.0, 42.0, 21.0, 31.0, 35.0, 19.0, 20.0, 10.0, 13.0, 10.0, 10.0, 9.0, 6.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-32.31574249267578, -31.393869400024414, -30.471996307373047, -29.55012321472168, -28.628250122070312, -27.706377029418945, -26.784503936767578, -25.86263084411621, -24.940757751464844, -24.018884658813477, -23.09701156616211, -22.175138473510742, -21.253265380859375, -20.331392288208008, -19.40951919555664, -18.487646102905273, -17.565773010253906, -16.64389991760254, -15.722026824951172, -14.800153732299805, -13.878280639648438, -12.95640754699707, -12.034534454345703, -11.112661361694336, -10.190786361694336, -9.268913269042969, -8.347040176391602, -7.425167083740234, -6.503293991088867, -5.581420421600342, -4.659547328948975, -3.7376742362976074, -2.8158016204833984, -1.8939285278320312, -0.9720553159713745, -0.05018210411071777, 0.8716909885406494, 1.7935643196105957, 2.715437412261963, 3.63731050491333, 4.559183597564697, 5.4810566902160645, 6.402929782867432, 7.324803352355957, 8.246676445007324, 9.168549537658691, 10.090422630310059, 11.012295722961426, 11.934168815612793, 12.85604190826416, 13.777915000915527, 14.699788093566895, 15.621661186218262, 16.543535232543945, 17.465408325195312, 18.38728141784668, 19.309154510498047, 20.231027603149414, 21.15290069580078, 22.07477378845215, 22.996646881103516, 23.918519973754883, 24.84039306640625, 25.762266159057617, 26.684139251708984]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 7.0, 4.0, 9.0, 10.0, 16.0, 16.0, 16.0, 15.0, 20.0, 18.0, 32.0, 32.0, 27.0, 41.0, 39.0, 30.0, 46.0, 51.0, 49.0, 45.0, 47.0, 39.0, 29.0, 33.0, 35.0, 38.0, 32.0, 33.0, 30.0, 27.0, 20.0, 24.0, 20.0, 16.0, 16.0, 11.0, 11.0, 6.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.71368408203125, -2.6226806640625, -2.53167724609375, -2.440673828125, -2.34967041015625, -2.2586669921875, -2.16766357421875, -2.07666015625, -1.98565673828125, -1.8946533203125, -1.80364990234375, -1.712646484375, -1.62164306640625, -1.5306396484375, -1.43963623046875, -1.3486328125, -1.25762939453125, -1.1666259765625, -1.07562255859375, -0.984619140625, -0.89361572265625, -0.8026123046875, -0.71160888671875, -0.62060546875, -0.52960205078125, -0.4385986328125, -0.34759521484375, -0.256591796875, -0.16558837890625, -0.0745849609375, 0.01641845703125, 0.107421875, 0.19842529296875, 0.2894287109375, 0.38043212890625, 0.471435546875, 0.56243896484375, 0.6534423828125, 0.74444580078125, 0.83544921875, 0.92645263671875, 1.0174560546875, 1.10845947265625, 1.199462890625, 1.29046630859375, 1.3814697265625, 1.47247314453125, 1.5634765625, 1.65447998046875, 1.7454833984375, 1.83648681640625, 1.927490234375, 2.01849365234375, 2.1094970703125, 2.20050048828125, 2.29150390625, 2.38250732421875, 2.4735107421875, 2.56451416015625, 2.655517578125, 2.74652099609375, 2.8375244140625, 2.92852783203125, 3.01953125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 7.0, 7.0, 8.0, 10.0, 19.0, 15.0, 22.0, 27.0, 32.0, 53.0, 69.0, 96.0, 153.0, 265.0, 636.0, 1964.0, 10765.0, 96903.0, 1266255.0, 2469257.0, 314634.0, 26891.0, 4078.0, 1030.0, 393.0, 190.0, 130.0, 89.0, 64.0, 44.0, 29.0, 30.0, 24.0, 16.0, 14.0, 13.0, 9.0, 7.0, 7.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.31640625, -7.08935546875, -6.8623046875, -6.63525390625, -6.408203125, -6.18115234375, -5.9541015625, -5.72705078125, -5.5, -5.27294921875, -5.0458984375, -4.81884765625, -4.591796875, -4.36474609375, -4.1376953125, -3.91064453125, -3.68359375, -3.45654296875, -3.2294921875, -3.00244140625, -2.775390625, -2.54833984375, -2.3212890625, -2.09423828125, -1.8671875, -1.64013671875, -1.4130859375, -1.18603515625, -0.958984375, -0.73193359375, -0.5048828125, -0.27783203125, -0.05078125, 0.17626953125, 0.4033203125, 0.63037109375, 0.857421875, 1.08447265625, 1.3115234375, 1.53857421875, 1.765625, 1.99267578125, 2.2197265625, 2.44677734375, 2.673828125, 2.90087890625, 3.1279296875, 3.35498046875, 3.58203125, 3.80908203125, 4.0361328125, 4.26318359375, 4.490234375, 4.71728515625, 4.9443359375, 5.17138671875, 5.3984375, 5.62548828125, 5.8525390625, 6.07958984375, 6.306640625, 6.53369140625, 6.7607421875, 6.98779296875, 7.21484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 14.0, 22.0, 37.0, 47.0, 51.0, 98.0, 116.0, 198.0, 233.0, 309.0, 392.0, 513.0, 475.0, 398.0, 327.0, 238.0, 162.0, 136.0, 80.0, 61.0, 50.0, 27.0, 24.0, 10.0, 7.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.1875, -8.93231201171875, -8.6771240234375, -8.42193603515625, -8.166748046875, -7.91156005859375, -7.6563720703125, -7.40118408203125, -7.14599609375, -6.89080810546875, -6.6356201171875, -6.38043212890625, -6.125244140625, -5.87005615234375, -5.6148681640625, -5.35968017578125, -5.1044921875, -4.84930419921875, -4.5941162109375, -4.33892822265625, -4.083740234375, -3.82855224609375, -3.5733642578125, -3.31817626953125, -3.06298828125, -2.80780029296875, -2.5526123046875, -2.29742431640625, -2.042236328125, -1.78704833984375, -1.5318603515625, -1.27667236328125, -1.021484375, -0.76629638671875, -0.5111083984375, -0.25592041015625, -0.000732421875, 0.25445556640625, 0.5096435546875, 0.76483154296875, 1.02001953125, 1.27520751953125, 1.5303955078125, 1.78558349609375, 2.040771484375, 2.29595947265625, 2.5511474609375, 2.80633544921875, 3.0615234375, 3.31671142578125, 3.5718994140625, 3.82708740234375, 4.082275390625, 4.33746337890625, 4.5926513671875, 4.84783935546875, 5.10302734375, 5.35821533203125, 5.6134033203125, 5.86859130859375, 6.123779296875, 6.37896728515625, 6.6341552734375, 6.88934326171875, 7.14453125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 9.0, 7.0, 12.0, 17.0, 31.0, 38.0, 47.0, 89.0, 110.0, 190.0, 358.0, 865.0, 4771.0, 289000.0, 3850190.0, 44976.0, 2104.0, 641.0, 282.0, 178.0, 124.0, 71.0, 38.0, 38.0, 38.0, 26.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.640625, -23.770751953125, -22.90087890625, -22.031005859375, -21.1611328125, -20.291259765625, -19.42138671875, -18.551513671875, -17.681640625, -16.811767578125, -15.94189453125, -15.072021484375, -14.2021484375, -13.332275390625, -12.46240234375, -11.592529296875, -10.72265625, -9.852783203125, -8.98291015625, -8.113037109375, -7.2431640625, -6.373291015625, -5.50341796875, -4.633544921875, -3.763671875, -2.893798828125, -2.02392578125, -1.154052734375, -0.2841796875, 0.585693359375, 1.45556640625, 2.325439453125, 3.1953125, 4.065185546875, 4.93505859375, 5.804931640625, 6.6748046875, 7.544677734375, 8.41455078125, 9.284423828125, 10.154296875, 11.024169921875, 11.89404296875, 12.763916015625, 13.6337890625, 14.503662109375, 15.37353515625, 16.243408203125, 17.11328125, 17.983154296875, 18.85302734375, 19.722900390625, 20.5927734375, 21.462646484375, 22.33251953125, 23.202392578125, 24.072265625, 24.942138671875, 25.81201171875, 26.681884765625, 27.5517578125, 28.421630859375, 29.29150390625, 30.161376953125, 31.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 18.0, 49.0, 214.0, 318.0, 274.0, 116.0, 21.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.165061950683594, -49.234886169433594, -46.304710388183594, -43.374534606933594, -40.444358825683594, -37.514183044433594, -34.58400344848633, -31.653827667236328, -28.723651885986328, -25.793476104736328, -22.863300323486328, -19.933122634887695, -17.002946853637695, -14.072771072387695, -11.142593383789062, -8.212417602539062, -5.2822418212890625, -2.3520655632019043, 0.5781106948852539, 3.5082874298095703, 6.43846321105957, 9.36863899230957, 12.298816680908203, 15.228992462158203, 18.159168243408203, 21.089344024658203, 24.019519805908203, 26.949697494506836, 29.879873275756836, 32.81005096435547, 35.74022674560547, 38.67040252685547, 41.60057067871094, 44.53074645996094, 47.46092224121094, 50.39109802246094, 53.32127380371094, 56.25144958496094, 59.1816291809082, 62.1118049621582, 65.04197692871094, 67.97215270996094, 70.90232849121094, 73.83250427246094, 76.76268005371094, 79.69285583496094, 82.62303161621094, 85.55320739746094, 88.48339080810547, 91.41356658935547, 94.34374237060547, 97.27391815185547, 100.20409393310547, 103.13426971435547, 106.064453125, 108.99462890625, 111.9248046875, 114.85498046875, 117.78515625, 120.71533203125, 123.6455078125, 126.57568359375, 129.505859375, 132.43603515625, 135.3662109375]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 12.0, 5.0, 12.0, 11.0, 11.0, 13.0, 14.0, 21.0, 24.0, 23.0, 30.0, 37.0, 35.0, 42.0, 27.0, 24.0, 45.0, 43.0, 40.0, 38.0, 35.0, 43.0, 38.0, 36.0, 42.0, 37.0, 34.0, 36.0, 26.0, 25.0, 16.0, 20.0, 15.0, 14.0, 16.0, 12.0, 7.0, 10.0, 6.0, 0.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.087722778320312, -24.257740020751953, -23.427757263183594, -22.597774505615234, -21.767791748046875, -20.937808990478516, -20.107826232910156, -19.277843475341797, -18.447860717773438, -17.617877960205078, -16.78789520263672, -15.95791244506836, -15.1279296875, -14.29794692993164, -13.467963218688965, -12.637980461120605, -11.80799674987793, -10.97801399230957, -10.148031234741211, -9.318048477172852, -8.488065719604492, -7.658082485198975, -6.828099250793457, -5.998116493225098, -5.168133735656738, -4.338150978088379, -3.5081679821014404, -2.678184986114502, -1.8482022285461426, -1.0182194709777832, -0.18823623657226562, 0.6417465209960938, 1.4717273712158203, 2.3017101287841797, 3.131693124771118, 3.9616761207580566, 4.791658878326416, 5.621641635894775, 6.451624870300293, 7.281607627868652, 8.111590385437012, 8.941573143005371, 9.77155590057373, 10.601539611816406, 11.431522369384766, 12.261505126953125, 13.091487884521484, 13.921470642089844, 14.751453399658203, 15.581436157226562, 16.411418914794922, 17.24140167236328, 18.07138442993164, 18.9013671875, 19.73134994506836, 20.56133270263672, 21.391315460205078, 22.221298217773438, 23.051280975341797, 23.881263732910156, 24.711246490478516, 25.541229248046875, 26.371212005615234, 27.201194763183594, 28.031179428100586]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 12.0, 9.0, 16.0, 15.0, 19.0, 17.0, 22.0, 17.0, 27.0, 31.0, 33.0, 38.0, 37.0, 39.0, 37.0, 46.0, 38.0, 40.0, 31.0, 34.0, 35.0, 44.0, 35.0, 25.0, 42.0, 29.0, 24.0, 22.0, 28.0, 32.0, 15.0, 14.0, 13.0, 16.0, 10.0, 11.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.830078125, -2.743896484375, -2.65771484375, -2.571533203125, -2.4853515625, -2.399169921875, -2.31298828125, -2.226806640625, -2.140625, -2.054443359375, -1.96826171875, -1.882080078125, -1.7958984375, -1.709716796875, -1.62353515625, -1.537353515625, -1.451171875, -1.364990234375, -1.27880859375, -1.192626953125, -1.1064453125, -1.020263671875, -0.93408203125, -0.847900390625, -0.76171875, -0.675537109375, -0.58935546875, -0.503173828125, -0.4169921875, -0.330810546875, -0.24462890625, -0.158447265625, -0.072265625, 0.013916015625, 0.10009765625, 0.186279296875, 0.2724609375, 0.358642578125, 0.44482421875, 0.531005859375, 0.6171875, 0.703369140625, 0.78955078125, 0.875732421875, 0.9619140625, 1.048095703125, 1.13427734375, 1.220458984375, 1.306640625, 1.392822265625, 1.47900390625, 1.565185546875, 1.6513671875, 1.737548828125, 1.82373046875, 1.909912109375, 1.99609375, 2.082275390625, 2.16845703125, 2.254638671875, 2.3408203125, 2.427001953125, 2.51318359375, 2.599365234375, 2.685546875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 8.0, 7.0, 3.0, 17.0, 28.0, 34.0, 44.0, 66.0, 97.0, 133.0, 195.0, 303.0, 396.0, 545.0, 846.0, 1213.0, 1811.0, 2469.0, 3681.0, 5271.0, 7839.0, 11418.0, 16695.0, 25121.0, 37884.0, 58619.0, 96140.0, 196925.0, 270959.0, 113106.0, 66394.0, 42791.0, 28187.0, 18756.0, 12756.0, 8608.0, 5998.0, 4116.0, 2735.0, 1961.0, 1371.0, 902.0, 621.0, 443.0, 344.0, 213.0, 157.0, 103.0, 71.0, 56.0, 33.0, 28.0, 28.0, 4.0, 3.0, 10.0, 5.0, 0.0, 1.0, 3.0], "bins": [-0.5595703125, -0.5421600341796875, -0.524749755859375, -0.5073394775390625, -0.48992919921875, -0.4725189208984375, -0.455108642578125, -0.4376983642578125, -0.4202880859375, -0.4028778076171875, -0.385467529296875, -0.3680572509765625, -0.35064697265625, -0.3332366943359375, -0.315826416015625, -0.2984161376953125, -0.281005859375, -0.2635955810546875, -0.246185302734375, -0.2287750244140625, -0.21136474609375, -0.1939544677734375, -0.176544189453125, -0.1591339111328125, -0.1417236328125, -0.1243133544921875, -0.106903076171875, -0.0894927978515625, -0.07208251953125, -0.0546722412109375, -0.037261962890625, -0.0198516845703125, -0.00244140625, 0.0149688720703125, 0.032379150390625, 0.0497894287109375, 0.06719970703125, 0.0846099853515625, 0.102020263671875, 0.1194305419921875, 0.1368408203125, 0.1542510986328125, 0.171661376953125, 0.1890716552734375, 0.20648193359375, 0.2238922119140625, 0.241302490234375, 0.2587127685546875, 0.276123046875, 0.2935333251953125, 0.310943603515625, 0.3283538818359375, 0.34576416015625, 0.3631744384765625, 0.380584716796875, 0.3979949951171875, 0.4154052734375, 0.4328155517578125, 0.450225830078125, 0.4676361083984375, 0.48504638671875, 0.5024566650390625, 0.519866943359375, 0.5372772216796875, 0.5546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 6.0, 4.0, 3.0, 3.0, 8.0, 11.0, 8.0, 11.0, 11.0, 16.0, 19.0, 22.0, 30.0, 27.0, 34.0, 20.0, 39.0, 39.0, 42.0, 36.0, 32.0, 41.0, 1060.0, 44.0, 47.0, 43.0, 32.0, 46.0, 36.0, 34.0, 36.0, 21.0, 28.0, 20.0, 12.0, 22.0, 13.0, 17.0, 12.0, 13.0, 4.0, 3.0, 5.0, 9.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7734375, -1.7177734375, -1.662109375, -1.6064453125, -1.55078125, -1.4951171875, -1.439453125, -1.3837890625, -1.328125, -1.2724609375, -1.216796875, -1.1611328125, -1.10546875, -1.0498046875, -0.994140625, -0.9384765625, -0.8828125, -0.8271484375, -0.771484375, -0.7158203125, -0.66015625, -0.6044921875, -0.548828125, -0.4931640625, -0.4375, -0.3818359375, -0.326171875, -0.2705078125, -0.21484375, -0.1591796875, -0.103515625, -0.0478515625, 0.0078125, 0.0634765625, 0.119140625, 0.1748046875, 0.23046875, 0.2861328125, 0.341796875, 0.3974609375, 0.453125, 0.5087890625, 0.564453125, 0.6201171875, 0.67578125, 0.7314453125, 0.787109375, 0.8427734375, 0.8984375, 0.9541015625, 1.009765625, 1.0654296875, 1.12109375, 1.1767578125, 1.232421875, 1.2880859375, 1.34375, 1.3994140625, 1.455078125, 1.5107421875, 1.56640625, 1.6220703125, 1.677734375, 1.7333984375, 1.7890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 12.0, 13.0, 21.0, 34.0, 37.0, 52.0, 105.0, 142.0, 202.0, 325.0, 496.0, 807.0, 1201.0, 1941.0, 3006.0, 4931.0, 8063.0, 13758.0, 23804.0, 41822.0, 78372.0, 161328.0, 1427507.0, 155259.0, 75846.0, 40866.0, 22806.0, 13284.0, 7933.0, 4967.0, 2932.0, 1861.0, 1210.0, 736.0, 507.0, 319.0, 212.0, 119.0, 105.0, 73.0, 31.0, 29.0, 21.0, 13.0, 9.0, 3.0, 4.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7273788452148438, -0.7042694091796875, -0.6811599731445312, -0.658050537109375, -0.6349411010742188, -0.6118316650390625, -0.5887222290039062, -0.56561279296875, -0.5425033569335938, -0.5193939208984375, -0.49628448486328125, -0.473175048828125, -0.45006561279296875, -0.4269561767578125, -0.40384674072265625, -0.3807373046875, -0.35762786865234375, -0.3345184326171875, -0.31140899658203125, -0.288299560546875, -0.26519012451171875, -0.2420806884765625, -0.21897125244140625, -0.19586181640625, -0.17275238037109375, -0.1496429443359375, -0.12653350830078125, -0.103424072265625, -0.08031463623046875, -0.0572052001953125, -0.03409576416015625, -0.010986328125, 0.01212310791015625, 0.0352325439453125, 0.05834197998046875, 0.081451416015625, 0.10456085205078125, 0.1276702880859375, 0.15077972412109375, 0.17388916015625, 0.19699859619140625, 0.2201080322265625, 0.24321746826171875, 0.266326904296875, 0.28943634033203125, 0.3125457763671875, 0.33565521240234375, 0.3587646484375, 0.38187408447265625, 0.4049835205078125, 0.42809295654296875, 0.451202392578125, 0.47431182861328125, 0.4974212646484375, 0.5205307006835938, 0.54364013671875, 0.5667495727539062, 0.5898590087890625, 0.6129684448242188, 0.636077880859375, 0.6591873168945312, 0.6822967529296875, 0.7054061889648438, 0.728515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 6.0, 16.0, 12.0, 15.0, 20.0, 26.0, 29.0, 43.0, 48.0, 75.0, 73.0, 101.0, 111.0, 96.0, 75.0, 60.0, 27.0, 30.0, 18.0, 15.0, 12.0, 13.0, 9.0, 7.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006213188171386719, -0.0006041377782821655, -0.0005869567394256592, -0.0005697757005691528, -0.0005525946617126465, -0.0005354136228561401, -0.0005182325839996338, -0.0005010515451431274, -0.0004838705062866211, -0.00046668946743011475, -0.0004495084285736084, -0.00043232738971710205, -0.0004151463508605957, -0.00039796531200408936, -0.000380784273147583, -0.00036360323429107666, -0.0003464221954345703, -0.00032924115657806396, -0.0003120601177215576, -0.00029487907886505127, -0.0002776980400085449, -0.0002605170011520386, -0.00024333596229553223, -0.00022615492343902588, -0.00020897388458251953, -0.00019179284572601318, -0.00017461180686950684, -0.0001574307680130005, -0.00014024972915649414, -0.0001230686902999878, -0.00010588765144348145, -8.87066125869751e-05, -7.152557373046875e-05, -5.43445348739624e-05, -3.7163496017456055e-05, -1.9982457160949707e-05, -2.8014183044433594e-06, 1.4379620552062988e-05, 3.1560659408569336e-05, 4.8741698265075684e-05, 6.592273712158203e-05, 8.310377597808838e-05, 0.00010028481483459473, 0.00011746585369110107, 0.00013464689254760742, 0.00015182793140411377, 0.00016900897026062012, 0.00018619000911712646, 0.0002033710479736328, 0.00022055208683013916, 0.0002377331256866455, 0.00025491416454315186, 0.0002720952033996582, 0.00028927624225616455, 0.0003064572811126709, 0.00032363831996917725, 0.0003408193588256836, 0.00035800039768218994, 0.0003751814365386963, 0.00039236247539520264, 0.000409543514251709, 0.00042672455310821533, 0.0004439055919647217, 0.00046108663082122803, 0.0004782676696777344]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 9.0, 8.0, 9.0, 11.0, 19.0, 24.0, 30.0, 53.0, 60.0, 97.0, 136.0, 260.0, 463.0, 1822.0, 938278.0, 105300.0, 962.0, 377.0, 167.0, 141.0, 88.0, 64.0, 35.0, 25.0, 19.0, 20.0, 17.0, 8.0, 7.0, 6.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0084686279296875, -0.008113622665405273, -0.007758617401123047, -0.00740361213684082, -0.007048606872558594, -0.006693601608276367, -0.006338596343994141, -0.005983591079711914, -0.0056285858154296875, -0.005273580551147461, -0.004918575286865234, -0.004563570022583008, -0.004208564758300781, -0.0038535594940185547, -0.003498554229736328, -0.0031435489654541016, -0.002788543701171875, -0.0024335384368896484, -0.002078533172607422, -0.0017235279083251953, -0.0013685226440429688, -0.0010135173797607422, -0.0006585121154785156, -0.00030350685119628906, 5.14984130859375e-05, 0.00040650367736816406, 0.0007615089416503906, 0.0011165142059326172, 0.0014715194702148438, 0.0018265247344970703, 0.002181529998779297, 0.0025365352630615234, 0.00289154052734375, 0.0032465457916259766, 0.003601551055908203, 0.00395655632019043, 0.004311561584472656, 0.004666566848754883, 0.005021572113037109, 0.005376577377319336, 0.0057315826416015625, 0.006086587905883789, 0.006441593170166016, 0.006796598434448242, 0.007151603698730469, 0.007506608963012695, 0.007861614227294922, 0.008216619491577148, 0.008571624755859375, 0.008926630020141602, 0.009281635284423828, 0.009636640548706055, 0.009991645812988281, 0.010346651077270508, 0.010701656341552734, 0.011056661605834961, 0.011411666870117188, 0.011766672134399414, 0.01212167739868164, 0.012476682662963867, 0.012831687927246094, 0.01318669319152832, 0.013541698455810547, 0.013896703720092773, 0.014251708984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [7.0, 28.0, 124.0, 330.0, 326.0, 151.0, 35.0, 11.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001202230341732502, -9.109482925850898e-05, -6.196661706781015e-05, -3.2838404877111316e-05, -3.7101999623700976e-06, 2.541800495237112e-05, 5.454622441902757e-05, 8.367442933376878e-05, 0.00011280263424851, 0.00014193083916325122, 0.00017105904407799244, 0.00020018726354464889, 0.0002293154684593901, 0.0002584436733741313, 0.00028757189284078777, 0.00031670008320361376, 0.0003458283026702702, 0.00037495652213692665, 0.00040408471249975264, 0.0004332129319664091, 0.0004623411223292351, 0.0004914693417958915, 0.000520597561262548, 0.0005497257807292044, 0.0005788540001958609, 0.0006079822196625173, 0.0006371104391291738, 0.0006662386003881693, 0.0006953668198548257, 0.0007244950393214822, 0.0007536232587881386, 0.0007827514782547951, 0.0008118796395137906, 0.000841007858980447, 0.0008701360784471035, 0.000899264239706099, 0.0009283924591727555, 0.0009575206786394119, 0.0009866489563137293, 0.0010157771175727248, 0.0010449052788317204, 0.0010740334400907159, 0.0011031617177650332, 0.0011322898790240288, 0.0011614181566983461, 0.0011905463179573417, 0.0012196744792163372, 0.0012488027568906546, 0.001277931034564972, 0.0013070591958239675, 0.0013361874734982848, 0.0013653156347572803, 0.0013944439124315977, 0.0014235720736905932, 0.0014527002349495888, 0.0014818285126239061, 0.0015109566738829017, 0.0015400848351418972, 0.0015692131128162146, 0.00159834127407521, 0.0016274695517495275, 0.001656597713008523, 0.0016857259906828403, 0.0017148541519418359, 0.0017439823132008314]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 4.0, 9.0, 17.0, 17.0, 24.0, 27.0, 25.0, 24.0, 31.0, 31.0, 33.0, 41.0, 37.0, 40.0, 38.0, 42.0, 42.0, 35.0, 39.0, 40.0, 33.0, 40.0, 46.0, 21.0, 36.0, 28.0, 23.0, 26.0, 24.0, 20.0, 21.0, 13.0, 9.0, 12.0, 12.0, 5.0, 3.0, 9.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022232532501220703, -0.000214453786611557, -0.00020658224821090698, -0.00019871070981025696, -0.00019083917140960693, -0.0001829676330089569, -0.00017509609460830688, -0.00016722455620765686, -0.00015935301780700684, -0.0001514814794063568, -0.0001436099410057068, -0.00013573840260505676, -0.00012786686420440674, -0.00011999532580375671, -0.00011212378740310669, -0.00010425224900245667, -9.638071060180664e-05, -8.850917220115662e-05, -8.063763380050659e-05, -7.276609539985657e-05, -6.489455699920654e-05, -5.702301859855652e-05, -4.9151480197906494e-05, -4.127994179725647e-05, -3.3408403396606445e-05, -2.553686499595642e-05, -1.7665326595306396e-05, -9.793788194656372e-06, -1.9222497940063477e-06, 5.949288606643677e-06, 1.3820827007293701e-05, 2.1692365407943726e-05, 2.956390380859375e-05, 3.7435442209243774e-05, 4.53069806098938e-05, 5.317851901054382e-05, 6.105005741119385e-05, 6.892159581184387e-05, 7.67931342124939e-05, 8.466467261314392e-05, 9.253621101379395e-05, 0.00010040774941444397, 0.000108279287815094, 0.00011615082621574402, 0.00012402236461639404, 0.00013189390301704407, 0.0001397654414176941, 0.00014763697981834412, 0.00015550851821899414, 0.00016338005661964417, 0.0001712515950202942, 0.00017912313342094421, 0.00018699467182159424, 0.00019486621022224426, 0.0002027377486228943, 0.0002106092870235443, 0.00021848082542419434, 0.00022635236382484436, 0.00023422390222549438, 0.0002420954406261444, 0.00024996697902679443, 0.00025783851742744446, 0.0002657100558280945, 0.0002735815942287445, 0.00028145313262939453]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 12.0, 9.0, 16.0, 15.0, 19.0, 17.0, 22.0, 17.0, 27.0, 31.0, 33.0, 38.0, 37.0, 39.0, 37.0, 46.0, 38.0, 40.0, 31.0, 34.0, 35.0, 44.0, 35.0, 25.0, 42.0, 29.0, 24.0, 22.0, 28.0, 32.0, 15.0, 14.0, 13.0, 16.0, 10.0, 11.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.830078125, -2.743896484375, -2.65771484375, -2.571533203125, -2.4853515625, -2.399169921875, -2.31298828125, -2.226806640625, -2.140625, -2.054443359375, -1.96826171875, -1.882080078125, -1.7958984375, -1.709716796875, -1.62353515625, -1.537353515625, -1.451171875, -1.364990234375, -1.27880859375, -1.192626953125, -1.1064453125, -1.020263671875, -0.93408203125, -0.847900390625, -0.76171875, -0.675537109375, -0.58935546875, -0.503173828125, -0.4169921875, -0.330810546875, -0.24462890625, -0.158447265625, -0.072265625, 0.013916015625, 0.10009765625, 0.186279296875, 0.2724609375, 0.358642578125, 0.44482421875, 0.531005859375, 0.6171875, 0.703369140625, 0.78955078125, 0.875732421875, 0.9619140625, 1.048095703125, 1.13427734375, 1.220458984375, 1.306640625, 1.392822265625, 1.47900390625, 1.565185546875, 1.6513671875, 1.737548828125, 1.82373046875, 1.909912109375, 1.99609375, 2.082275390625, 2.16845703125, 2.254638671875, 2.3408203125, 2.427001953125, 2.51318359375, 2.599365234375, 2.685546875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 16.0, 20.0, 28.0, 20.0, 32.0, 33.0, 56.0, 93.0, 92.0, 162.0, 223.0, 297.0, 415.0, 656.0, 939.0, 1463.0, 2226.0, 3626.0, 5719.0, 9814.0, 18245.0, 37966.0, 94326.0, 277997.0, 364290.0, 128822.0, 48371.0, 22379.0, 11662.0, 6767.0, 4065.0, 2595.0, 1617.0, 1125.0, 710.0, 488.0, 353.0, 223.0, 169.0, 122.0, 83.0, 70.0, 54.0, 40.0, 30.0, 19.0, 15.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.994140625, -2.90380859375, -2.8134765625, -2.72314453125, -2.6328125, -2.54248046875, -2.4521484375, -2.36181640625, -2.271484375, -2.18115234375, -2.0908203125, -2.00048828125, -1.91015625, -1.81982421875, -1.7294921875, -1.63916015625, -1.548828125, -1.45849609375, -1.3681640625, -1.27783203125, -1.1875, -1.09716796875, -1.0068359375, -0.91650390625, -0.826171875, -0.73583984375, -0.6455078125, -0.55517578125, -0.46484375, -0.37451171875, -0.2841796875, -0.19384765625, -0.103515625, -0.01318359375, 0.0771484375, 0.16748046875, 0.2578125, 0.34814453125, 0.4384765625, 0.52880859375, 0.619140625, 0.70947265625, 0.7998046875, 0.89013671875, 0.98046875, 1.07080078125, 1.1611328125, 1.25146484375, 1.341796875, 1.43212890625, 1.5224609375, 1.61279296875, 1.703125, 1.79345703125, 1.8837890625, 1.97412109375, 2.064453125, 2.15478515625, 2.2451171875, 2.33544921875, 2.42578125, 2.51611328125, 2.6064453125, 2.69677734375, 2.787109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 8.0, 5.0, 6.0, 10.0, 16.0, 21.0, 19.0, 23.0, 32.0, 32.0, 23.0, 45.0, 42.0, 50.0, 52.0, 68.0, 146.0, 1469.0, 409.0, 129.0, 75.0, 60.0, 30.0, 44.0, 32.0, 30.0, 25.0, 29.0, 17.0, 27.0, 13.0, 12.0, 10.0, 9.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.046875, -10.701416015625, -10.35595703125, -10.010498046875, -9.6650390625, -9.319580078125, -8.97412109375, -8.628662109375, -8.283203125, -7.937744140625, -7.59228515625, -7.246826171875, -6.9013671875, -6.555908203125, -6.21044921875, -5.864990234375, -5.51953125, -5.174072265625, -4.82861328125, -4.483154296875, -4.1376953125, -3.792236328125, -3.44677734375, -3.101318359375, -2.755859375, -2.410400390625, -2.06494140625, -1.719482421875, -1.3740234375, -1.028564453125, -0.68310546875, -0.337646484375, 0.0078125, 0.353271484375, 0.69873046875, 1.044189453125, 1.3896484375, 1.735107421875, 2.08056640625, 2.426025390625, 2.771484375, 3.116943359375, 3.46240234375, 3.807861328125, 4.1533203125, 4.498779296875, 4.84423828125, 5.189697265625, 5.53515625, 5.880615234375, 6.22607421875, 6.571533203125, 6.9169921875, 7.262451171875, 7.60791015625, 7.953369140625, 8.298828125, 8.644287109375, 8.98974609375, 9.335205078125, 9.6806640625, 10.026123046875, 10.37158203125, 10.717041015625, 11.0625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 8.0, 14.0, 6.0, 20.0, 21.0, 29.0, 32.0, 43.0, 52.0, 68.0, 116.0, 158.0, 288.0, 525.0, 2394.0, 49436.0, 3032185.0, 56192.0, 2631.0, 528.0, 306.0, 192.0, 103.0, 74.0, 48.0, 47.0, 36.0, 18.0, 26.0, 15.0, 22.0, 10.0, 12.0, 6.0, 3.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.84375, -22.118896484375, -21.39404296875, -20.669189453125, -19.9443359375, -19.219482421875, -18.49462890625, -17.769775390625, -17.044921875, -16.320068359375, -15.59521484375, -14.870361328125, -14.1455078125, -13.420654296875, -12.69580078125, -11.970947265625, -11.24609375, -10.521240234375, -9.79638671875, -9.071533203125, -8.3466796875, -7.621826171875, -6.89697265625, -6.172119140625, -5.447265625, -4.722412109375, -3.99755859375, -3.272705078125, -2.5478515625, -1.822998046875, -1.09814453125, -0.373291015625, 0.3515625, 1.076416015625, 1.80126953125, 2.526123046875, 3.2509765625, 3.975830078125, 4.70068359375, 5.425537109375, 6.150390625, 6.875244140625, 7.60009765625, 8.324951171875, 9.0498046875, 9.774658203125, 10.49951171875, 11.224365234375, 11.94921875, 12.674072265625, 13.39892578125, 14.123779296875, 14.8486328125, 15.573486328125, 16.29833984375, 17.023193359375, 17.748046875, 18.472900390625, 19.19775390625, 19.922607421875, 20.6474609375, 21.372314453125, 22.09716796875, 22.822021484375, 23.546875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 463.0, 536.0, 7.0, 1.0, 1.0], "bins": [-290.40313720703125, -285.5629577636719, -280.7227478027344, -275.882568359375, -271.0423889160156, -266.2021789550781, -261.36199951171875, -256.5218200683594, -251.68161010742188, -246.84141540527344, -242.00123596191406, -237.16104125976562, -232.3208465576172, -227.48065185546875, -222.64047241210938, -217.80027770996094, -212.96009826660156, -208.11990356445312, -203.27972412109375, -198.4395294189453, -193.59933471679688, -188.7591552734375, -183.91896057128906, -179.07876586914062, -174.23858642578125, -169.3983917236328, -164.55821228027344, -159.718017578125, -154.87782287597656, -150.03762817382812, -145.19744873046875, -140.3572540283203, -135.51705932617188, -130.67686462402344, -125.83667755126953, -120.99649047851562, -116.15629577636719, -111.31610870361328, -106.47592163085938, -101.63572692871094, -96.79553985595703, -91.95535278320312, -87.11515808105469, -82.27497100830078, -77.43478393554688, -72.59458923339844, -67.75440216064453, -62.91421127319336, -58.07402038574219, -53.233829498291016, -48.393638610839844, -43.55345153808594, -38.713260650634766, -33.873069763183594, -29.032880783081055, -24.192691802978516, -19.35249900817871, -14.512309074401855, -9.672119140625, -4.8319292068481445, 0.008260726928710938, 4.848451614379883, 9.688640594482422, 14.528829574584961, 19.369020462036133]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 6.0, 8.0, 9.0, 13.0, 8.0, 20.0, 20.0, 26.0, 27.0, 45.0, 39.0, 29.0, 50.0, 39.0, 45.0, 51.0, 43.0, 60.0, 49.0, 40.0, 44.0, 41.0, 38.0, 22.0, 38.0, 31.0, 36.0, 23.0, 15.0, 20.0, 7.0, 9.0, 8.0, 5.0, 3.0, 11.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.334327697753906, -37.260040283203125, -36.18574905395508, -35.1114616394043, -34.03717041015625, -32.96288299560547, -31.888593673706055, -30.81430435180664, -29.740015029907227, -28.665725708007812, -27.5914363861084, -26.517147064208984, -25.442859649658203, -24.368568420410156, -23.294281005859375, -22.21999168395996, -21.145702362060547, -20.071413040161133, -18.99712371826172, -17.922834396362305, -16.84854507446289, -15.774256706237793, -14.699968338012695, -13.625679016113281, -12.551389694213867, -11.477100372314453, -10.402811050415039, -9.328522682189941, -8.254233360290527, -7.179944038391113, -6.105655193328857, -5.031366348266602, -3.957080841064453, -2.882791757583618, -1.8085026741027832, -0.7342135906219482, 0.3400754928588867, 1.4143648147583008, 2.4886536598205566, 3.5629425048828125, 4.637231826782227, 5.711521148681641, 6.7858099937438965, 7.860098838806152, 8.934388160705566, 10.00867748260498, 11.082965850830078, 12.157255172729492, 13.231544494628906, 14.30583381652832, 15.380123138427734, 16.45441246032715, 17.528701782226562, 18.602989196777344, 19.677278518676758, 20.751567840576172, 21.825857162475586, 22.900146484375, 23.974435806274414, 25.048725128173828, 26.12301254272461, 27.197303771972656, 28.271591186523438, 29.34588050842285, 30.420169830322266]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 10.0, 7.0, 5.0, 7.0, 10.0, 19.0, 17.0, 14.0, 20.0, 24.0, 20.0, 35.0, 25.0, 34.0, 39.0, 31.0, 30.0, 42.0, 31.0, 34.0, 44.0, 43.0, 34.0, 39.0, 37.0, 31.0, 25.0, 32.0, 24.0, 28.0, 27.0, 26.0, 25.0, 19.0, 19.0, 16.0, 11.0, 12.0, 7.0, 19.0, 5.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.703125, -2.6162109375, -2.529296875, -2.4423828125, -2.35546875, -2.2685546875, -2.181640625, -2.0947265625, -2.0078125, -1.9208984375, -1.833984375, -1.7470703125, -1.66015625, -1.5732421875, -1.486328125, -1.3994140625, -1.3125, -1.2255859375, -1.138671875, -1.0517578125, -0.96484375, -0.8779296875, -0.791015625, -0.7041015625, -0.6171875, -0.5302734375, -0.443359375, -0.3564453125, -0.26953125, -0.1826171875, -0.095703125, -0.0087890625, 0.078125, 0.1650390625, 0.251953125, 0.3388671875, 0.42578125, 0.5126953125, 0.599609375, 0.6865234375, 0.7734375, 0.8603515625, 0.947265625, 1.0341796875, 1.12109375, 1.2080078125, 1.294921875, 1.3818359375, 1.46875, 1.5556640625, 1.642578125, 1.7294921875, 1.81640625, 1.9033203125, 1.990234375, 2.0771484375, 2.1640625, 2.2509765625, 2.337890625, 2.4248046875, 2.51171875, 2.5986328125, 2.685546875, 2.7724609375, 2.859375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 7.0, 12.0, 13.0, 16.0, 31.0, 40.0, 50.0, 76.0, 78.0, 114.0, 231.0, 368.0, 663.0, 1323.0, 2771.0, 6800.0, 19035.0, 61547.0, 222037.0, 726538.0, 1419166.0, 1142020.0, 421663.0, 115642.0, 33772.0, 11477.0, 4496.0, 1947.0, 903.0, 520.0, 285.0, 188.0, 127.0, 90.0, 59.0, 47.0, 26.0, 22.0, 19.0, 14.0, 12.0, 11.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.58203125, -3.46923828125, -3.3564453125, -3.24365234375, -3.130859375, -3.01806640625, -2.9052734375, -2.79248046875, -2.6796875, -2.56689453125, -2.4541015625, -2.34130859375, -2.228515625, -2.11572265625, -2.0029296875, -1.89013671875, -1.77734375, -1.66455078125, -1.5517578125, -1.43896484375, -1.326171875, -1.21337890625, -1.1005859375, -0.98779296875, -0.875, -0.76220703125, -0.6494140625, -0.53662109375, -0.423828125, -0.31103515625, -0.1982421875, -0.08544921875, 0.02734375, 0.14013671875, 0.2529296875, 0.36572265625, 0.478515625, 0.59130859375, 0.7041015625, 0.81689453125, 0.9296875, 1.04248046875, 1.1552734375, 1.26806640625, 1.380859375, 1.49365234375, 1.6064453125, 1.71923828125, 1.83203125, 1.94482421875, 2.0576171875, 2.17041015625, 2.283203125, 2.39599609375, 2.5087890625, 2.62158203125, 2.734375, 2.84716796875, 2.9599609375, 3.07275390625, 3.185546875, 3.29833984375, 3.4111328125, 3.52392578125, 3.63671875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 16.0, 27.0, 46.0, 69.0, 108.0, 125.0, 183.0, 283.0, 388.0, 532.0, 582.0, 504.0, 403.0, 259.0, 168.0, 137.0, 68.0, 61.0, 33.0, 19.0, 16.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-13.625, -13.310302734375, -12.99560546875, -12.680908203125, -12.3662109375, -12.051513671875, -11.73681640625, -11.422119140625, -11.107421875, -10.792724609375, -10.47802734375, -10.163330078125, -9.8486328125, -9.533935546875, -9.21923828125, -8.904541015625, -8.58984375, -8.275146484375, -7.96044921875, -7.645751953125, -7.3310546875, -7.016357421875, -6.70166015625, -6.386962890625, -6.072265625, -5.757568359375, -5.44287109375, -5.128173828125, -4.8134765625, -4.498779296875, -4.18408203125, -3.869384765625, -3.5546875, -3.239990234375, -2.92529296875, -2.610595703125, -2.2958984375, -1.981201171875, -1.66650390625, -1.351806640625, -1.037109375, -0.722412109375, -0.40771484375, -0.093017578125, 0.2216796875, 0.536376953125, 0.85107421875, 1.165771484375, 1.48046875, 1.795166015625, 2.10986328125, 2.424560546875, 2.7392578125, 3.053955078125, 3.36865234375, 3.683349609375, 3.998046875, 4.312744140625, 4.62744140625, 4.942138671875, 5.2568359375, 5.571533203125, 5.88623046875, 6.200927734375, 6.515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 11.0, 10.0, 26.0, 19.0, 42.0, 52.0, 76.0, 120.0, 202.0, 434.0, 1636.0, 39143.0, 3930409.0, 217936.0, 2880.0, 600.0, 255.0, 149.0, 83.0, 49.0, 37.0, 24.0, 21.0, 22.0, 15.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -24.979248046875, -24.00537109375, -23.031494140625, -22.0576171875, -21.083740234375, -20.10986328125, -19.135986328125, -18.162109375, -17.188232421875, -16.21435546875, -15.240478515625, -14.2666015625, -13.292724609375, -12.31884765625, -11.344970703125, -10.37109375, -9.397216796875, -8.42333984375, -7.449462890625, -6.4755859375, -5.501708984375, -4.52783203125, -3.553955078125, -2.580078125, -1.606201171875, -0.63232421875, 0.341552734375, 1.3154296875, 2.289306640625, 3.26318359375, 4.237060546875, 5.2109375, 6.184814453125, 7.15869140625, 8.132568359375, 9.1064453125, 10.080322265625, 11.05419921875, 12.028076171875, 13.001953125, 13.975830078125, 14.94970703125, 15.923583984375, 16.8974609375, 17.871337890625, 18.84521484375, 19.819091796875, 20.79296875, 21.766845703125, 22.74072265625, 23.714599609375, 24.6884765625, 25.662353515625, 26.63623046875, 27.610107421875, 28.583984375, 29.557861328125, 30.53173828125, 31.505615234375, 32.4794921875, 33.453369140625, 34.42724609375, 35.401123046875, 36.375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 11.0, 17.0, 21.0, 42.0, 60.0, 96.0, 117.0, 124.0, 150.0, 103.0, 91.0, 64.0, 50.0, 28.0, 16.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.13124084472656, -41.021175384521484, -39.911109924316406, -38.80104446411133, -37.69097900390625, -36.580909729003906, -35.47084426879883, -34.36077880859375, -33.25071334838867, -32.140647888183594, -31.030582427978516, -29.920515060424805, -28.810449600219727, -27.70038414001465, -26.590316772460938, -25.48025131225586, -24.37018585205078, -23.260120391845703, -22.150054931640625, -21.039987564086914, -19.929922103881836, -18.819856643676758, -17.709789276123047, -16.59972381591797, -15.48965835571289, -14.379592895507812, -13.269526481628418, -12.159460067749023, -11.049394607543945, -9.939329147338867, -8.829262733459473, -7.719196796417236, -6.609128952026367, -5.499063014984131, -4.3889970779418945, -3.278931140899658, -2.168865203857422, -1.0587992668151855, 0.05126667022705078, 1.161332607269287, 2.2713985443115234, 3.3814644813537598, 4.491530418395996, 5.601596355438232, 6.711662292480469, 7.821728229522705, 8.931794166564941, 10.041860580444336, 11.151926040649414, 12.261991500854492, 13.372057914733887, 14.482124328613281, 15.59218978881836, 16.702255249023438, 17.812320709228516, 18.922388076782227, 20.032453536987305, 21.142518997192383, 22.252586364746094, 23.362651824951172, 24.47271728515625, 25.582782745361328, 26.692848205566406, 27.802915573120117, 28.912981033325195]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 11.0, 9.0, 9.0, 12.0, 17.0, 8.0, 17.0, 20.0, 31.0, 25.0, 26.0, 36.0, 32.0, 38.0, 44.0, 35.0, 39.0, 40.0, 47.0, 31.0, 40.0, 33.0, 36.0, 36.0, 41.0, 28.0, 34.0, 27.0, 26.0, 27.0, 15.0, 21.0, 6.0, 17.0, 13.0, 13.0, 7.0, 7.0, 4.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.80202865600586, -21.04667854309082, -20.29132843017578, -19.535980224609375, -18.780630111694336, -18.025279998779297, -17.269929885864258, -16.51457977294922, -15.759230613708496, -15.003880500793457, -14.248531341552734, -13.493181228637695, -12.737831115722656, -11.982481956481934, -11.227131843566895, -10.471782684326172, -9.716432571411133, -8.961082458496094, -8.205733299255371, -7.450383186340332, -6.695033550262451, -5.93968391418457, -5.184333801269531, -4.42898416519165, -3.6736345291137695, -2.9182848930358887, -2.1629350185394287, -1.4075851440429688, -0.6522355079650879, 0.10311412811279297, 0.858464241027832, 1.613813877105713, 2.3691654205322266, 3.1245150566101074, 3.8798649311065674, 4.635214805603027, 5.390564441680908, 6.145914077758789, 6.901264190673828, 7.656613826751709, 8.41196346282959, 9.167313575744629, 9.922662734985352, 10.67801284790039, 11.43336296081543, 12.188712120056152, 12.944062232971191, 13.699411392211914, 14.454761505126953, 15.210111618041992, 15.965460777282715, 16.720809936523438, 17.476160049438477, 18.231510162353516, 18.986860275268555, 19.742210388183594, 20.49755859375, 21.25290870666504, 22.008258819580078, 22.763607025146484, 23.518957138061523, 24.274307250976562, 25.0296573638916, 25.78500747680664, 26.54035758972168]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 8.0, 5.0, 10.0, 11.0, 15.0, 21.0, 22.0, 16.0, 21.0, 32.0, 34.0, 26.0, 36.0, 34.0, 29.0, 33.0, 37.0, 36.0, 40.0, 45.0, 44.0, 37.0, 37.0, 32.0, 38.0, 33.0, 30.0, 25.0, 28.0, 21.0, 21.0, 15.0, 14.0, 23.0, 23.0, 9.0, 11.0, 11.0, 5.0, 8.0, 5.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.869140625, -2.7779541015625, -2.686767578125, -2.5955810546875, -2.50439453125, -2.4132080078125, -2.322021484375, -2.2308349609375, -2.1396484375, -2.0484619140625, -1.957275390625, -1.8660888671875, -1.77490234375, -1.6837158203125, -1.592529296875, -1.5013427734375, -1.41015625, -1.3189697265625, -1.227783203125, -1.1365966796875, -1.04541015625, -0.9542236328125, -0.863037109375, -0.7718505859375, -0.6806640625, -0.5894775390625, -0.498291015625, -0.4071044921875, -0.31591796875, -0.2247314453125, -0.133544921875, -0.0423583984375, 0.048828125, 0.1400146484375, 0.231201171875, 0.3223876953125, 0.41357421875, 0.5047607421875, 0.595947265625, 0.6871337890625, 0.7783203125, 0.8695068359375, 0.960693359375, 1.0518798828125, 1.14306640625, 1.2342529296875, 1.325439453125, 1.4166259765625, 1.5078125, 1.5989990234375, 1.690185546875, 1.7813720703125, 1.87255859375, 1.9637451171875, 2.054931640625, 2.1461181640625, 2.2373046875, 2.3284912109375, 2.419677734375, 2.5108642578125, 2.60205078125, 2.6932373046875, 2.784423828125, 2.8756103515625, 2.966796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 20.0, 18.0, 32.0, 39.0, 58.0, 75.0, 135.0, 191.0, 275.0, 390.0, 577.0, 840.0, 1245.0, 1899.0, 2925.0, 4513.0, 6987.0, 10807.0, 17901.0, 28582.0, 47063.0, 81298.0, 163661.0, 344067.0, 144285.0, 74495.0, 43949.0, 26533.0, 16532.0, 10378.0, 6425.0, 4112.0, 2719.0, 1825.0, 1219.0, 794.0, 520.0, 345.0, 235.0, 203.0, 114.0, 70.0, 63.0, 43.0, 31.0, 17.0, 14.0, 12.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.76318359375, -0.7396469116210938, -0.7161102294921875, -0.6925735473632812, -0.669036865234375, -0.6455001831054688, -0.6219635009765625, -0.5984268188476562, -0.57489013671875, -0.5513534545898438, -0.5278167724609375, -0.5042800903320312, -0.480743408203125, -0.45720672607421875, -0.4336700439453125, -0.41013336181640625, -0.3865966796875, -0.36305999755859375, -0.3395233154296875, -0.31598663330078125, -0.292449951171875, -0.26891326904296875, -0.2453765869140625, -0.22183990478515625, -0.19830322265625, -0.17476654052734375, -0.1512298583984375, -0.12769317626953125, -0.104156494140625, -0.08061981201171875, -0.0570831298828125, -0.03354644775390625, -0.010009765625, 0.01352691650390625, 0.0370635986328125, 0.06060028076171875, 0.084136962890625, 0.10767364501953125, 0.1312103271484375, 0.15474700927734375, 0.17828369140625, 0.20182037353515625, 0.2253570556640625, 0.24889373779296875, 0.272430419921875, 0.29596710205078125, 0.3195037841796875, 0.34304046630859375, 0.3665771484375, 0.39011383056640625, 0.4136505126953125, 0.43718719482421875, 0.460723876953125, 0.48426055908203125, 0.5077972412109375, 0.5313339233398438, 0.55487060546875, 0.5784072875976562, 0.6019439697265625, 0.6254806518554688, 0.649017333984375, 0.6725540161132812, 0.6960906982421875, 0.7196273803710938, 0.7431640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 3.0, 5.0, 7.0, 6.0, 14.0, 2.0, 14.0, 20.0, 16.0, 21.0, 29.0, 39.0, 29.0, 40.0, 42.0, 37.0, 34.0, 39.0, 34.0, 39.0, 1077.0, 56.0, 38.0, 45.0, 51.0, 31.0, 41.0, 36.0, 25.0, 33.0, 23.0, 21.0, 23.0, 11.0, 7.0, 6.0, 6.0, 8.0, 5.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02734375, -1.960723876953125, -1.89410400390625, -1.827484130859375, -1.7608642578125, -1.694244384765625, -1.62762451171875, -1.561004638671875, -1.494384765625, -1.427764892578125, -1.36114501953125, -1.294525146484375, -1.2279052734375, -1.161285400390625, -1.09466552734375, -1.028045654296875, -0.96142578125, -0.894805908203125, -0.82818603515625, -0.761566162109375, -0.6949462890625, -0.628326416015625, -0.56170654296875, -0.495086669921875, -0.428466796875, -0.361846923828125, -0.29522705078125, -0.228607177734375, -0.1619873046875, -0.095367431640625, -0.02874755859375, 0.037872314453125, 0.1044921875, 0.171112060546875, 0.23773193359375, 0.304351806640625, 0.3709716796875, 0.437591552734375, 0.50421142578125, 0.570831298828125, 0.637451171875, 0.704071044921875, 0.77069091796875, 0.837310791015625, 0.9039306640625, 0.970550537109375, 1.03717041015625, 1.103790283203125, 1.17041015625, 1.237030029296875, 1.30364990234375, 1.370269775390625, 1.4368896484375, 1.503509521484375, 1.57012939453125, 1.636749267578125, 1.703369140625, 1.769989013671875, 1.83660888671875, 1.903228759765625, 1.9698486328125, 2.036468505859375, 2.10308837890625, 2.169708251953125, 2.236328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 10.0, 8.0, 4.0, 22.0, 25.0, 37.0, 54.0, 98.0, 117.0, 218.0, 291.0, 464.0, 825.0, 1270.0, 2038.0, 3510.0, 5856.0, 10155.0, 18235.0, 33634.0, 63618.0, 126817.0, 1425827.0, 206385.0, 92010.0, 47253.0, 24876.0, 13732.0, 7836.0, 4604.0, 2702.0, 1700.0, 1046.0, 659.0, 420.0, 248.0, 175.0, 140.0, 58.0, 59.0, 33.0, 22.0, 10.0, 15.0, 9.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9091796875, -0.8822555541992188, -0.8553314208984375, -0.8284072875976562, -0.801483154296875, -0.7745590209960938, -0.7476348876953125, -0.7207107543945312, -0.69378662109375, -0.6668624877929688, -0.6399383544921875, -0.6130142211914062, -0.586090087890625, -0.5591659545898438, -0.5322418212890625, -0.5053176879882812, -0.4783935546875, -0.45146942138671875, -0.4245452880859375, -0.39762115478515625, -0.370697021484375, -0.34377288818359375, -0.3168487548828125, -0.28992462158203125, -0.26300048828125, -0.23607635498046875, -0.2091522216796875, -0.18222808837890625, -0.155303955078125, -0.12837982177734375, -0.1014556884765625, -0.07453155517578125, -0.047607421875, -0.02068328857421875, 0.0062408447265625, 0.03316497802734375, 0.060089111328125, 0.08701324462890625, 0.1139373779296875, 0.14086151123046875, 0.16778564453125, 0.19470977783203125, 0.2216339111328125, 0.24855804443359375, 0.275482177734375, 0.30240631103515625, 0.3293304443359375, 0.35625457763671875, 0.3831787109375, 0.41010284423828125, 0.4370269775390625, 0.46395111083984375, 0.490875244140625, 0.5177993774414062, 0.5447235107421875, 0.5716476440429688, 0.59857177734375, 0.6254959106445312, 0.6524200439453125, 0.6793441772460938, 0.706268310546875, 0.7331924438476562, 0.7601165771484375, 0.7870407104492188, 0.81396484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 8.0, 7.0, 5.0, 3.0, 4.0, 11.0, 15.0, 19.0, 15.0, 33.0, 42.0, 56.0, 66.0, 114.0, 109.0, 110.0, 84.0, 70.0, 29.0, 34.0, 24.0, 26.0, 22.0, 21.0, 15.0, 15.0, 6.0, 9.0, 8.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007166862487792969, -0.0006976425647735596, -0.0006785988807678223, -0.000659555196762085, -0.0006405115127563477, -0.0006214678287506104, -0.000602424144744873, -0.0005833804607391357, -0.0005643367767333984, -0.0005452930927276611, -0.0005262494087219238, -0.0005072057247161865, -0.0004881620407104492, -0.0004691183567047119, -0.0004500746726989746, -0.0004310309886932373, -0.0004119873046875, -0.0003929436206817627, -0.0003738999366760254, -0.0003548562526702881, -0.0003358125686645508, -0.0003167688846588135, -0.00029772520065307617, -0.00027868151664733887, -0.00025963783264160156, -0.00024059414863586426, -0.00022155046463012695, -0.00020250678062438965, -0.00018346309661865234, -0.00016441941261291504, -0.00014537572860717773, -0.00012633204460144043, -0.00010728836059570312, -8.824467658996582e-05, -6.920099258422852e-05, -5.015730857849121e-05, -3.1113624572753906e-05, -1.2069940567016602e-05, 6.973743438720703e-06, 2.6017427444458008e-05, 4.506111145019531e-05, 6.410479545593262e-05, 8.314847946166992e-05, 0.00010219216346740723, 0.00012123584747314453, 0.00014027953147888184, 0.00015932321548461914, 0.00017836689949035645, 0.00019741058349609375, 0.00021645426750183105, 0.00023549795150756836, 0.00025454163551330566, 0.00027358531951904297, 0.0002926290035247803, 0.0003116726875305176, 0.0003307163715362549, 0.0003497600555419922, 0.0003688037395477295, 0.0003878474235534668, 0.0004068911075592041, 0.0004259347915649414, 0.0004449784755706787, 0.000464022159576416, 0.0004830658435821533, 0.0005021095275878906]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 8.0, 8.0, 8.0, 22.0, 18.0, 24.0, 27.0, 40.0, 52.0, 67.0, 97.0, 240.0, 577.0, 6759.0, 1035299.0, 4139.0, 529.0, 272.0, 132.0, 72.0, 45.0, 28.0, 20.0, 12.0, 7.0, 6.0, 9.0, 4.0, 3.0, 8.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0120849609375, -0.011660337448120117, -0.011235713958740234, -0.010811090469360352, -0.010386466979980469, -0.009961843490600586, -0.009537220001220703, -0.00911259651184082, -0.008687973022460938, -0.008263349533081055, -0.007838726043701172, -0.007414102554321289, -0.006989479064941406, -0.0065648555755615234, -0.006140232086181641, -0.005715608596801758, -0.005290985107421875, -0.004866361618041992, -0.004441738128662109, -0.0040171146392822266, -0.0035924911499023438, -0.003167867660522461, -0.002743244171142578, -0.0023186206817626953, -0.0018939971923828125, -0.0014693737030029297, -0.0010447502136230469, -0.0006201267242431641, -0.00019550323486328125, 0.00022912025451660156, 0.0006537437438964844, 0.0010783672332763672, 0.00150299072265625, 0.0019276142120361328, 0.0023522377014160156, 0.0027768611907958984, 0.0032014846801757812, 0.003626108169555664, 0.004050731658935547, 0.00447535514831543, 0.0048999786376953125, 0.005324602127075195, 0.005749225616455078, 0.006173849105834961, 0.006598472595214844, 0.0070230960845947266, 0.007447719573974609, 0.007872343063354492, 0.008296966552734375, 0.008721590042114258, 0.00914621353149414, 0.009570837020874023, 0.009995460510253906, 0.010420083999633789, 0.010844707489013672, 0.011269330978393555, 0.011693954467773438, 0.01211857795715332, 0.012543201446533203, 0.012967824935913086, 0.013392448425292969, 0.013817071914672852, 0.014241695404052734, 0.014666318893432617, 0.0150909423828125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 19.0, 111.0, 353.0, 390.0, 112.0, 27.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006598635809496045, -0.0006233363528735936, -0.0005868090665899217, -0.0005502818385139108, -0.0005137546104378998, -0.00047722735325805843, -0.00044070009607821703, -0.0004041728680022061, -0.0003676456108223647, -0.0003311183536425233, -0.00029459112556651235, -0.00025806386838667095, -0.00022153662575874478, -0.0001850093831308186, -0.0001484821259509772, -0.00011195489787496626, -7.542764069512486e-05, -3.890039442921989e-05, -2.3731481633149087e-06, 3.4154101740568876e-05, 7.068134436849505e-05, 0.00010720858699642122, 0.00014373584417626262, 0.00018026307225227356, 0.00021679032943211496, 0.00025331758661195636, 0.0002898448146879673, 0.0003263720718678087, 0.0003628993290476501, 0.00039942655712366104, 0.00043595381430350244, 0.0004724810423795134, 0.0005090082995593548, 0.0005455355276353657, 0.0005820628139190376, 0.0006185900419950485, 0.0006551172700710595, 0.0006916444981470704, 0.0007281717844307423, 0.0007646990125067532, 0.0008012262405827641, 0.0008377534686587751, 0.000874280754942447, 0.0009108079830184579, 0.0009473352110944688, 0.0009838624391704798, 0.0010203897254541516, 0.0010569170117378235, 0.0010934441816061735, 0.0011299714678898454, 0.0011664986377581954, 0.0012030259240418673, 0.0012395532103255391, 0.0012760803801938891, 0.001312607666477561, 0.001349134836345911, 0.0013856622390449047, 0.0014221895253285766, 0.0014587166951969266, 0.0014952439814805984, 0.0015317712677642703, 0.0015682984376326203, 0.0016048257239162922, 0.0016413528937846422, 0.001677880180068314]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 2.0, 8.0, 7.0, 10.0, 17.0, 11.0, 9.0, 13.0, 15.0, 22.0, 24.0, 31.0, 34.0, 24.0, 35.0, 30.0, 33.0, 28.0, 32.0, 31.0, 34.0, 26.0, 44.0, 33.0, 38.0, 41.0, 39.0, 27.0, 29.0, 23.0, 36.0, 24.0, 23.0, 27.0, 18.0, 12.0, 19.0, 14.0, 6.0, 8.0, 8.0, 11.0, 10.0, 4.0, 10.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002008676528930664, -0.00019372627139091492, -0.00018658488988876343, -0.00017944350838661194, -0.00017230212688446045, -0.00016516074538230896, -0.00015801936388015747, -0.00015087798237800598, -0.0001437366008758545, -0.000136595219373703, -0.00012945383787155151, -0.00012231245636940002, -0.00011517107486724854, -0.00010802969336509705, -0.00010088831186294556, -9.374693036079407e-05, -8.660554885864258e-05, -7.946416735649109e-05, -7.23227858543396e-05, -6.518140435218811e-05, -5.804002285003662e-05, -5.089864134788513e-05, -4.375725984573364e-05, -3.661587834358215e-05, -2.9474496841430664e-05, -2.2333115339279175e-05, -1.5191733837127686e-05, -8.050352334976196e-06, -9.08970832824707e-07, 6.232410669326782e-06, 1.3373792171478271e-05, 2.051517367362976e-05, 2.765655517578125e-05, 3.479793667793274e-05, 4.193931818008423e-05, 4.908069968223572e-05, 5.622208118438721e-05, 6.33634626865387e-05, 7.050484418869019e-05, 7.764622569084167e-05, 8.478760719299316e-05, 9.192898869514465e-05, 9.907037019729614e-05, 0.00010621175169944763, 0.00011335313320159912, 0.00012049451470375061, 0.0001276358962059021, 0.0001347772777080536, 0.00014191865921020508, 0.00014906004071235657, 0.00015620142221450806, 0.00016334280371665955, 0.00017048418521881104, 0.00017762556672096252, 0.00018476694822311401, 0.0001919083297252655, 0.000199049711227417, 0.00020619109272956848, 0.00021333247423171997, 0.00022047385573387146, 0.00022761523723602295, 0.00023475661873817444, 0.00024189800024032593, 0.0002490393817424774, 0.0002561807632446289]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 8.0, 5.0, 10.0, 11.0, 15.0, 21.0, 22.0, 16.0, 21.0, 32.0, 34.0, 26.0, 36.0, 34.0, 29.0, 33.0, 37.0, 36.0, 40.0, 45.0, 44.0, 37.0, 37.0, 32.0, 38.0, 33.0, 30.0, 25.0, 28.0, 21.0, 21.0, 15.0, 14.0, 23.0, 23.0, 9.0, 11.0, 11.0, 5.0, 8.0, 5.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.869140625, -2.7779541015625, -2.686767578125, -2.5955810546875, -2.50439453125, -2.4132080078125, -2.322021484375, -2.2308349609375, -2.1396484375, -2.0484619140625, -1.957275390625, -1.8660888671875, -1.77490234375, -1.6837158203125, -1.592529296875, -1.5013427734375, -1.41015625, -1.3189697265625, -1.227783203125, -1.1365966796875, -1.04541015625, -0.9542236328125, -0.863037109375, -0.7718505859375, -0.6806640625, -0.5894775390625, -0.498291015625, -0.4071044921875, -0.31591796875, -0.2247314453125, -0.133544921875, -0.0423583984375, 0.048828125, 0.1400146484375, 0.231201171875, 0.3223876953125, 0.41357421875, 0.5047607421875, 0.595947265625, 0.6871337890625, 0.7783203125, 0.8695068359375, 0.960693359375, 1.0518798828125, 1.14306640625, 1.2342529296875, 1.325439453125, 1.4166259765625, 1.5078125, 1.5989990234375, 1.690185546875, 1.7813720703125, 1.87255859375, 1.9637451171875, 2.054931640625, 2.1461181640625, 2.2373046875, 2.3284912109375, 2.419677734375, 2.5108642578125, 2.60205078125, 2.6932373046875, 2.784423828125, 2.8756103515625, 2.966796875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 6.0, 10.0, 28.0, 27.0, 45.0, 73.0, 122.0, 187.0, 305.0, 553.0, 989.0, 1892.0, 3595.0, 7094.0, 14642.0, 32520.0, 83745.0, 239450.0, 383511.0, 171083.0, 60620.0, 24667.0, 11464.0, 5538.0, 2790.0, 1511.0, 846.0, 462.0, 258.0, 182.0, 98.0, 64.0, 36.0, 32.0, 15.0, 16.0, 8.0, 12.0, 7.0, 11.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.224609375, -3.1217041015625, -3.018798828125, -2.9158935546875, -2.81298828125, -2.7100830078125, -2.607177734375, -2.5042724609375, -2.4013671875, -2.2984619140625, -2.195556640625, -2.0926513671875, -1.98974609375, -1.8868408203125, -1.783935546875, -1.6810302734375, -1.578125, -1.4752197265625, -1.372314453125, -1.2694091796875, -1.16650390625, -1.0635986328125, -0.960693359375, -0.8577880859375, -0.7548828125, -0.6519775390625, -0.549072265625, -0.4461669921875, -0.34326171875, -0.2403564453125, -0.137451171875, -0.0345458984375, 0.068359375, 0.1712646484375, 0.274169921875, 0.3770751953125, 0.47998046875, 0.5828857421875, 0.685791015625, 0.7886962890625, 0.8916015625, 0.9945068359375, 1.097412109375, 1.2003173828125, 1.30322265625, 1.4061279296875, 1.509033203125, 1.6119384765625, 1.71484375, 1.8177490234375, 1.920654296875, 2.0235595703125, 2.12646484375, 2.2293701171875, 2.332275390625, 2.4351806640625, 2.5380859375, 2.6409912109375, 2.743896484375, 2.8468017578125, 2.94970703125, 3.0526123046875, 3.155517578125, 3.2584228515625, 3.361328125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 7.0, 8.0, 16.0, 12.0, 23.0, 20.0, 29.0, 20.0, 36.0, 33.0, 35.0, 43.0, 58.0, 72.0, 111.0, 259.0, 1506.0, 206.0, 110.0, 61.0, 58.0, 39.0, 42.0, 38.0, 34.0, 40.0, 16.0, 24.0, 12.0, 19.0, 7.0, 13.0, 11.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.3828125, -12.0106201171875, -11.638427734375, -11.2662353515625, -10.89404296875, -10.5218505859375, -10.149658203125, -9.7774658203125, -9.4052734375, -9.0330810546875, -8.660888671875, -8.2886962890625, -7.91650390625, -7.5443115234375, -7.172119140625, -6.7999267578125, -6.427734375, -6.0555419921875, -5.683349609375, -5.3111572265625, -4.93896484375, -4.5667724609375, -4.194580078125, -3.8223876953125, -3.4501953125, -3.0780029296875, -2.705810546875, -2.3336181640625, -1.96142578125, -1.5892333984375, -1.217041015625, -0.8448486328125, -0.47265625, -0.1004638671875, 0.271728515625, 0.6439208984375, 1.01611328125, 1.3883056640625, 1.760498046875, 2.1326904296875, 2.5048828125, 2.8770751953125, 3.249267578125, 3.6214599609375, 3.99365234375, 4.3658447265625, 4.738037109375, 5.1102294921875, 5.482421875, 5.8546142578125, 6.226806640625, 6.5989990234375, 6.97119140625, 7.3433837890625, 7.715576171875, 8.0877685546875, 8.4599609375, 8.8321533203125, 9.204345703125, 9.5765380859375, 9.94873046875, 10.3209228515625, 10.693115234375, 11.0653076171875, 11.4375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 5.0, 15.0, 20.0, 26.0, 29.0, 53.0, 71.0, 124.0, 181.0, 291.0, 677.0, 4312.0, 2992285.0, 144846.0, 1681.0, 412.0, 236.0, 147.0, 75.0, 69.0, 37.0, 39.0, 17.0, 13.0, 8.0, 4.0, 5.0, 10.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.28125, -40.060546875, -38.83984375, -37.619140625, -36.3984375, -35.177734375, -33.95703125, -32.736328125, -31.515625, -30.294921875, -29.07421875, -27.853515625, -26.6328125, -25.412109375, -24.19140625, -22.970703125, -21.75, -20.529296875, -19.30859375, -18.087890625, -16.8671875, -15.646484375, -14.42578125, -13.205078125, -11.984375, -10.763671875, -9.54296875, -8.322265625, -7.1015625, -5.880859375, -4.66015625, -3.439453125, -2.21875, -0.998046875, 0.22265625, 1.443359375, 2.6640625, 3.884765625, 5.10546875, 6.326171875, 7.546875, 8.767578125, 9.98828125, 11.208984375, 12.4296875, 13.650390625, 14.87109375, 16.091796875, 17.3125, 18.533203125, 19.75390625, 20.974609375, 22.1953125, 23.416015625, 24.63671875, 25.857421875, 27.078125, 28.298828125, 29.51953125, 30.740234375, 31.9609375, 33.181640625, 34.40234375, 35.623046875, 36.84375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 1004.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.31707763671875, -92.31100463867188, -84.304931640625, -76.29886627197266, -68.29279327392578, -60.286720275878906, -52.2806510925293, -44.27458190917969, -36.26850891113281, -28.26243782043457, -20.256366729736328, -12.250295639038086, -4.244224548339844, 3.7618484497070312, 11.76791763305664, 19.77398681640625, 27.780059814453125, 35.7861328125, 43.79220199584961, 51.79827117919922, 59.804344177246094, 67.81041717529297, 75.81648254394531, 83.82255554199219, 91.82862854003906, 99.83470153808594, 107.84077453613281, 115.84683990478516, 123.85291290283203, 131.85897827148438, 139.86505126953125, 147.87112426757812, 155.87716674804688, 163.88323974609375, 171.88931274414062, 179.8953857421875, 187.90145874023438, 195.90753173828125, 203.91358947753906, 211.91966247558594, 219.9257354736328, 227.9318084716797, 235.93788146972656, 243.94395446777344, 251.95001220703125, 259.9560852050781, 267.962158203125, 275.9682312011719, 283.97430419921875, 291.9803771972656, 299.9864501953125, 307.9925231933594, 315.99859619140625, 324.0046691894531, 332.0107421875, 340.01678466796875, 348.02288818359375, 356.0289611816406, 364.0350341796875, 372.0411071777344, 380.04718017578125, 388.0532531738281, 396.059326171875, 404.06536865234375, 412.0714416503906]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 9.0, 8.0, 8.0, 10.0, 18.0, 15.0, 28.0, 20.0, 28.0, 23.0, 33.0, 15.0, 34.0, 34.0, 32.0, 43.0, 37.0, 52.0, 37.0, 48.0, 45.0, 40.0, 42.0, 40.0, 45.0, 31.0, 42.0, 32.0, 30.0, 16.0, 16.0, 15.0, 11.0, 11.0, 10.0, 8.0, 11.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.759153366088867, -22.88620376586914, -22.01325225830078, -21.140300750732422, -20.267351150512695, -19.39440155029297, -18.52145004272461, -17.64849853515625, -16.775548934936523, -15.90259838104248, -15.029647827148438, -14.156697273254395, -13.283746719360352, -12.410796165466309, -11.537845611572266, -10.664895057678223, -9.79194450378418, -8.918993949890137, -8.046043395996094, -7.173092842102051, -6.300142288208008, -5.427191734313965, -4.554241180419922, -3.681290626525879, -2.808340072631836, -1.935389518737793, -1.06243896484375, -0.18948841094970703, 0.6834621429443359, 1.556412696838379, 2.429363250732422, 3.302313804626465, 4.175266265869141, 5.048216819763184, 5.921167373657227, 6.7941179275512695, 7.6670684814453125, 8.540019035339355, 9.412969589233398, 10.285920143127441, 11.158870697021484, 12.031821250915527, 12.90477180480957, 13.777722358703613, 14.650672912597656, 15.5236234664917, 16.396574020385742, 17.26952362060547, 18.142475128173828, 19.015426635742188, 19.888376235961914, 20.76132583618164, 21.63427734375, 22.50722885131836, 23.380178451538086, 24.253128051757812, 25.126079559326172, 25.99903106689453, 26.871980667114258, 27.744930267333984, 28.617881774902344, 29.490833282470703, 30.36378288269043, 31.236732482910156, 32.109683990478516]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 7.0, 12.0, 14.0, 6.0, 20.0, 14.0, 26.0, 18.0, 29.0, 37.0, 23.0, 33.0, 41.0, 32.0, 27.0, 38.0, 38.0, 35.0, 44.0, 49.0, 36.0, 33.0, 38.0, 41.0, 30.0, 30.0, 30.0, 28.0, 20.0, 16.0, 16.0, 22.0, 19.0, 21.0, 13.0, 13.0, 3.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.09375, -2.9964599609375, -2.899169921875, -2.8018798828125, -2.70458984375, -2.6072998046875, -2.510009765625, -2.4127197265625, -2.3154296875, -2.2181396484375, -2.120849609375, -2.0235595703125, -1.92626953125, -1.8289794921875, -1.731689453125, -1.6343994140625, -1.537109375, -1.4398193359375, -1.342529296875, -1.2452392578125, -1.14794921875, -1.0506591796875, -0.953369140625, -0.8560791015625, -0.7587890625, -0.6614990234375, -0.564208984375, -0.4669189453125, -0.36962890625, -0.2723388671875, -0.175048828125, -0.0777587890625, 0.01953125, 0.1168212890625, 0.214111328125, 0.3114013671875, 0.40869140625, 0.5059814453125, 0.603271484375, 0.7005615234375, 0.7978515625, 0.8951416015625, 0.992431640625, 1.0897216796875, 1.18701171875, 1.2843017578125, 1.381591796875, 1.4788818359375, 1.576171875, 1.6734619140625, 1.770751953125, 1.8680419921875, 1.96533203125, 2.0626220703125, 2.159912109375, 2.2572021484375, 2.3544921875, 2.4517822265625, 2.549072265625, 2.6463623046875, 2.74365234375, 2.8409423828125, 2.938232421875, 3.0355224609375, 3.1328125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 9.0, 3.0, 17.0, 18.0, 17.0, 22.0, 23.0, 22.0, 37.0, 50.0, 59.0, 72.0, 81.0, 140.0, 154.0, 312.0, 1161.0, 19430.0, 1916710.0, 2229700.0, 23822.0, 1325.0, 355.0, 174.0, 110.0, 91.0, 68.0, 50.0, 41.0, 32.0, 37.0, 18.0, 21.0, 20.0, 15.0, 14.0, 11.0, 2.0, 7.0, 8.0, 5.0, 2.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.6171875, -15.1295166015625, -14.641845703125, -14.1541748046875, -13.66650390625, -13.1788330078125, -12.691162109375, -12.2034912109375, -11.7158203125, -11.2281494140625, -10.740478515625, -10.2528076171875, -9.76513671875, -9.2774658203125, -8.789794921875, -8.3021240234375, -7.814453125, -7.3267822265625, -6.839111328125, -6.3514404296875, -5.86376953125, -5.3760986328125, -4.888427734375, -4.4007568359375, -3.9130859375, -3.4254150390625, -2.937744140625, -2.4500732421875, -1.96240234375, -1.4747314453125, -0.987060546875, -0.4993896484375, -0.01171875, 0.4759521484375, 0.963623046875, 1.4512939453125, 1.93896484375, 2.4266357421875, 2.914306640625, 3.4019775390625, 3.8896484375, 4.3773193359375, 4.864990234375, 5.3526611328125, 5.84033203125, 6.3280029296875, 6.815673828125, 7.3033447265625, 7.791015625, 8.2786865234375, 8.766357421875, 9.2540283203125, 9.74169921875, 10.2293701171875, 10.717041015625, 11.2047119140625, 11.6923828125, 12.1800537109375, 12.667724609375, 13.1553955078125, 13.64306640625, 14.1307373046875, 14.618408203125, 15.1060791015625, 15.59375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 11.0, 13.0, 7.0, 21.0, 59.0, 66.0, 105.0, 181.0, 255.0, 386.0, 555.0, 616.0, 591.0, 422.0, 282.0, 176.0, 116.0, 80.0, 43.0, 36.0, 16.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.67010498046875, -14.3167724609375, -13.96343994140625, -13.610107421875, -13.25677490234375, -12.9034423828125, -12.55010986328125, -12.19677734375, -11.84344482421875, -11.4901123046875, -11.13677978515625, -10.783447265625, -10.43011474609375, -10.0767822265625, -9.72344970703125, -9.3701171875, -9.01678466796875, -8.6634521484375, -8.31011962890625, -7.956787109375, -7.60345458984375, -7.2501220703125, -6.89678955078125, -6.54345703125, -6.19012451171875, -5.8367919921875, -5.48345947265625, -5.130126953125, -4.77679443359375, -4.4234619140625, -4.07012939453125, -3.716796875, -3.36346435546875, -3.0101318359375, -2.65679931640625, -2.303466796875, -1.95013427734375, -1.5968017578125, -1.24346923828125, -0.89013671875, -0.53680419921875, -0.1834716796875, 0.16986083984375, 0.523193359375, 0.87652587890625, 1.2298583984375, 1.58319091796875, 1.9365234375, 2.28985595703125, 2.6431884765625, 2.99652099609375, 3.349853515625, 3.70318603515625, 4.0565185546875, 4.40985107421875, 4.76318359375, 5.11651611328125, 5.4698486328125, 5.82318115234375, 6.176513671875, 6.52984619140625, 6.8831787109375, 7.23651123046875, 7.58984375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 16.0, 29.0, 32.0, 42.0, 72.0, 105.0, 169.0, 256.0, 403.0, 872.0, 4598.0, 976240.0, 3199167.0, 10087.0, 1000.0, 419.0, 267.0, 162.0, 110.0, 80.0, 45.0, 35.0, 23.0, 16.0, 12.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.578125, -22.511962890625, -21.44580078125, -20.379638671875, -19.3134765625, -18.247314453125, -17.18115234375, -16.114990234375, -15.048828125, -13.982666015625, -12.91650390625, -11.850341796875, -10.7841796875, -9.718017578125, -8.65185546875, -7.585693359375, -6.51953125, -5.453369140625, -4.38720703125, -3.321044921875, -2.2548828125, -1.188720703125, -0.12255859375, 0.943603515625, 2.009765625, 3.075927734375, 4.14208984375, 5.208251953125, 6.2744140625, 7.340576171875, 8.40673828125, 9.472900390625, 10.5390625, 11.605224609375, 12.67138671875, 13.737548828125, 14.8037109375, 15.869873046875, 16.93603515625, 18.002197265625, 19.068359375, 20.134521484375, 21.20068359375, 22.266845703125, 23.3330078125, 24.399169921875, 25.46533203125, 26.531494140625, 27.59765625, 28.663818359375, 29.72998046875, 30.796142578125, 31.8623046875, 32.928466796875, 33.99462890625, 35.060791015625, 36.126953125, 37.193115234375, 38.25927734375, 39.325439453125, 40.3916015625, 41.457763671875, 42.52392578125, 43.590087890625, 44.65625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 21.0, 52.0, 102.0, 144.0, 161.0, 171.0, 147.0, 103.0, 54.0, 23.0, 12.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.486167907714844, -43.67652893066406, -41.86688995361328, -40.057247161865234, -38.24760818481445, -36.43796920776367, -34.628326416015625, -32.818687438964844, -31.009048461914062, -29.19940948486328, -27.389768600463867, -25.580127716064453, -23.770488739013672, -21.96084976196289, -20.151208877563477, -18.341567993164062, -16.53192901611328, -14.722289085388184, -12.912649154663086, -11.103009223937988, -9.29336929321289, -7.483729362487793, -5.674089431762695, -3.8644495010375977, -2.0548095703125, -0.24516963958740234, 1.5644702911376953, 3.374110221862793, 5.183750152587891, 6.993390083312988, 8.803030014038086, 10.612669944763184, 12.422309875488281, 14.231949806213379, 16.041589736938477, 17.85123062133789, 19.660869598388672, 21.470508575439453, 23.280149459838867, 25.08979034423828, 26.899429321289062, 28.709068298339844, 30.518709182739258, 32.32835006713867, 34.13798904418945, 35.947628021240234, 37.75727081298828, 39.56690979003906, 41.376548767089844, 43.186187744140625, 44.995826721191406, 46.80546951293945, 48.615108489990234, 50.424747467041016, 52.23439025878906, 54.044029235839844, 55.853668212890625, 57.663307189941406, 59.47294616699219, 61.282588958740234, 63.092227935791016, 64.90187072753906, 66.71150970458984, 68.52114868164062, 70.3307876586914]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 10.0, 16.0, 11.0, 20.0, 22.0, 16.0, 18.0, 20.0, 26.0, 33.0, 19.0, 28.0, 26.0, 43.0, 38.0, 45.0, 46.0, 35.0, 36.0, 47.0, 39.0, 31.0, 38.0, 38.0, 27.0, 38.0, 28.0, 25.0, 35.0, 25.0, 13.0, 18.0, 10.0, 14.0, 8.0, 15.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.277694702148438, -25.503896713256836, -24.730098724365234, -23.956302642822266, -23.182504653930664, -22.408706665039062, -21.634910583496094, -20.861112594604492, -20.08731460571289, -19.31351661682129, -18.539718627929688, -17.76592254638672, -16.992124557495117, -16.218326568603516, -15.44452953338623, -14.670732498168945, -13.896934509277344, -13.123136520385742, -12.349339485168457, -11.575542449951172, -10.80174446105957, -10.027946472167969, -9.254149436950684, -8.480352401733398, -7.706554412841797, -6.9327569007873535, -6.15895938873291, -5.385161876678467, -4.611364364624023, -3.83756685256958, -3.0637693405151367, -2.2899718284606934, -1.51617431640625, -0.7423768043518066, 0.03142070770263672, 0.8052182197570801, 1.5790157318115234, 2.352813243865967, 3.12661075592041, 3.9004082679748535, 4.674205780029297, 5.44800329208374, 6.221800804138184, 6.995598316192627, 7.76939582824707, 8.543193817138672, 9.316990852355957, 10.090787887573242, 10.864585876464844, 11.638383865356445, 12.41218090057373, 13.185977935791016, 13.959775924682617, 14.733573913574219, 15.507370948791504, 16.28116798400879, 17.05496597290039, 17.828763961791992, 18.602561950683594, 19.376358032226562, 20.150156021118164, 20.923954010009766, 21.697750091552734, 22.471548080444336, 23.245346069335938]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 10.0, 7.0, 20.0, 11.0, 24.0, 31.0, 29.0, 25.0, 33.0, 38.0, 25.0, 32.0, 31.0, 30.0, 40.0, 41.0, 49.0, 39.0, 45.0, 59.0, 31.0, 36.0, 33.0, 24.0, 31.0, 17.0, 24.0, 22.0, 21.0, 22.0, 17.0, 16.0, 10.0, 12.0, 6.0, 7.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.259765625, -3.160186767578125, -3.06060791015625, -2.961029052734375, -2.8614501953125, -2.761871337890625, -2.66229248046875, -2.562713623046875, -2.463134765625, -2.363555908203125, -2.26397705078125, -2.164398193359375, -2.0648193359375, -1.965240478515625, -1.86566162109375, -1.766082763671875, -1.66650390625, -1.566925048828125, -1.46734619140625, -1.367767333984375, -1.2681884765625, -1.168609619140625, -1.06903076171875, -0.969451904296875, -0.869873046875, -0.770294189453125, -0.67071533203125, -0.571136474609375, -0.4715576171875, -0.371978759765625, -0.27239990234375, -0.172821044921875, -0.0732421875, 0.026336669921875, 0.12591552734375, 0.225494384765625, 0.3250732421875, 0.424652099609375, 0.52423095703125, 0.623809814453125, 0.723388671875, 0.822967529296875, 0.92254638671875, 1.022125244140625, 1.1217041015625, 1.221282958984375, 1.32086181640625, 1.420440673828125, 1.52001953125, 1.619598388671875, 1.71917724609375, 1.818756103515625, 1.9183349609375, 2.017913818359375, 2.11749267578125, 2.217071533203125, 2.316650390625, 2.416229248046875, 2.51580810546875, 2.615386962890625, 2.7149658203125, 2.814544677734375, 2.91412353515625, 3.013702392578125, 3.11328125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 10.0, 19.0, 25.0, 38.0, 54.0, 83.0, 121.0, 155.0, 256.0, 383.0, 551.0, 865.0, 1244.0, 1921.0, 2891.0, 4335.0, 6737.0, 10548.0, 16153.0, 25280.0, 40024.0, 64173.0, 110888.0, 300590.0, 210070.0, 95574.0, 56599.0, 35001.0, 22477.0, 14367.0, 9194.0, 6018.0, 3994.0, 2618.0, 1746.0, 1150.0, 822.0, 515.0, 309.0, 231.0, 180.0, 121.0, 64.0, 56.0, 34.0, 22.0, 13.0, 13.0, 11.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.72216796875, -0.6995086669921875, -0.676849365234375, -0.6541900634765625, -0.63153076171875, -0.6088714599609375, -0.586212158203125, -0.5635528564453125, -0.5408935546875, -0.5182342529296875, -0.495574951171875, -0.4729156494140625, -0.45025634765625, -0.4275970458984375, -0.404937744140625, -0.3822784423828125, -0.359619140625, -0.3369598388671875, -0.314300537109375, -0.2916412353515625, -0.26898193359375, -0.2463226318359375, -0.223663330078125, -0.2010040283203125, -0.1783447265625, -0.1556854248046875, -0.133026123046875, -0.1103668212890625, -0.08770751953125, -0.0650482177734375, -0.042388916015625, -0.0197296142578125, 0.0029296875, 0.0255889892578125, 0.048248291015625, 0.0709075927734375, 0.09356689453125, 0.1162261962890625, 0.138885498046875, 0.1615447998046875, 0.1842041015625, 0.2068634033203125, 0.229522705078125, 0.2521820068359375, 0.27484130859375, 0.2975006103515625, 0.320159912109375, 0.3428192138671875, 0.365478515625, 0.3881378173828125, 0.410797119140625, 0.4334564208984375, 0.45611572265625, 0.4787750244140625, 0.501434326171875, 0.5240936279296875, 0.5467529296875, 0.5694122314453125, 0.592071533203125, 0.6147308349609375, 0.63739013671875, 0.6600494384765625, 0.682708740234375, 0.7053680419921875, 0.72802734375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 4.0, 6.0, 3.0, 13.0, 10.0, 19.0, 17.0, 13.0, 11.0, 20.0, 29.0, 27.0, 29.0, 34.0, 27.0, 46.0, 43.0, 36.0, 42.0, 36.0, 1069.0, 48.0, 33.0, 39.0, 42.0, 36.0, 35.0, 30.0, 37.0, 20.0, 21.0, 18.0, 19.0, 18.0, 19.0, 16.0, 11.0, 10.0, 7.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.125, -2.05877685546875, -1.9925537109375, -1.92633056640625, -1.860107421875, -1.79388427734375, -1.7276611328125, -1.66143798828125, -1.59521484375, -1.52899169921875, -1.4627685546875, -1.39654541015625, -1.330322265625, -1.26409912109375, -1.1978759765625, -1.13165283203125, -1.0654296875, -0.99920654296875, -0.9329833984375, -0.86676025390625, -0.800537109375, -0.73431396484375, -0.6680908203125, -0.60186767578125, -0.53564453125, -0.46942138671875, -0.4031982421875, -0.33697509765625, -0.270751953125, -0.20452880859375, -0.1383056640625, -0.07208251953125, -0.005859375, 0.06036376953125, 0.1265869140625, 0.19281005859375, 0.259033203125, 0.32525634765625, 0.3914794921875, 0.45770263671875, 0.52392578125, 0.59014892578125, 0.6563720703125, 0.72259521484375, 0.788818359375, 0.85504150390625, 0.9212646484375, 0.98748779296875, 1.0537109375, 1.11993408203125, 1.1861572265625, 1.25238037109375, 1.318603515625, 1.38482666015625, 1.4510498046875, 1.51727294921875, 1.58349609375, 1.64971923828125, 1.7159423828125, 1.78216552734375, 1.848388671875, 1.91461181640625, 1.9808349609375, 2.04705810546875, 2.11328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 12.0, 16.0, 23.0, 33.0, 40.0, 67.0, 115.0, 156.0, 259.0, 377.0, 600.0, 907.0, 1465.0, 2262.0, 3724.0, 6058.0, 9856.0, 16957.0, 28891.0, 51405.0, 96331.0, 230170.0, 1385948.0, 117494.0, 60559.0, 33564.0, 19676.0, 11589.0, 7218.0, 4342.0, 2606.0, 1655.0, 1010.0, 617.0, 388.0, 245.0, 161.0, 125.0, 70.0, 42.0, 39.0, 18.0, 11.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8798828125, -0.852508544921875, -0.82513427734375, -0.797760009765625, -0.7703857421875, -0.743011474609375, -0.71563720703125, -0.688262939453125, -0.660888671875, -0.633514404296875, -0.60614013671875, -0.578765869140625, -0.5513916015625, -0.524017333984375, -0.49664306640625, -0.469268798828125, -0.44189453125, -0.414520263671875, -0.38714599609375, -0.359771728515625, -0.3323974609375, -0.305023193359375, -0.27764892578125, -0.250274658203125, -0.222900390625, -0.195526123046875, -0.16815185546875, -0.140777587890625, -0.1134033203125, -0.086029052734375, -0.05865478515625, -0.031280517578125, -0.00390625, 0.023468017578125, 0.05084228515625, 0.078216552734375, 0.1055908203125, 0.132965087890625, 0.16033935546875, 0.187713623046875, 0.215087890625, 0.242462158203125, 0.26983642578125, 0.297210693359375, 0.3245849609375, 0.351959228515625, 0.37933349609375, 0.406707763671875, 0.43408203125, 0.461456298828125, 0.48883056640625, 0.516204833984375, 0.5435791015625, 0.570953369140625, 0.59832763671875, 0.625701904296875, 0.653076171875, 0.680450439453125, 0.70782470703125, 0.735198974609375, 0.7625732421875, 0.789947509765625, 0.81732177734375, 0.844696044921875, 0.8720703125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 6.0, 11.0, 22.0, 13.0, 19.0, 24.0, 34.0, 49.0, 76.0, 105.0, 123.0, 124.0, 99.0, 60.0, 53.0, 26.0, 21.0, 13.0, 14.0, 10.0, 8.0, 10.0, 4.0, 7.0, 7.0, 4.0, 2.0, 3.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007624626159667969, -0.0007386058568954468, -0.0007147490978240967, -0.0006908923387527466, -0.0006670355796813965, -0.0006431788206100464, -0.0006193220615386963, -0.0005954653024673462, -0.0005716085433959961, -0.000547751784324646, -0.0005238950252532959, -0.0005000382661819458, -0.0004761815071105957, -0.0004523247480392456, -0.0004284679889678955, -0.0004046112298965454, -0.0003807544708251953, -0.0003568977117538452, -0.0003330409526824951, -0.000309184193611145, -0.0002853274345397949, -0.0002614706754684448, -0.00023761391639709473, -0.00021375715732574463, -0.00018990039825439453, -0.00016604363918304443, -0.00014218688011169434, -0.00011833012104034424, -9.447336196899414e-05, -7.061660289764404e-05, -4.6759843826293945e-05, -2.2903084754943848e-05, 9.5367431640625e-07, 2.4810433387756348e-05, 4.8667192459106445e-05, 7.252395153045654e-05, 9.638071060180664e-05, 0.00012023746967315674, 0.00014409422874450684, 0.00016795098781585693, 0.00019180774688720703, 0.00021566450595855713, 0.00023952126502990723, 0.0002633780241012573, 0.0002872347831726074, 0.0003110915422439575, 0.0003349483013153076, 0.0003588050603866577, 0.0003826618194580078, 0.0004065185785293579, 0.000430375337600708, 0.0004542320966720581, 0.0004780888557434082, 0.0005019456148147583, 0.0005258023738861084, 0.0005496591329574585, 0.0005735158920288086, 0.0005973726511001587, 0.0006212294101715088, 0.0006450861692428589, 0.000668942928314209, 0.0006927996873855591, 0.0007166564464569092, 0.0007405132055282593, 0.0007643699645996094]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 1.0, 2.0, 4.0, 10.0, 11.0, 6.0, 7.0, 28.0, 14.0, 31.0, 39.0, 50.0, 89.0, 168.0, 311.0, 757.0, 42285.0, 1001775.0, 1915.0, 395.0, 235.0, 132.0, 74.0, 52.0, 40.0, 24.0, 25.0, 15.0, 7.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0153045654296875, -0.014814615249633789, -0.014324665069580078, -0.013834714889526367, -0.013344764709472656, -0.012854814529418945, -0.012364864349365234, -0.011874914169311523, -0.011384963989257812, -0.010895013809204102, -0.01040506362915039, -0.00991511344909668, -0.009425163269042969, -0.008935213088989258, -0.008445262908935547, -0.007955312728881836, -0.007465362548828125, -0.006975412368774414, -0.006485462188720703, -0.005995512008666992, -0.005505561828613281, -0.00501561164855957, -0.004525661468505859, -0.0040357112884521484, -0.0035457611083984375, -0.0030558109283447266, -0.0025658607482910156, -0.0020759105682373047, -0.0015859603881835938, -0.0010960102081298828, -0.0006060600280761719, -0.00011610984802246094, 0.00037384033203125, 0.0008637905120849609, 0.0013537406921386719, 0.0018436908721923828, 0.0023336410522460938, 0.0028235912322998047, 0.0033135414123535156, 0.0038034915924072266, 0.0042934417724609375, 0.0047833919525146484, 0.005273342132568359, 0.00576329231262207, 0.006253242492675781, 0.006743192672729492, 0.007233142852783203, 0.007723093032836914, 0.008213043212890625, 0.008702993392944336, 0.009192943572998047, 0.009682893753051758, 0.010172843933105469, 0.01066279411315918, 0.01115274429321289, 0.011642694473266602, 0.012132644653320312, 0.012622594833374023, 0.013112545013427734, 0.013602495193481445, 0.014092445373535156, 0.014582395553588867, 0.015072345733642578, 0.015562295913696289, 0.01605224609375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 80.0, 432.0, 405.0, 82.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002764529548585415, -0.002709224121645093, -0.002653918694704771, -0.0025986130349338055, -0.0025433076079934835, -0.0024880021810531616, -0.0024326967541128397, -0.002377391094341874, -0.002322085667401552, -0.0022667802404612303, -0.0022114748135209084, -0.0021561691537499428, -0.002100863726809621, -0.002045558299869299, -0.001990252872928977, -0.0019349473295733333, -0.0018796417862176895, -0.0018243363592773676, -0.0017690308159217238, -0.001713725388981402, -0.0016584198456257582, -0.0016031144186854362, -0.0015478088753297925, -0.0014925034483894706, -0.0014371980214491487, -0.0013818925945088267, -0.001326587051153183, -0.001271281624212861, -0.0012159760808572173, -0.0011606706539168954, -0.0011053651105612516, -0.0010500596836209297, -0.0009947542566806078, -0.000939448771532625, -0.0008841432863846421, -0.0008288378012366593, -0.0007735323160886765, -0.0007182268891483545, -0.0006629213457927108, -0.0006076159188523889, -0.0005523103754967451, -0.0004970048903487623, -0.00044169940520077944, -0.0003863939200527966, -0.00033108843490481377, -0.0002757829788606614, -0.00022047749371267855, -0.00016517200856469572, -0.00010986649431288242, -5.4561012802878395e-05, 7.44468707125634e-07, 5.6049946579150856e-05, 0.00011135543172713369, 0.0001666609023232013, 0.00022196638747118413, 0.00027727187261916697, 0.0003325773577671498, 0.00038788284291513264, 0.0004431883280631155, 0.0004984937841072679, 0.0005537992692552507, 0.0006091047544032335, 0.0006644102395512164, 0.0007197157246991992, 0.000775021209847182]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 7.0, 8.0, 8.0, 10.0, 17.0, 17.0, 15.0, 15.0, 20.0, 23.0, 21.0, 34.0, 37.0, 43.0, 35.0, 27.0, 43.0, 43.0, 36.0, 41.0, 30.0, 30.0, 28.0, 39.0, 34.0, 41.0, 28.0, 39.0, 27.0, 18.0, 30.0, 27.0, 19.0, 11.0, 11.0, 12.0, 8.0, 7.0, 9.0, 7.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.0003108978271484375, -0.000300760380923748, -0.00029062293469905853, -0.00028048548847436905, -0.00027034804224967957, -0.0002602105960249901, -0.0002500731498003006, -0.00023993570357561111, -0.00022979825735092163, -0.00021966081112623215, -0.00020952336490154266, -0.00019938591867685318, -0.0001892484724521637, -0.0001791110262274742, -0.00016897358000278473, -0.00015883613377809525, -0.00014869868755340576, -0.00013856124132871628, -0.0001284237951040268, -0.00011828634887933731, -0.00010814890265464783, -9.801145642995834e-05, -8.787401020526886e-05, -7.773656398057938e-05, -6.759911775588989e-05, -5.746167153120041e-05, -4.7324225306510925e-05, -3.718677908182144e-05, -2.7049332857131958e-05, -1.6911886632442474e-05, -6.774440407752991e-06, 3.363005816936493e-06, 1.3500452041625977e-05, 2.363789826631546e-05, 3.3775344491004944e-05, 4.391279071569443e-05, 5.405023694038391e-05, 6.41876831650734e-05, 7.432512938976288e-05, 8.446257561445236e-05, 9.460002183914185e-05, 0.00010473746806383133, 0.00011487491428852081, 0.0001250123605132103, 0.00013514980673789978, 0.00014528725296258926, 0.00015542469918727875, 0.00016556214541196823, 0.00017569959163665771, 0.0001858370378613472, 0.00019597448408603668, 0.00020611193031072617, 0.00021624937653541565, 0.00022638682276010513, 0.00023652426898479462, 0.0002466617152094841, 0.0002567991614341736, 0.00026693660765886307, 0.00027707405388355255, 0.00028721150010824203, 0.0002973489463329315, 0.000307486392557621, 0.0003176238387823105, 0.00032776128500699997, 0.00033789873123168945]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 10.0, 7.0, 20.0, 11.0, 24.0, 31.0, 29.0, 25.0, 33.0, 38.0, 25.0, 32.0, 31.0, 30.0, 40.0, 41.0, 49.0, 39.0, 45.0, 59.0, 31.0, 36.0, 33.0, 24.0, 31.0, 17.0, 24.0, 22.0, 21.0, 22.0, 17.0, 16.0, 10.0, 12.0, 6.0, 7.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.259765625, -3.160186767578125, -3.06060791015625, -2.961029052734375, -2.8614501953125, -2.761871337890625, -2.66229248046875, -2.562713623046875, -2.463134765625, -2.363555908203125, -2.26397705078125, -2.164398193359375, -2.0648193359375, -1.965240478515625, -1.86566162109375, -1.766082763671875, -1.66650390625, -1.566925048828125, -1.46734619140625, -1.367767333984375, -1.2681884765625, -1.168609619140625, -1.06903076171875, -0.969451904296875, -0.869873046875, -0.770294189453125, -0.67071533203125, -0.571136474609375, -0.4715576171875, -0.371978759765625, -0.27239990234375, -0.172821044921875, -0.0732421875, 0.026336669921875, 0.12591552734375, 0.225494384765625, 0.3250732421875, 0.424652099609375, 0.52423095703125, 0.623809814453125, 0.723388671875, 0.822967529296875, 0.92254638671875, 1.022125244140625, 1.1217041015625, 1.221282958984375, 1.32086181640625, 1.420440673828125, 1.52001953125, 1.619598388671875, 1.71917724609375, 1.818756103515625, 1.9183349609375, 2.017913818359375, 2.11749267578125, 2.217071533203125, 2.316650390625, 2.416229248046875, 2.51580810546875, 2.615386962890625, 2.7149658203125, 2.814544677734375, 2.91412353515625, 3.013702392578125, 3.11328125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 8.0, 14.0, 16.0, 23.0, 35.0, 30.0, 55.0, 76.0, 115.0, 174.0, 310.0, 503.0, 873.0, 1482.0, 2619.0, 4645.0, 8413.0, 15156.0, 27127.0, 49520.0, 95872.0, 208725.0, 309103.0, 157274.0, 75221.0, 40423.0, 22120.0, 12516.0, 6920.0, 3918.0, 2195.0, 1204.0, 713.0, 403.0, 287.0, 151.0, 97.0, 70.0, 58.0, 28.0, 12.0, 11.0, 14.0, 5.0, 6.0, 4.0, 0.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.5, -2.42266845703125, -2.3453369140625, -2.26800537109375, -2.190673828125, -2.11334228515625, -2.0360107421875, -1.95867919921875, -1.88134765625, -1.80401611328125, -1.7266845703125, -1.64935302734375, -1.572021484375, -1.49468994140625, -1.4173583984375, -1.34002685546875, -1.2626953125, -1.18536376953125, -1.1080322265625, -1.03070068359375, -0.953369140625, -0.87603759765625, -0.7987060546875, -0.72137451171875, -0.64404296875, -0.56671142578125, -0.4893798828125, -0.41204833984375, -0.334716796875, -0.25738525390625, -0.1800537109375, -0.10272216796875, -0.025390625, 0.05194091796875, 0.1292724609375, 0.20660400390625, 0.283935546875, 0.36126708984375, 0.4385986328125, 0.51593017578125, 0.59326171875, 0.67059326171875, 0.7479248046875, 0.82525634765625, 0.902587890625, 0.97991943359375, 1.0572509765625, 1.13458251953125, 1.2119140625, 1.28924560546875, 1.3665771484375, 1.44390869140625, 1.521240234375, 1.59857177734375, 1.6759033203125, 1.75323486328125, 1.83056640625, 1.90789794921875, 1.9852294921875, 2.06256103515625, 2.139892578125, 2.21722412109375, 2.2945556640625, 2.37188720703125, 2.44921875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 7.0, 8.0, 6.0, 9.0, 13.0, 13.0, 15.0, 14.0, 20.0, 29.0, 28.0, 29.0, 40.0, 37.0, 36.0, 41.0, 51.0, 76.0, 144.0, 1461.0, 358.0, 123.0, 65.0, 55.0, 44.0, 35.0, 39.0, 39.0, 24.0, 19.0, 16.0, 20.0, 25.0, 21.0, 16.0, 12.0, 15.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5390625, -11.1883544921875, -10.837646484375, -10.4869384765625, -10.13623046875, -9.7855224609375, -9.434814453125, -9.0841064453125, -8.7333984375, -8.3826904296875, -8.031982421875, -7.6812744140625, -7.33056640625, -6.9798583984375, -6.629150390625, -6.2784423828125, -5.927734375, -5.5770263671875, -5.226318359375, -4.8756103515625, -4.52490234375, -4.1741943359375, -3.823486328125, -3.4727783203125, -3.1220703125, -2.7713623046875, -2.420654296875, -2.0699462890625, -1.71923828125, -1.3685302734375, -1.017822265625, -0.6671142578125, -0.31640625, 0.0343017578125, 0.385009765625, 0.7357177734375, 1.08642578125, 1.4371337890625, 1.787841796875, 2.1385498046875, 2.4892578125, 2.8399658203125, 3.190673828125, 3.5413818359375, 3.89208984375, 4.2427978515625, 4.593505859375, 4.9442138671875, 5.294921875, 5.6456298828125, 5.996337890625, 6.3470458984375, 6.69775390625, 7.0484619140625, 7.399169921875, 7.7498779296875, 8.1005859375, 8.4512939453125, 8.802001953125, 9.1527099609375, 9.50341796875, 9.8541259765625, 10.204833984375, 10.5555419921875, 10.90625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 6.0, 4.0, 4.0, 4.0, 8.0, 15.0, 14.0, 17.0, 23.0, 30.0, 67.0, 97.0, 131.0, 273.0, 707.0, 9884.0, 3126108.0, 6962.0, 632.0, 273.0, 146.0, 94.0, 63.0, 42.0, 31.0, 22.0, 16.0, 5.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-65.3125, -63.5693359375, -61.826171875, -60.0830078125, -58.33984375, -56.5966796875, -54.853515625, -53.1103515625, -51.3671875, -49.6240234375, -47.880859375, -46.1376953125, -44.39453125, -42.6513671875, -40.908203125, -39.1650390625, -37.421875, -35.6787109375, -33.935546875, -32.1923828125, -30.44921875, -28.7060546875, -26.962890625, -25.2197265625, -23.4765625, -21.7333984375, -19.990234375, -18.2470703125, -16.50390625, -14.7607421875, -13.017578125, -11.2744140625, -9.53125, -7.7880859375, -6.044921875, -4.3017578125, -2.55859375, -0.8154296875, 0.927734375, 2.6708984375, 4.4140625, 6.1572265625, 7.900390625, 9.6435546875, 11.38671875, 13.1298828125, 14.873046875, 16.6162109375, 18.359375, 20.1025390625, 21.845703125, 23.5888671875, 25.33203125, 27.0751953125, 28.818359375, 30.5615234375, 32.3046875, 34.0478515625, 35.791015625, 37.5341796875, 39.27734375, 41.0205078125, 42.763671875, 44.5068359375, 46.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 74.0, 937.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.73299026489258, -25.17411231994629, -17.615234375, -10.056354522705078, -2.497476577758789, 5.0614013671875, 12.620281219482422, 20.179157257080078, 27.738037109375, 35.29691696166992, 42.85579299926758, 50.4146728515625, 57.973548889160156, 65.53242492675781, 73.09130859375, 80.65018463134766, 88.20906066894531, 95.76793670654297, 103.32682037353516, 110.88569641113281, 118.44457244873047, 126.00344848632812, 133.5623321533203, 141.1212158203125, 148.68008422851562, 156.2389678955078, 163.79783630371094, 171.35671997070312, 178.9156036376953, 186.47447204589844, 194.03335571289062, 201.59222412109375, 209.15110778808594, 216.70999145507812, 224.26885986328125, 231.82774353027344, 239.38662719726562, 246.94549560546875, 254.50437927246094, 262.0632629394531, 269.62213134765625, 277.1809997558594, 284.7398986816406, 292.29876708984375, 299.8576354980469, 307.4165344238281, 314.97540283203125, 322.5342712402344, 330.0931701660156, 337.65203857421875, 345.2109375, 352.7698059082031, 360.32867431640625, 367.8875732421875, 375.4464416503906, 383.00531005859375, 390.5641784667969, 398.123046875, 405.68194580078125, 413.2408142089844, 420.7996826171875, 428.35858154296875, 435.9174499511719, 443.476318359375, 451.03521728515625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 7.0, 8.0, 10.0, 9.0, 19.0, 23.0, 26.0, 33.0, 23.0, 30.0, 37.0, 31.0, 36.0, 42.0, 49.0, 51.0, 45.0, 39.0, 38.0, 48.0, 52.0, 32.0, 32.0, 30.0, 33.0, 34.0, 26.0, 13.0, 29.0, 13.0, 15.0, 14.0, 9.0, 11.0, 12.0, 8.0, 10.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.23344421386719, -35.129539489746094, -34.025634765625, -32.921730041503906, -31.81782341003418, -30.713916778564453, -29.61001205444336, -28.506107330322266, -27.402202606201172, -26.298297882080078, -25.19439125061035, -24.090486526489258, -22.986581802368164, -21.882675170898438, -20.778770446777344, -19.67486572265625, -18.570959091186523, -17.46705436706543, -16.363147735595703, -15.25924301147461, -14.155338287353516, -13.051432609558105, -11.947526931762695, -10.843622207641602, -9.739716529846191, -8.635810852050781, -7.5319061279296875, -6.428000450134277, -5.324095249176025, -4.220190048217773, -3.1162843704223633, -2.0123791694641113, -0.9084739685058594, 0.19543135166168213, 1.2993366718292236, 2.4032421112060547, 3.5071473121643066, 4.611052513122559, 5.714958190917969, 6.818863391876221, 7.922768592834473, 9.026674270629883, 10.130578994750977, 11.234484672546387, 12.338390350341797, 13.44229507446289, 14.5462007522583, 15.650106430053711, 16.754011154174805, 17.8579158782959, 18.961822509765625, 20.06572723388672, 21.169631958007812, 22.273536682128906, 23.377443313598633, 24.481348037719727, 25.585254669189453, 26.689159393310547, 27.793066024780273, 28.896970748901367, 30.00087547302246, 31.104782104492188, 32.20868682861328, 33.312591552734375, 34.41649627685547]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 5.0, 18.0, 6.0, 16.0, 16.0, 12.0, 23.0, 34.0, 29.0, 28.0, 32.0, 44.0, 23.0, 33.0, 43.0, 38.0, 42.0, 41.0, 43.0, 43.0, 45.0, 48.0, 38.0, 34.0, 35.0, 28.0, 25.0, 22.0, 18.0, 26.0, 15.0, 14.0, 17.0, 12.0, 8.0, 11.0, 8.0, 8.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8828125, -3.76837158203125, -3.6539306640625, -3.53948974609375, -3.425048828125, -3.31060791015625, -3.1961669921875, -3.08172607421875, -2.96728515625, -2.85284423828125, -2.7384033203125, -2.62396240234375, -2.509521484375, -2.39508056640625, -2.2806396484375, -2.16619873046875, -2.0517578125, -1.93731689453125, -1.8228759765625, -1.70843505859375, -1.593994140625, -1.47955322265625, -1.3651123046875, -1.25067138671875, -1.13623046875, -1.02178955078125, -0.9073486328125, -0.79290771484375, -0.678466796875, -0.56402587890625, -0.4495849609375, -0.33514404296875, -0.220703125, -0.10626220703125, 0.0081787109375, 0.12261962890625, 0.237060546875, 0.35150146484375, 0.4659423828125, 0.58038330078125, 0.69482421875, 0.80926513671875, 0.9237060546875, 1.03814697265625, 1.152587890625, 1.26702880859375, 1.3814697265625, 1.49591064453125, 1.6103515625, 1.72479248046875, 1.8392333984375, 1.95367431640625, 2.068115234375, 2.18255615234375, 2.2969970703125, 2.41143798828125, 2.52587890625, 2.64031982421875, 2.7547607421875, 2.86920166015625, 2.983642578125, 3.09808349609375, 3.2125244140625, 3.32696533203125, 3.44140625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 10.0, 6.0, 19.0, 18.0, 20.0, 32.0, 40.0, 44.0, 60.0, 98.0, 106.0, 145.0, 241.0, 386.0, 697.0, 1661.0, 4418.0, 14453.0, 59029.0, 278023.0, 998928.0, 1634334.0, 896934.0, 233446.0, 50653.0, 13018.0, 3982.0, 1489.0, 694.0, 401.0, 272.0, 173.0, 124.0, 66.0, 65.0, 45.0, 31.0, 30.0, 17.0, 18.0, 11.0, 10.0, 6.0, 4.0, 9.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.015625, -4.86566162109375, -4.7156982421875, -4.56573486328125, -4.415771484375, -4.26580810546875, -4.1158447265625, -3.96588134765625, -3.81591796875, -3.66595458984375, -3.5159912109375, -3.36602783203125, -3.216064453125, -3.06610107421875, -2.9161376953125, -2.76617431640625, -2.6162109375, -2.46624755859375, -2.3162841796875, -2.16632080078125, -2.016357421875, -1.86639404296875, -1.7164306640625, -1.56646728515625, -1.41650390625, -1.26654052734375, -1.1165771484375, -0.96661376953125, -0.816650390625, -0.66668701171875, -0.5167236328125, -0.36676025390625, -0.216796875, -0.06683349609375, 0.0831298828125, 0.23309326171875, 0.383056640625, 0.53302001953125, 0.6829833984375, 0.83294677734375, 0.98291015625, 1.13287353515625, 1.2828369140625, 1.43280029296875, 1.582763671875, 1.73272705078125, 1.8826904296875, 2.03265380859375, 2.1826171875, 2.33258056640625, 2.4825439453125, 2.63250732421875, 2.782470703125, 2.93243408203125, 3.0823974609375, 3.23236083984375, 3.38232421875, 3.53228759765625, 3.6822509765625, 3.83221435546875, 3.982177734375, 4.13214111328125, 4.2821044921875, 4.43206787109375, 4.58203125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 12.0, 8.0, 21.0, 32.0, 48.0, 86.0, 122.0, 226.0, 357.0, 476.0, 658.0, 600.0, 490.0, 335.0, 197.0, 155.0, 82.0, 68.0, 45.0, 18.0, 16.0, 12.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6328125, -13.243408203125, -12.85400390625, -12.464599609375, -12.0751953125, -11.685791015625, -11.29638671875, -10.906982421875, -10.517578125, -10.128173828125, -9.73876953125, -9.349365234375, -8.9599609375, -8.570556640625, -8.18115234375, -7.791748046875, -7.40234375, -7.012939453125, -6.62353515625, -6.234130859375, -5.8447265625, -5.455322265625, -5.06591796875, -4.676513671875, -4.287109375, -3.897705078125, -3.50830078125, -3.118896484375, -2.7294921875, -2.340087890625, -1.95068359375, -1.561279296875, -1.171875, -0.782470703125, -0.39306640625, -0.003662109375, 0.3857421875, 0.775146484375, 1.16455078125, 1.553955078125, 1.943359375, 2.332763671875, 2.72216796875, 3.111572265625, 3.5009765625, 3.890380859375, 4.27978515625, 4.669189453125, 5.05859375, 5.447998046875, 5.83740234375, 6.226806640625, 6.6162109375, 7.005615234375, 7.39501953125, 7.784423828125, 8.173828125, 8.563232421875, 8.95263671875, 9.342041015625, 9.7314453125, 10.120849609375, 10.51025390625, 10.899658203125, 11.2890625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 9.0, 4.0, 15.0, 18.0, 16.0, 39.0, 59.0, 66.0, 66.0, 134.0, 178.0, 294.0, 548.0, 1541.0, 17613.0, 2139127.0, 2015109.0, 16535.0, 1454.0, 563.0, 308.0, 150.0, 118.0, 81.0, 53.0, 44.0, 29.0, 25.0, 11.0, 16.0, 13.0, 7.0, 9.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.642333984375, -17.83154296875, -17.020751953125, -16.2099609375, -15.399169921875, -14.58837890625, -13.777587890625, -12.966796875, -12.156005859375, -11.34521484375, -10.534423828125, -9.7236328125, -8.912841796875, -8.10205078125, -7.291259765625, -6.48046875, -5.669677734375, -4.85888671875, -4.048095703125, -3.2373046875, -2.426513671875, -1.61572265625, -0.804931640625, 0.005859375, 0.816650390625, 1.62744140625, 2.438232421875, 3.2490234375, 4.059814453125, 4.87060546875, 5.681396484375, 6.4921875, 7.302978515625, 8.11376953125, 8.924560546875, 9.7353515625, 10.546142578125, 11.35693359375, 12.167724609375, 12.978515625, 13.789306640625, 14.60009765625, 15.410888671875, 16.2216796875, 17.032470703125, 17.84326171875, 18.654052734375, 19.46484375, 20.275634765625, 21.08642578125, 21.897216796875, 22.7080078125, 23.518798828125, 24.32958984375, 25.140380859375, 25.951171875, 26.761962890625, 27.57275390625, 28.383544921875, 29.1943359375, 30.005126953125, 30.81591796875, 31.626708984375, 32.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 137.0, 392.0, 366.0, 97.0, 12.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.17577362060547, -76.65739440917969, -72.13900756835938, -67.6206283569336, -63.10224533081055, -58.5838623046875, -54.06548309326172, -49.54710006713867, -45.028717041015625, -40.51033401489258, -35.99195098876953, -31.47357177734375, -26.955188751220703, -22.436805725097656, -17.918424606323242, -13.400043487548828, -8.881660461425781, -4.363278388977051, 0.1551036834716797, 4.67348575592041, 9.19186782836914, 13.710250854492188, 18.2286319732666, 22.747013092041016, 27.265396118164062, 31.78377914428711, 36.302162170410156, 40.82054138183594, 45.338924407958984, 49.85730743408203, 54.37568664550781, 58.89406967163086, 63.41246032714844, 67.93083953857422, 72.44922637939453, 76.96760559082031, 81.48599243164062, 86.0043716430664, 90.52275085449219, 95.0411376953125, 99.55951690673828, 104.07789611816406, 108.59628295898438, 113.11466217041016, 117.63304138183594, 122.15142822265625, 126.66980743408203, 131.1881866455078, 135.70657348632812, 140.22496032714844, 144.7433319091797, 149.26171875, 153.7801055908203, 158.29849243164062, 162.81686401367188, 167.3352508544922, 171.8536376953125, 176.3720245361328, 180.89039611816406, 185.40878295898438, 189.9271697998047, 194.445556640625, 198.96392822265625, 203.48231506347656, 208.0006866455078]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 3.0, 9.0, 4.0, 13.0, 19.0, 21.0, 20.0, 23.0, 21.0, 21.0, 30.0, 27.0, 35.0, 38.0, 49.0, 42.0, 42.0, 54.0, 47.0, 47.0, 39.0, 43.0, 35.0, 33.0, 41.0, 30.0, 27.0, 25.0, 23.0, 18.0, 15.0, 23.0, 14.0, 14.0, 12.0, 9.0, 7.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.767471313476562, -26.87171745300293, -25.975963592529297, -25.080211639404297, -24.184457778930664, -23.28870391845703, -22.3929500579834, -21.497196197509766, -20.601444244384766, -19.705690383911133, -18.8099365234375, -17.9141845703125, -17.018430709838867, -16.122676849365234, -15.226922988891602, -14.331170082092285, -13.435416221618652, -12.53966236114502, -11.643909454345703, -10.74815559387207, -9.852402687072754, -8.956648826599121, -8.060895919799805, -7.165142059326172, -6.269388675689697, -5.373635292053223, -4.477881908416748, -3.5821282863616943, -2.6863749027252197, -1.790621280670166, -0.8948678970336914, 0.0008854866027832031, 0.8966388702392578, 1.7923922538757324, 2.688145637512207, 3.5838992595672607, 4.479652404785156, 5.375406265258789, 6.271159648895264, 7.166913032531738, 8.062665939331055, 8.958419799804688, 9.854172706604004, 10.749926567077637, 11.645679473876953, 12.541433334350586, 13.437187194824219, 14.332940101623535, 15.228693962097168, 16.124446868896484, 17.020200729370117, 17.91595458984375, 18.811708450317383, 19.707462310791016, 20.603214263916016, 21.49896812438965, 22.39472198486328, 23.290475845336914, 24.186229705810547, 25.081981658935547, 25.97773551940918, 26.873489379882812, 27.769243240356445, 28.664997100830078, 29.560749053955078]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 5.0, 6.0, 5.0, 3.0, 13.0, 12.0, 15.0, 15.0, 15.0, 14.0, 21.0, 25.0, 22.0, 33.0, 30.0, 33.0, 35.0, 44.0, 36.0, 34.0, 40.0, 42.0, 50.0, 51.0, 37.0, 45.0, 45.0, 25.0, 24.0, 34.0, 27.0, 23.0, 22.0, 24.0, 16.0, 12.0, 14.0, 20.0, 10.0, 4.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.904296875, -3.79156494140625, -3.6788330078125, -3.56610107421875, -3.453369140625, -3.34063720703125, -3.2279052734375, -3.11517333984375, -3.00244140625, -2.88970947265625, -2.7769775390625, -2.66424560546875, -2.551513671875, -2.43878173828125, -2.3260498046875, -2.21331787109375, -2.1005859375, -1.98785400390625, -1.8751220703125, -1.76239013671875, -1.649658203125, -1.53692626953125, -1.4241943359375, -1.31146240234375, -1.19873046875, -1.08599853515625, -0.9732666015625, -0.86053466796875, -0.747802734375, -0.63507080078125, -0.5223388671875, -0.40960693359375, -0.296875, -0.18414306640625, -0.0714111328125, 0.04132080078125, 0.154052734375, 0.26678466796875, 0.3795166015625, 0.49224853515625, 0.60498046875, 0.71771240234375, 0.8304443359375, 0.94317626953125, 1.055908203125, 1.16864013671875, 1.2813720703125, 1.39410400390625, 1.5068359375, 1.61956787109375, 1.7322998046875, 1.84503173828125, 1.957763671875, 2.07049560546875, 2.1832275390625, 2.29595947265625, 2.40869140625, 2.52142333984375, 2.6341552734375, 2.74688720703125, 2.859619140625, 2.97235107421875, 3.0850830078125, 3.19781494140625, 3.310546875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 18.0, 14.0, 26.0, 58.0, 86.0, 115.0, 140.0, 232.0, 353.0, 511.0, 747.0, 1154.0, 1776.0, 2589.0, 4108.0, 6507.0, 9645.0, 15128.0, 23262.0, 38184.0, 64814.0, 121477.0, 323482.0, 202583.0, 92369.0, 52044.0, 31270.0, 19795.0, 12345.0, 8078.0, 5356.0, 3473.0, 2300.0, 1515.0, 1016.0, 656.0, 432.0, 299.0, 176.0, 118.0, 90.0, 77.0, 43.0, 23.0, 17.0, 14.0, 9.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.89892578125, -0.8723297119140625, -0.845733642578125, -0.8191375732421875, -0.79254150390625, -0.7659454345703125, -0.739349365234375, -0.7127532958984375, -0.6861572265625, -0.6595611572265625, -0.632965087890625, -0.6063690185546875, -0.57977294921875, -0.5531768798828125, -0.526580810546875, -0.4999847412109375, -0.473388671875, -0.4467926025390625, -0.420196533203125, -0.3936004638671875, -0.36700439453125, -0.3404083251953125, -0.313812255859375, -0.2872161865234375, -0.2606201171875, -0.2340240478515625, -0.207427978515625, -0.1808319091796875, -0.15423583984375, -0.1276397705078125, -0.101043701171875, -0.0744476318359375, -0.0478515625, -0.0212554931640625, 0.005340576171875, 0.0319366455078125, 0.05853271484375, 0.0851287841796875, 0.111724853515625, 0.1383209228515625, 0.1649169921875, 0.1915130615234375, 0.218109130859375, 0.2447052001953125, 0.27130126953125, 0.2978973388671875, 0.324493408203125, 0.3510894775390625, 0.377685546875, 0.4042816162109375, 0.430877685546875, 0.4574737548828125, 0.48406982421875, 0.5106658935546875, 0.537261962890625, 0.5638580322265625, 0.5904541015625, 0.6170501708984375, 0.643646240234375, 0.6702423095703125, 0.69683837890625, 0.7234344482421875, 0.750030517578125, 0.7766265869140625, 0.80322265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 5.0, 10.0, 11.0, 10.0, 20.0, 18.0, 18.0, 22.0, 20.0, 32.0, 23.0, 28.0, 38.0, 40.0, 33.0, 48.0, 38.0, 31.0, 34.0, 1057.0, 37.0, 40.0, 41.0, 38.0, 41.0, 39.0, 32.0, 37.0, 25.0, 20.0, 24.0, 17.0, 13.0, 5.0, 9.0, 13.0, 7.0, 3.0, 9.0, 4.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.115081787109375, -2.04461669921875, -1.974151611328125, -1.9036865234375, -1.833221435546875, -1.76275634765625, -1.692291259765625, -1.621826171875, -1.551361083984375, -1.48089599609375, -1.410430908203125, -1.3399658203125, -1.269500732421875, -1.19903564453125, -1.128570556640625, -1.05810546875, -0.987640380859375, -0.91717529296875, -0.846710205078125, -0.7762451171875, -0.705780029296875, -0.63531494140625, -0.564849853515625, -0.494384765625, -0.423919677734375, -0.35345458984375, -0.282989501953125, -0.2125244140625, -0.142059326171875, -0.07159423828125, -0.001129150390625, 0.0693359375, 0.139801025390625, 0.21026611328125, 0.280731201171875, 0.3511962890625, 0.421661376953125, 0.49212646484375, 0.562591552734375, 0.633056640625, 0.703521728515625, 0.77398681640625, 0.844451904296875, 0.9149169921875, 0.985382080078125, 1.05584716796875, 1.126312255859375, 1.19677734375, 1.267242431640625, 1.33770751953125, 1.408172607421875, 1.4786376953125, 1.549102783203125, 1.61956787109375, 1.690032958984375, 1.760498046875, 1.830963134765625, 1.90142822265625, 1.971893310546875, 2.0423583984375, 2.112823486328125, 2.18328857421875, 2.253753662109375, 2.32421875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 8.0, 5.0, 6.0, 8.0, 30.0, 26.0, 47.0, 82.0, 106.0, 156.0, 170.0, 336.0, 506.0, 713.0, 1194.0, 1757.0, 2823.0, 4562.0, 7335.0, 11939.0, 19848.0, 33605.0, 60072.0, 114278.0, 1346599.0, 250285.0, 104873.0, 56236.0, 31583.0, 18122.0, 10904.0, 6849.0, 4161.0, 2817.0, 1759.0, 1157.0, 783.0, 503.0, 289.0, 221.0, 125.0, 89.0, 51.0, 32.0, 26.0, 31.0, 8.0, 9.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.93603515625, -0.9076156616210938, -0.8791961669921875, -0.8507766723632812, -0.822357177734375, -0.7939376831054688, -0.7655181884765625, -0.7370986938476562, -0.70867919921875, -0.6802597045898438, -0.6518402099609375, -0.6234207153320312, -0.595001220703125, -0.5665817260742188, -0.5381622314453125, -0.5097427368164062, -0.4813232421875, -0.45290374755859375, -0.4244842529296875, -0.39606475830078125, -0.367645263671875, -0.33922576904296875, -0.3108062744140625, -0.28238677978515625, -0.25396728515625, -0.22554779052734375, -0.1971282958984375, -0.16870880126953125, -0.140289306640625, -0.11186981201171875, -0.0834503173828125, -0.05503082275390625, -0.026611328125, 0.00180816650390625, 0.0302276611328125, 0.05864715576171875, 0.087066650390625, 0.11548614501953125, 0.1439056396484375, 0.17232513427734375, 0.20074462890625, 0.22916412353515625, 0.2575836181640625, 0.28600311279296875, 0.314422607421875, 0.34284210205078125, 0.3712615966796875, 0.39968109130859375, 0.4281005859375, 0.45652008056640625, 0.4849395751953125, 0.5133590698242188, 0.541778564453125, 0.5701980590820312, 0.5986175537109375, 0.6270370483398438, 0.65545654296875, 0.6838760375976562, 0.7122955322265625, 0.7407150268554688, 0.769134521484375, 0.7975540161132812, 0.8259735107421875, 0.8543930053710938, 0.8828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 2.0, 4.0, 7.0, 8.0, 3.0, 15.0, 12.0, 17.0, 21.0, 24.0, 38.0, 41.0, 46.0, 63.0, 71.0, 73.0, 85.0, 82.0, 74.0, 64.0, 43.0, 39.0, 36.0, 24.0, 16.0, 19.0, 14.0, 9.0, 8.0, 3.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006814002990722656, -0.0006605237722396851, -0.0006396472454071045, -0.0006187707185745239, -0.0005978941917419434, -0.0005770176649093628, -0.0005561411380767822, -0.0005352646112442017, -0.0005143880844116211, -0.0004935115575790405, -0.00047263503074645996, -0.0004517585039138794, -0.00043088197708129883, -0.00041000545024871826, -0.0003891289234161377, -0.00036825239658355713, -0.00034737586975097656, -0.000326499342918396, -0.00030562281608581543, -0.00028474628925323486, -0.0002638697624206543, -0.00024299323558807373, -0.00022211670875549316, -0.0002012401819229126, -0.00018036365509033203, -0.00015948712825775146, -0.0001386106014251709, -0.00011773407459259033, -9.685754776000977e-05, -7.59810209274292e-05, -5.510449409484863e-05, -3.4227967262268066e-05, -1.33514404296875e-05, 7.525086402893066e-06, 2.8401613235473633e-05, 4.92781400680542e-05, 7.015466690063477e-05, 9.103119373321533e-05, 0.0001119077205657959, 0.00013278424739837646, 0.00015366077423095703, 0.0001745373010635376, 0.00019541382789611816, 0.00021629035472869873, 0.0002371668815612793, 0.00025804340839385986, 0.00027891993522644043, 0.000299796462059021, 0.00032067298889160156, 0.00034154951572418213, 0.0003624260425567627, 0.00038330256938934326, 0.00040417909622192383, 0.0004250556230545044, 0.00044593214988708496, 0.00046680867671966553, 0.0004876852035522461, 0.0005085617303848267, 0.0005294382572174072, 0.0005503147840499878, 0.0005711913108825684, 0.0005920678377151489, 0.0006129443645477295, 0.0006338208913803101, 0.0006546974182128906]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 4.0, 5.0, 10.0, 9.0, 18.0, 19.0, 27.0, 45.0, 58.0, 90.0, 179.0, 354.0, 814.0, 29872.0, 1012999.0, 2798.0, 566.0, 255.0, 123.0, 89.0, 62.0, 37.0, 24.0, 13.0, 14.0, 12.0, 4.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01558685302734375, -0.015118718147277832, -0.014650583267211914, -0.014182448387145996, -0.013714313507080078, -0.01324617862701416, -0.012778043746948242, -0.012309908866882324, -0.011841773986816406, -0.011373639106750488, -0.01090550422668457, -0.010437369346618652, -0.009969234466552734, -0.009501099586486816, -0.009032964706420898, -0.00856482982635498, -0.008096694946289062, -0.0076285600662231445, -0.0071604251861572266, -0.006692290306091309, -0.006224155426025391, -0.005756020545959473, -0.005287885665893555, -0.004819750785827637, -0.004351615905761719, -0.0038834810256958008, -0.003415346145629883, -0.002947211265563965, -0.002479076385498047, -0.002010941505432129, -0.001542806625366211, -0.001074671745300293, -0.000606536865234375, -0.00013840198516845703, 0.00032973289489746094, 0.0007978677749633789, 0.0012660026550292969, 0.0017341375350952148, 0.002202272415161133, 0.0026704072952270508, 0.0031385421752929688, 0.0036066770553588867, 0.004074811935424805, 0.004542946815490723, 0.005011081695556641, 0.005479216575622559, 0.0059473514556884766, 0.0064154863357543945, 0.0068836212158203125, 0.0073517560958862305, 0.007819890975952148, 0.008288025856018066, 0.008756160736083984, 0.009224295616149902, 0.00969243049621582, 0.010160565376281738, 0.010628700256347656, 0.011096835136413574, 0.011564970016479492, 0.01203310489654541, 0.012501239776611328, 0.012969374656677246, 0.013437509536743164, 0.013905644416809082, 0.014373779296875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 75.0, 221.0, 352.0, 247.0, 84.0, 19.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001797436154447496, -0.0017618568381294608, -0.0017262775218114257, -0.0016906982054933906, -0.0016551188891753554, -0.0016195395728573203, -0.0015839602565392852, -0.00154838094022125, -0.001512801623903215, -0.0014772223075851798, -0.0014416429912671447, -0.0014060636749491096, -0.0013704843586310744, -0.0013349050423130393, -0.0012993257259950042, -0.001263746409676969, -0.001228167093358934, -0.0011925877770408988, -0.0011570084607228637, -0.0011214291444048285, -0.0010858498280867934, -0.0010502705117687583, -0.0010146911954507232, -0.000979111879132688, -0.0009435325628146529, -0.0009079532464966178, -0.0008723739301785827, -0.0008367946138605475, -0.0008012152975425124, -0.0007656359812244773, -0.0007300566649064422, -0.000694477348588407, -0.0006588980322703719, -0.0006233187159523368, -0.0005877393996343017, -0.0005521600833162665, -0.0005165807669982314, -0.0004810014506801963, -0.00044542213436216116, -0.00040984281804412603, -0.0003742635017260909, -0.0003386841854080558, -0.00030310486909002066, -0.00026752555277198553, -0.0002319462364539504, -0.00019636692013591528, -0.00016078760381788015, -0.00012520828749984503, -8.96289711818099e-05, -5.4049654863774776e-05, -1.847033854573965e-05, 1.7108977772295475e-05, 5.26882940903306e-05, 8.826761040836573e-05, 0.00012384692672640085, 0.00015942624304443598, 0.0001950055593624711, 0.00023058487568050623, 0.00026616419199854136, 0.0003017435083165765, 0.0003373228246346116, 0.00037290214095264673, 0.00040848145727068186, 0.000444060773588717, 0.0004796400899067521]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 3.0, 9.0, 16.0, 10.0, 24.0, 8.0, 15.0, 27.0, 20.0, 27.0, 24.0, 35.0, 31.0, 37.0, 38.0, 38.0, 33.0, 44.0, 31.0, 38.0, 38.0, 30.0, 38.0, 36.0, 34.0, 30.0, 24.0, 38.0, 35.0, 17.0, 31.0, 14.0, 19.0, 12.0, 15.0, 10.0, 7.0, 9.0, 14.0, 7.0, 4.0, 12.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0003033876419067383, -0.0002940865233540535, -0.0002847854048013687, -0.00027548428624868393, -0.00026618316769599915, -0.00025688204914331436, -0.0002475809305906296, -0.0002382798120379448, -0.00022897869348526, -0.00021967757493257523, -0.00021037645637989044, -0.00020107533782720566, -0.00019177421927452087, -0.0001824731007218361, -0.0001731719821691513, -0.00016387086361646652, -0.00015456974506378174, -0.00014526862651109695, -0.00013596750795841217, -0.0001266663894057274, -0.0001173652708530426, -0.00010806415230035782, -9.876303374767303e-05, -8.946191519498825e-05, -8.016079664230347e-05, -7.085967808961868e-05, -6.15585595369339e-05, -5.2257440984249115e-05, -4.295632243156433e-05, -3.365520387887955e-05, -2.4354085326194763e-05, -1.505296677350998e-05, -5.751848220825195e-06, 3.5492703318595886e-06, 1.2850388884544373e-05, 2.2151507437229156e-05, 3.145262598991394e-05, 4.0753744542598724e-05, 5.005486309528351e-05, 5.935598164796829e-05, 6.865710020065308e-05, 7.795821875333786e-05, 8.725933730602264e-05, 9.656045585870743e-05, 0.00010586157441139221, 0.000115162692964077, 0.00012446381151676178, 0.00013376493006944656, 0.00014306604862213135, 0.00015236716717481613, 0.00016166828572750092, 0.0001709694042801857, 0.00018027052283287048, 0.00018957164138555527, 0.00019887275993824005, 0.00020817387849092484, 0.00021747499704360962, 0.0002267761155962944, 0.0002360772341489792, 0.00024537835270166397, 0.00025467947125434875, 0.00026398058980703354, 0.0002732817083597183, 0.0002825828269124031, 0.0002918839454650879]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 5.0, 6.0, 5.0, 3.0, 13.0, 12.0, 15.0, 15.0, 15.0, 14.0, 21.0, 25.0, 22.0, 33.0, 30.0, 33.0, 35.0, 44.0, 36.0, 34.0, 40.0, 42.0, 50.0, 51.0, 37.0, 46.0, 44.0, 25.0, 24.0, 34.0, 27.0, 23.0, 22.0, 24.0, 16.0, 12.0, 14.0, 20.0, 10.0, 4.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.904296875, -3.79156494140625, -3.6788330078125, -3.56610107421875, -3.453369140625, -3.34063720703125, -3.2279052734375, -3.11517333984375, -3.00244140625, -2.88970947265625, -2.7769775390625, -2.66424560546875, -2.551513671875, -2.43878173828125, -2.3260498046875, -2.21331787109375, -2.1005859375, -1.98785400390625, -1.8751220703125, -1.76239013671875, -1.649658203125, -1.53692626953125, -1.4241943359375, -1.31146240234375, -1.19873046875, -1.08599853515625, -0.9732666015625, -0.86053466796875, -0.747802734375, -0.63507080078125, -0.5223388671875, -0.40960693359375, -0.296875, -0.18414306640625, -0.0714111328125, 0.04132080078125, 0.154052734375, 0.26678466796875, 0.3795166015625, 0.49224853515625, 0.60498046875, 0.71771240234375, 0.8304443359375, 0.94317626953125, 1.055908203125, 1.16864013671875, 1.2813720703125, 1.39410400390625, 1.5068359375, 1.61956787109375, 1.7322998046875, 1.84503173828125, 1.957763671875, 2.07049560546875, 2.1832275390625, 2.29595947265625, 2.40869140625, 2.52142333984375, 2.6341552734375, 2.74688720703125, 2.859619140625, 2.97235107421875, 3.0850830078125, 3.19781494140625, 3.310546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 5.0, 10.0, 15.0, 26.0, 39.0, 42.0, 68.0, 82.0, 149.0, 230.0, 315.0, 521.0, 879.0, 1452.0, 2719.0, 5154.0, 10025.0, 19005.0, 36478.0, 70618.0, 138808.0, 247586.0, 240357.0, 132232.0, 67479.0, 34853.0, 18198.0, 9637.0, 5040.0, 2736.0, 1491.0, 832.0, 497.0, 305.0, 218.0, 138.0, 104.0, 74.0, 52.0, 35.0, 21.0, 9.0, 8.0, 10.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.03515625, -2.94580078125, -2.8564453125, -2.76708984375, -2.677734375, -2.58837890625, -2.4990234375, -2.40966796875, -2.3203125, -2.23095703125, -2.1416015625, -2.05224609375, -1.962890625, -1.87353515625, -1.7841796875, -1.69482421875, -1.60546875, -1.51611328125, -1.4267578125, -1.33740234375, -1.248046875, -1.15869140625, -1.0693359375, -0.97998046875, -0.890625, -0.80126953125, -0.7119140625, -0.62255859375, -0.533203125, -0.44384765625, -0.3544921875, -0.26513671875, -0.17578125, -0.08642578125, 0.0029296875, 0.09228515625, 0.181640625, 0.27099609375, 0.3603515625, 0.44970703125, 0.5390625, 0.62841796875, 0.7177734375, 0.80712890625, 0.896484375, 0.98583984375, 1.0751953125, 1.16455078125, 1.25390625, 1.34326171875, 1.4326171875, 1.52197265625, 1.611328125, 1.70068359375, 1.7900390625, 1.87939453125, 1.96875, 2.05810546875, 2.1474609375, 2.23681640625, 2.326171875, 2.41552734375, 2.5048828125, 2.59423828125, 2.68359375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 8.0, 6.0, 7.0, 12.0, 7.0, 12.0, 12.0, 23.0, 17.0, 33.0, 28.0, 35.0, 34.0, 45.0, 45.0, 59.0, 71.0, 114.0, 221.0, 1392.0, 254.0, 124.0, 75.0, 56.0, 47.0, 39.0, 39.0, 36.0, 30.0, 24.0, 19.0, 11.0, 25.0, 15.0, 17.0, 12.0, 6.0, 3.0, 7.0, 6.0, 7.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.704833984375, -13.28466796875, -12.864501953125, -12.4443359375, -12.024169921875, -11.60400390625, -11.183837890625, -10.763671875, -10.343505859375, -9.92333984375, -9.503173828125, -9.0830078125, -8.662841796875, -8.24267578125, -7.822509765625, -7.40234375, -6.982177734375, -6.56201171875, -6.141845703125, -5.7216796875, -5.301513671875, -4.88134765625, -4.461181640625, -4.041015625, -3.620849609375, -3.20068359375, -2.780517578125, -2.3603515625, -1.940185546875, -1.52001953125, -1.099853515625, -0.6796875, -0.259521484375, 0.16064453125, 0.580810546875, 1.0009765625, 1.421142578125, 1.84130859375, 2.261474609375, 2.681640625, 3.101806640625, 3.52197265625, 3.942138671875, 4.3623046875, 4.782470703125, 5.20263671875, 5.622802734375, 6.04296875, 6.463134765625, 6.88330078125, 7.303466796875, 7.7236328125, 8.143798828125, 8.56396484375, 8.984130859375, 9.404296875, 9.824462890625, 10.24462890625, 10.664794921875, 11.0849609375, 11.505126953125, 11.92529296875, 12.345458984375, 12.765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 9.0, 16.0, 33.0, 46.0, 73.0, 113.0, 173.0, 295.0, 662.0, 8434.0, 3129426.0, 5036.0, 629.0, 301.0, 175.0, 103.0, 55.0, 40.0, 27.0, 17.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.875, -59.7001953125, -57.525390625, -55.3505859375, -53.17578125, -51.0009765625, -48.826171875, -46.6513671875, -44.4765625, -42.3017578125, -40.126953125, -37.9521484375, -35.77734375, -33.6025390625, -31.427734375, -29.2529296875, -27.078125, -24.9033203125, -22.728515625, -20.5537109375, -18.37890625, -16.2041015625, -14.029296875, -11.8544921875, -9.6796875, -7.5048828125, -5.330078125, -3.1552734375, -0.98046875, 1.1943359375, 3.369140625, 5.5439453125, 7.71875, 9.8935546875, 12.068359375, 14.2431640625, 16.41796875, 18.5927734375, 20.767578125, 22.9423828125, 25.1171875, 27.2919921875, 29.466796875, 31.6416015625, 33.81640625, 35.9912109375, 38.166015625, 40.3408203125, 42.515625, 44.6904296875, 46.865234375, 49.0400390625, 51.21484375, 53.3896484375, 55.564453125, 57.7392578125, 59.9140625, 62.0888671875, 64.263671875, 66.4384765625, 68.61328125, 70.7880859375, 72.962890625, 75.1376953125, 77.3125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 12.0, 854.0, 150.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.3556137084961, -70.14604187011719, -62.93647003173828, -55.726898193359375, -48.51732635498047, -41.30775833129883, -34.09818649291992, -26.888614654541016, -19.67904281616211, -12.469470977783203, -5.259900093078613, 1.9496707916259766, 9.159242630004883, 16.368812561035156, 23.578384399414062, 30.78795623779297, 37.997528076171875, 45.20709991455078, 52.41667175292969, 59.626243591308594, 66.8358154296875, 74.04537963867188, 81.25495910644531, 88.46452331542969, 95.67410278320312, 102.88367462158203, 110.09324645996094, 117.30281829833984, 124.51239013671875, 131.72195434570312, 138.93153381347656, 146.14109802246094, 153.3506622314453, 160.5602264404297, 167.76980590820312, 174.9793701171875, 182.18894958496094, 189.3985137939453, 196.60809326171875, 203.81765747070312, 211.02723693847656, 218.23680114746094, 225.44638061523438, 232.65594482421875, 239.8655242919922, 247.07508850097656, 254.28466796875, 261.4942321777344, 268.70379638671875, 275.9133605957031, 283.1229248046875, 290.33251953125, 297.5420837402344, 304.75164794921875, 311.9612121582031, 319.1708068847656, 326.38037109375, 333.5899353027344, 340.79949951171875, 348.00909423828125, 355.2186584472656, 362.42822265625, 369.6377868652344, 376.8473815917969, 384.05694580078125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 6.0, 16.0, 15.0, 15.0, 18.0, 10.0, 14.0, 20.0, 34.0, 21.0, 31.0, 34.0, 30.0, 41.0, 42.0, 32.0, 37.0, 32.0, 45.0, 34.0, 35.0, 41.0, 37.0, 35.0, 34.0, 24.0, 24.0, 21.0, 21.0, 19.0, 21.0, 15.0, 22.0, 17.0, 18.0, 12.0, 7.0, 7.0, 7.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.411911010742188, -26.490345001220703, -25.56878089904785, -24.647214889526367, -23.725650787353516, -22.80408477783203, -21.88252067565918, -20.960954666137695, -20.039390563964844, -19.11782455444336, -18.196260452270508, -17.274694442749023, -16.353130340576172, -15.431564331054688, -14.510000228881836, -13.588434219360352, -12.666869163513184, -11.745304107666016, -10.823739051818848, -9.90217399597168, -8.980608940124512, -8.059043884277344, -7.137478351593018, -6.21591329574585, -5.294348239898682, -4.372783184051514, -3.4512181282043457, -2.5296528339385986, -1.6080877780914307, -0.6865224838256836, 0.23504257202148438, 1.1566076278686523, 2.0781726837158203, 2.9997377395629883, 3.9213027954101562, 4.842867851257324, 5.764432907104492, 6.685998439788818, 7.607563495635986, 8.529129028320312, 9.450693130493164, 10.372258186340332, 11.2938232421875, 12.215388298034668, 13.136953353881836, 14.05851936340332, 14.980083465576172, 15.901649475097656, 16.82321548461914, 17.744781494140625, 18.666345596313477, 19.58791160583496, 20.509475708007812, 21.431041717529297, 22.35260581970215, 23.274171829223633, 24.195735931396484, 25.11730194091797, 26.03886604309082, 26.960432052612305, 27.881996154785156, 28.80356216430664, 29.725126266479492, 30.646692276000977, 31.568256378173828]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 7.0, 10.0, 7.0, 14.0, 6.0, 8.0, 16.0, 18.0, 18.0, 17.0, 19.0, 26.0, 28.0, 31.0, 33.0, 39.0, 34.0, 48.0, 34.0, 39.0, 33.0, 30.0, 54.0, 34.0, 37.0, 46.0, 38.0, 38.0, 27.0, 24.0, 26.0, 25.0, 21.0, 19.0, 21.0, 9.0, 17.0, 12.0, 11.0, 5.0, 6.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.97265625, -3.85247802734375, -3.7322998046875, -3.61212158203125, -3.491943359375, -3.37176513671875, -3.2515869140625, -3.13140869140625, -3.01123046875, -2.89105224609375, -2.7708740234375, -2.65069580078125, -2.530517578125, -2.41033935546875, -2.2901611328125, -2.16998291015625, -2.0498046875, -1.92962646484375, -1.8094482421875, -1.68927001953125, -1.569091796875, -1.44891357421875, -1.3287353515625, -1.20855712890625, -1.08837890625, -0.96820068359375, -0.8480224609375, -0.72784423828125, -0.607666015625, -0.48748779296875, -0.3673095703125, -0.24713134765625, -0.126953125, -0.00677490234375, 0.1134033203125, 0.23358154296875, 0.353759765625, 0.47393798828125, 0.5941162109375, 0.71429443359375, 0.83447265625, 0.95465087890625, 1.0748291015625, 1.19500732421875, 1.315185546875, 1.43536376953125, 1.5555419921875, 1.67572021484375, 1.7958984375, 1.91607666015625, 2.0362548828125, 2.15643310546875, 2.276611328125, 2.39678955078125, 2.5169677734375, 2.63714599609375, 2.75732421875, 2.87750244140625, 2.9976806640625, 3.11785888671875, 3.238037109375, 3.35821533203125, 3.4783935546875, 3.59857177734375, 3.71875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 6.0, 12.0, 8.0, 18.0, 12.0, 14.0, 14.0, 24.0, 30.0, 30.0, 40.0, 64.0, 98.0, 146.0, 296.0, 1002.0, 8398.0, 492083.0, 3447118.0, 237655.0, 5494.0, 851.0, 318.0, 149.0, 91.0, 42.0, 43.0, 36.0, 30.0, 27.0, 30.0, 17.0, 13.0, 10.0, 10.0, 8.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.640625, -16.1707763671875, -15.700927734375, -15.2310791015625, -14.76123046875, -14.2913818359375, -13.821533203125, -13.3516845703125, -12.8818359375, -12.4119873046875, -11.942138671875, -11.4722900390625, -11.00244140625, -10.5325927734375, -10.062744140625, -9.5928955078125, -9.123046875, -8.6531982421875, -8.183349609375, -7.7135009765625, -7.24365234375, -6.7738037109375, -6.303955078125, -5.8341064453125, -5.3642578125, -4.8944091796875, -4.424560546875, -3.9547119140625, -3.48486328125, -3.0150146484375, -2.545166015625, -2.0753173828125, -1.60546875, -1.1356201171875, -0.665771484375, -0.1959228515625, 0.27392578125, 0.7437744140625, 1.213623046875, 1.6834716796875, 2.1533203125, 2.6231689453125, 3.093017578125, 3.5628662109375, 4.03271484375, 4.5025634765625, 4.972412109375, 5.4422607421875, 5.912109375, 6.3819580078125, 6.851806640625, 7.3216552734375, 7.79150390625, 8.2613525390625, 8.731201171875, 9.2010498046875, 9.6708984375, 10.1407470703125, 10.610595703125, 11.0804443359375, 11.55029296875, 12.0201416015625, 12.489990234375, 12.9598388671875, 13.4296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 8.0, 14.0, 18.0, 37.0, 44.0, 56.0, 87.0, 139.0, 162.0, 231.0, 321.0, 438.0, 498.0, 484.0, 380.0, 285.0, 254.0, 179.0, 116.0, 85.0, 73.0, 46.0, 31.0, 15.0, 15.0, 11.0, 7.0, 7.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1484375, -7.855712890625, -7.56298828125, -7.270263671875, -6.9775390625, -6.684814453125, -6.39208984375, -6.099365234375, -5.806640625, -5.513916015625, -5.22119140625, -4.928466796875, -4.6357421875, -4.343017578125, -4.05029296875, -3.757568359375, -3.46484375, -3.172119140625, -2.87939453125, -2.586669921875, -2.2939453125, -2.001220703125, -1.70849609375, -1.415771484375, -1.123046875, -0.830322265625, -0.53759765625, -0.244873046875, 0.0478515625, 0.340576171875, 0.63330078125, 0.926025390625, 1.21875, 1.511474609375, 1.80419921875, 2.096923828125, 2.3896484375, 2.682373046875, 2.97509765625, 3.267822265625, 3.560546875, 3.853271484375, 4.14599609375, 4.438720703125, 4.7314453125, 5.024169921875, 5.31689453125, 5.609619140625, 5.90234375, 6.195068359375, 6.48779296875, 6.780517578125, 7.0732421875, 7.365966796875, 7.65869140625, 7.951416015625, 8.244140625, 8.536865234375, 8.82958984375, 9.122314453125, 9.4150390625, 9.707763671875, 10.00048828125, 10.293212890625, 10.5859375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 6.0, 8.0, 21.0, 15.0, 40.0, 58.0, 66.0, 96.0, 160.0, 213.0, 440.0, 1088.0, 18330.0, 3847561.0, 322302.0, 2464.0, 582.0, 288.0, 172.0, 118.0, 79.0, 50.0, 32.0, 22.0, 18.0, 10.0, 12.0, 7.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.109375, -27.016845703125, -25.92431640625, -24.831787109375, -23.7392578125, -22.646728515625, -21.55419921875, -20.461669921875, -19.369140625, -18.276611328125, -17.18408203125, -16.091552734375, -14.9990234375, -13.906494140625, -12.81396484375, -11.721435546875, -10.62890625, -9.536376953125, -8.44384765625, -7.351318359375, -6.2587890625, -5.166259765625, -4.07373046875, -2.981201171875, -1.888671875, -0.796142578125, 0.29638671875, 1.388916015625, 2.4814453125, 3.573974609375, 4.66650390625, 5.759033203125, 6.8515625, 7.944091796875, 9.03662109375, 10.129150390625, 11.2216796875, 12.314208984375, 13.40673828125, 14.499267578125, 15.591796875, 16.684326171875, 17.77685546875, 18.869384765625, 19.9619140625, 21.054443359375, 22.14697265625, 23.239501953125, 24.33203125, 25.424560546875, 26.51708984375, 27.609619140625, 28.7021484375, 29.794677734375, 30.88720703125, 31.979736328125, 33.072265625, 34.164794921875, 35.25732421875, 36.349853515625, 37.4423828125, 38.534912109375, 39.62744140625, 40.719970703125, 41.8125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 40.0, 115.0, 245.0, 318.0, 208.0, 72.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.05057144165039, -43.94791793823242, -40.84526824951172, -37.74261474609375, -34.63996124267578, -31.537309646606445, -28.43465805053711, -25.33200454711914, -22.229352951049805, -19.12670135498047, -16.0240478515625, -12.921396255493164, -9.818743705749512, -6.716091156005859, -3.6134395599365234, -0.5107860565185547, 2.5918655395507812, 5.694518089294434, 8.797170639038086, 11.899822235107422, 15.002474784851074, 18.105127334594727, 21.207778930664062, 24.31043243408203, 27.413084030151367, 30.515735626220703, 33.61838912963867, 36.721038818359375, 39.823692321777344, 42.92634582519531, 46.02899932861328, 49.13165283203125, 52.23430633544922, 55.33695983886719, 58.43960952758789, 61.54226303100586, 64.64491271972656, 67.74756622314453, 70.8502197265625, 73.95287322998047, 77.05552673339844, 80.1581802368164, 83.26083374023438, 86.36347961425781, 89.46613311767578, 92.56878662109375, 95.67144012451172, 98.77409362792969, 101.87673950195312, 104.9793930053711, 108.08204650878906, 111.1846923828125, 114.28734588623047, 117.38999938964844, 120.4926528930664, 123.59530639648438, 126.69795989990234, 129.8006134033203, 132.90325927734375, 136.00592041015625, 139.1085662841797, 142.2112274169922, 145.31387329101562, 148.41653442382812, 151.51918029785156]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 8.0, 5.0, 7.0, 7.0, 6.0, 9.0, 9.0, 12.0, 15.0, 19.0, 15.0, 13.0, 24.0, 27.0, 30.0, 23.0, 30.0, 32.0, 47.0, 37.0, 30.0, 48.0, 41.0, 36.0, 44.0, 46.0, 29.0, 31.0, 28.0, 31.0, 31.0, 26.0, 21.0, 23.0, 19.0, 23.0, 24.0, 14.0, 5.0, 21.0, 11.0, 14.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.873661041259766, -24.083269119262695, -23.292877197265625, -22.502487182617188, -21.712095260620117, -20.921703338623047, -20.13131332397461, -19.34092140197754, -18.55052947998047, -17.7601375579834, -16.969745635986328, -16.17935562133789, -15.38896369934082, -14.59857177734375, -13.808180809020996, -13.017789840698242, -12.227397918701172, -11.437005996704102, -10.646615028381348, -9.856224060058594, -9.065832138061523, -8.275440216064453, -7.485049247741699, -6.694657802581787, -5.904266357421875, -5.113874912261963, -4.323483467102051, -3.5330920219421387, -2.7427005767822266, -1.9523091316223145, -1.1619176864624023, -0.37152624130249023, 0.4188652038574219, 1.209256649017334, 1.999648094177246, 2.790039539337158, 3.5804309844970703, 4.370822429656982, 5.1612138748168945, 5.951605319976807, 6.741996765136719, 7.532388210296631, 8.322779655456543, 9.113170623779297, 9.903562545776367, 10.693954467773438, 11.484345436096191, 12.274736404418945, 13.065128326416016, 13.855520248413086, 14.64591121673584, 15.436302185058594, 16.226694107055664, 17.017086029052734, 17.807476043701172, 18.597867965698242, 19.388259887695312, 20.178651809692383, 20.969043731689453, 21.75943374633789, 22.54982566833496, 23.34021759033203, 24.13060760498047, 24.92099952697754, 25.71139144897461]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 4.0, 3.0, 5.0, 11.0, 10.0, 11.0, 14.0, 17.0, 19.0, 16.0, 21.0, 20.0, 16.0, 21.0, 25.0, 36.0, 30.0, 33.0, 44.0, 37.0, 41.0, 35.0, 33.0, 42.0, 40.0, 46.0, 39.0, 40.0, 27.0, 29.0, 34.0, 34.0, 20.0, 18.0, 32.0, 16.0, 10.0, 13.0, 8.0, 9.0, 12.0, 6.0, 13.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.951171875, -3.836395263671875, -3.72161865234375, -3.606842041015625, -3.4920654296875, -3.377288818359375, -3.26251220703125, -3.147735595703125, -3.032958984375, -2.918182373046875, -2.80340576171875, -2.688629150390625, -2.5738525390625, -2.459075927734375, -2.34429931640625, -2.229522705078125, -2.11474609375, -1.999969482421875, -1.88519287109375, -1.770416259765625, -1.6556396484375, -1.540863037109375, -1.42608642578125, -1.311309814453125, -1.196533203125, -1.081756591796875, -0.96697998046875, -0.852203369140625, -0.7374267578125, -0.622650146484375, -0.50787353515625, -0.393096923828125, -0.2783203125, -0.163543701171875, -0.04876708984375, 0.066009521484375, 0.1807861328125, 0.295562744140625, 0.41033935546875, 0.525115966796875, 0.639892578125, 0.754669189453125, 0.86944580078125, 0.984222412109375, 1.0989990234375, 1.213775634765625, 1.32855224609375, 1.443328857421875, 1.55810546875, 1.672882080078125, 1.78765869140625, 1.902435302734375, 2.0172119140625, 2.131988525390625, 2.24676513671875, 2.361541748046875, 2.476318359375, 2.591094970703125, 2.70587158203125, 2.820648193359375, 2.9354248046875, 3.050201416015625, 3.16497802734375, 3.279754638671875, 3.39453125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 8.0, 15.0, 24.0, 45.0, 65.0, 126.0, 150.0, 261.0, 387.0, 748.0, 1214.0, 1841.0, 2764.0, 4221.0, 6556.0, 10006.0, 15991.0, 25732.0, 42078.0, 73314.0, 146270.0, 343422.0, 169965.0, 81611.0, 46165.0, 27627.0, 17039.0, 10920.0, 6981.0, 4658.0, 3129.0, 1963.0, 1217.0, 747.0, 498.0, 316.0, 173.0, 98.0, 68.0, 44.0, 27.0, 25.0, 15.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.03515625, -1.0052261352539062, -0.9752960205078125, -0.9453659057617188, -0.915435791015625, -0.8855056762695312, -0.8555755615234375, -0.8256454467773438, -0.79571533203125, -0.7657852172851562, -0.7358551025390625, -0.7059249877929688, -0.675994873046875, -0.6460647583007812, -0.6161346435546875, -0.5862045288085938, -0.5562744140625, -0.5263442993164062, -0.4964141845703125, -0.46648406982421875, -0.436553955078125, -0.40662384033203125, -0.3766937255859375, -0.34676361083984375, -0.31683349609375, -0.28690338134765625, -0.2569732666015625, -0.22704315185546875, -0.197113037109375, -0.16718292236328125, -0.1372528076171875, -0.10732269287109375, -0.077392578125, -0.04746246337890625, -0.0175323486328125, 0.01239776611328125, 0.042327880859375, 0.07225799560546875, 0.1021881103515625, 0.13211822509765625, 0.16204833984375, 0.19197845458984375, 0.2219085693359375, 0.25183868408203125, 0.281768798828125, 0.31169891357421875, 0.3416290283203125, 0.37155914306640625, 0.4014892578125, 0.43141937255859375, 0.4613494873046875, 0.49127960205078125, 0.521209716796875, 0.5511398315429688, 0.5810699462890625, 0.6110000610351562, 0.64093017578125, 0.6708602905273438, 0.7007904052734375, 0.7307205200195312, 0.760650634765625, 0.7905807495117188, 0.8205108642578125, 0.8504409790039062, 0.88037109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 7.0, 12.0, 12.0, 16.0, 15.0, 17.0, 32.0, 27.0, 29.0, 29.0, 30.0, 42.0, 37.0, 39.0, 33.0, 52.0, 49.0, 1066.0, 36.0, 44.0, 53.0, 43.0, 36.0, 33.0, 27.0, 35.0, 19.0, 22.0, 12.0, 23.0, 16.0, 14.0, 11.0, 12.0, 4.0, 4.0, 9.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.794921875, -2.7132568359375, -2.631591796875, -2.5499267578125, -2.46826171875, -2.3865966796875, -2.304931640625, -2.2232666015625, -2.1416015625, -2.0599365234375, -1.978271484375, -1.8966064453125, -1.81494140625, -1.7332763671875, -1.651611328125, -1.5699462890625, -1.48828125, -1.4066162109375, -1.324951171875, -1.2432861328125, -1.16162109375, -1.0799560546875, -0.998291015625, -0.9166259765625, -0.8349609375, -0.7532958984375, -0.671630859375, -0.5899658203125, -0.50830078125, -0.4266357421875, -0.344970703125, -0.2633056640625, -0.181640625, -0.0999755859375, -0.018310546875, 0.0633544921875, 0.14501953125, 0.2266845703125, 0.308349609375, 0.3900146484375, 0.4716796875, 0.5533447265625, 0.635009765625, 0.7166748046875, 0.79833984375, 0.8800048828125, 0.961669921875, 1.0433349609375, 1.125, 1.2066650390625, 1.288330078125, 1.3699951171875, 1.45166015625, 1.5333251953125, 1.614990234375, 1.6966552734375, 1.7783203125, 1.8599853515625, 1.941650390625, 2.0233154296875, 2.10498046875, 2.1866455078125, 2.268310546875, 2.3499755859375, 2.431640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 10.0, 10.0, 6.0, 19.0, 27.0, 43.0, 41.0, 83.0, 133.0, 143.0, 243.0, 374.0, 554.0, 828.0, 1333.0, 2127.0, 3454.0, 5872.0, 9813.0, 17078.0, 30213.0, 55291.0, 107327.0, 1358654.0, 278042.0, 103443.0, 52554.0, 28588.0, 16261.0, 9485.0, 5815.0, 3457.0, 2097.0, 1325.0, 874.0, 551.0, 352.0, 204.0, 156.0, 74.0, 65.0, 40.0, 18.0, 23.0, 15.0, 4.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.973236083984375, -0.93963623046875, -0.906036376953125, -0.8724365234375, -0.838836669921875, -0.80523681640625, -0.771636962890625, -0.738037109375, -0.704437255859375, -0.67083740234375, -0.637237548828125, -0.6036376953125, -0.570037841796875, -0.53643798828125, -0.502838134765625, -0.46923828125, -0.435638427734375, -0.40203857421875, -0.368438720703125, -0.3348388671875, -0.301239013671875, -0.26763916015625, -0.234039306640625, -0.200439453125, -0.166839599609375, -0.13323974609375, -0.099639892578125, -0.0660400390625, -0.032440185546875, 0.00115966796875, 0.034759521484375, 0.068359375, 0.101959228515625, 0.13555908203125, 0.169158935546875, 0.2027587890625, 0.236358642578125, 0.26995849609375, 0.303558349609375, 0.337158203125, 0.370758056640625, 0.40435791015625, 0.437957763671875, 0.4715576171875, 0.505157470703125, 0.53875732421875, 0.572357177734375, 0.60595703125, 0.639556884765625, 0.67315673828125, 0.706756591796875, 0.7403564453125, 0.773956298828125, 0.80755615234375, 0.841156005859375, 0.874755859375, 0.908355712890625, 0.94195556640625, 0.975555419921875, 1.0091552734375, 1.042755126953125, 1.07635498046875, 1.109954833984375, 1.1435546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 6.0, 7.0, 11.0, 17.0, 18.0, 20.0, 31.0, 44.0, 53.0, 81.0, 112.0, 116.0, 106.0, 97.0, 75.0, 55.0, 40.0, 25.0, 22.0, 21.0, 12.0, 10.0, 8.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00101470947265625, -0.0009866058826446533, -0.0009585022926330566, -0.00093039870262146, -0.0009022951126098633, -0.0008741915225982666, -0.0008460879325866699, -0.0008179843425750732, -0.0007898807525634766, -0.0007617771625518799, -0.0007336735725402832, -0.0007055699825286865, -0.0006774663925170898, -0.0006493628025054932, -0.0006212592124938965, -0.0005931556224822998, -0.0005650520324707031, -0.0005369484424591064, -0.0005088448524475098, -0.0004807412624359131, -0.0004526376724243164, -0.0004245340824127197, -0.00039643049240112305, -0.00036832690238952637, -0.0003402233123779297, -0.000312119722366333, -0.00028401613235473633, -0.00025591254234313965, -0.00022780895233154297, -0.0001997053623199463, -0.0001716017723083496, -0.00014349818229675293, -0.00011539459228515625, -8.729100227355957e-05, -5.918741226196289e-05, -3.108382225036621e-05, -2.9802322387695312e-06, 2.512335777282715e-05, 5.322694778442383e-05, 8.133053779602051e-05, 0.00010943412780761719, 0.00013753771781921387, 0.00016564130783081055, 0.00019374489784240723, 0.0002218484878540039, 0.0002499520778656006, 0.00027805566787719727, 0.00030615925788879395, 0.0003342628479003906, 0.0003623664379119873, 0.000390470027923584, 0.00041857361793518066, 0.00044667720794677734, 0.000474780797958374, 0.0005028843879699707, 0.0005309879779815674, 0.0005590915679931641, 0.0005871951580047607, 0.0006152987480163574, 0.0006434023380279541, 0.0006715059280395508, 0.0006996095180511475, 0.0007277131080627441, 0.0007558166980743408, 0.0007839202880859375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 8.0, 1.0, 12.0, 11.0, 16.0, 13.0, 32.0, 37.0, 50.0, 79.0, 156.0, 285.0, 1150.0, 970966.0, 74400.0, 702.0, 255.0, 138.0, 71.0, 43.0, 38.0, 32.0, 18.0, 11.0, 12.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169525146484375, -0.01634383201599121, -0.015735149383544922, -0.015126466751098633, -0.014517784118652344, -0.013909101486206055, -0.013300418853759766, -0.012691736221313477, -0.012083053588867188, -0.011474370956420898, -0.01086568832397461, -0.01025700569152832, -0.009648323059082031, -0.009039640426635742, -0.008430957794189453, -0.007822275161743164, -0.007213592529296875, -0.006604909896850586, -0.005996227264404297, -0.005387544631958008, -0.004778861999511719, -0.00417017936706543, -0.0035614967346191406, -0.0029528141021728516, -0.0023441314697265625, -0.0017354488372802734, -0.0011267662048339844, -0.0005180835723876953, 9.059906005859375e-05, 0.0006992816925048828, 0.0013079643249511719, 0.001916646957397461, 0.00252532958984375, 0.003134012222290039, 0.003742694854736328, 0.004351377487182617, 0.004960060119628906, 0.005568742752075195, 0.006177425384521484, 0.0067861080169677734, 0.0073947906494140625, 0.008003473281860352, 0.00861215591430664, 0.00922083854675293, 0.009829521179199219, 0.010438203811645508, 0.011046886444091797, 0.011655569076538086, 0.012264251708984375, 0.012872934341430664, 0.013481616973876953, 0.014090299606323242, 0.014698982238769531, 0.01530766487121582, 0.01591634750366211, 0.0165250301361084, 0.017133712768554688, 0.017742395401000977, 0.018351078033447266, 0.018959760665893555, 0.019568443298339844, 0.020177125930786133, 0.020785808563232422, 0.02139449119567871, 0.022003173828125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 33.0, 135.0, 313.0, 337.0, 149.0, 34.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001753966324031353, -0.0017149875639006495, -0.001676008803769946, -0.0016370301600545645, -0.001598051399923861, -0.0015590726397931576, -0.0015200938796624541, -0.0014811151195317507, -0.001442136475816369, -0.0014031577156856656, -0.0013641789555549622, -0.0013252003118395805, -0.001286221551708877, -0.0012472427915781736, -0.0012082640314474702, -0.0011692852713167667, -0.0011303066276013851, -0.0010913278674706817, -0.0010523491073399782, -0.0010133704636245966, -0.0009743917034938931, -0.0009354129433631897, -0.0008964341832324862, -0.0008574554813094437, -0.0008184766629710793, -0.0007794979028403759, -0.0007405192009173334, -0.0007015404407866299, -0.0006625617388635874, -0.0006235829787328839, -0.0005846042186021805, -0.0005456255166791379, -0.0005066467565484345, -0.0004676680255215615, -0.0004286892944946885, -0.00038971053436398506, -0.0003507318324409425, -0.0003117530723102391, -0.0002727743412833661, -0.0002337956102564931, -0.0001948168792296201, -0.0001558381482027471, -0.0001168594098999165, -7.788067159708589e-05, -3.89019405702129e-05, 7.679045666009188e-08, 3.905553603544831e-05, 7.80342670623213e-05, 0.0001170129980891943, 0.0001559917291160673, 0.00019497046014294028, 0.0002339492057217285, 0.00027292792219668627, 0.0003119066823273897, 0.0003508854133542627, 0.0003898641443811357, 0.0004288428754080087, 0.0004678216064348817, 0.0005068003665655851, 0.0005457790684886277, 0.0005847578286193311, 0.0006237365305423737, 0.0006627152906730771, 0.0007016940508037806, 0.0007406727527268231]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 7.0, 9.0, 7.0, 19.0, 16.0, 16.0, 21.0, 17.0, 23.0, 22.0, 33.0, 33.0, 31.0, 38.0, 47.0, 36.0, 43.0, 36.0, 40.0, 46.0, 35.0, 37.0, 47.0, 44.0, 38.0, 35.0, 32.0, 25.0, 24.0, 21.0, 24.0, 17.0, 10.0, 10.0, 12.0, 9.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003139972686767578, -0.00030429940670728683, -0.00029460154473781586, -0.0002849036827683449, -0.0002752058207988739, -0.0002655079588294029, -0.00025581009685993195, -0.00024611223489046097, -0.00023641437292099, -0.000226716510951519, -0.00021701864898204803, -0.00020732078701257706, -0.00019762292504310608, -0.0001879250630736351, -0.00017822720110416412, -0.00016852933913469315, -0.00015883147716522217, -0.0001491336151957512, -0.0001394357532262802, -0.00012973789125680923, -0.00012004002928733826, -0.00011034216731786728, -0.0001006443053483963, -9.094644337892532e-05, -8.124858140945435e-05, -7.155071943998337e-05, -6.185285747051239e-05, -5.215499550104141e-05, -4.2457133531570435e-05, -3.275927156209946e-05, -2.306140959262848e-05, -1.3363547623157501e-05, -3.6656856536865234e-06, 6.032176315784454e-06, 1.5730038285255432e-05, 2.542790025472641e-05, 3.512576222419739e-05, 4.4823624193668365e-05, 5.452148616313934e-05, 6.421934813261032e-05, 7.39172101020813e-05, 8.361507207155228e-05, 9.331293404102325e-05, 0.00010301079601049423, 0.00011270865797996521, 0.0001224065199494362, 0.00013210438191890717, 0.00014180224388837814, 0.00015150010585784912, 0.0001611979678273201, 0.00017089582979679108, 0.00018059369176626205, 0.00019029155373573303, 0.000199989415705204, 0.000209687277674675, 0.00021938513964414597, 0.00022908300161361694, 0.00023878086358308792, 0.0002484787255525589, 0.0002581765875220299, 0.00026787444949150085, 0.00027757231146097183, 0.0002872701734304428, 0.0002969680353999138, 0.00030666589736938477]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 4.0, 3.0, 5.0, 11.0, 10.0, 11.0, 14.0, 17.0, 19.0, 16.0, 21.0, 20.0, 16.0, 21.0, 25.0, 36.0, 30.0, 33.0, 44.0, 37.0, 41.0, 35.0, 33.0, 42.0, 40.0, 46.0, 39.0, 40.0, 27.0, 29.0, 34.0, 34.0, 20.0, 18.0, 32.0, 16.0, 10.0, 13.0, 8.0, 9.0, 12.0, 6.0, 13.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.951171875, -3.836395263671875, -3.72161865234375, -3.606842041015625, -3.4920654296875, -3.377288818359375, -3.26251220703125, -3.147735595703125, -3.032958984375, -2.918182373046875, -2.80340576171875, -2.688629150390625, -2.5738525390625, -2.459075927734375, -2.34429931640625, -2.229522705078125, -2.11474609375, -1.999969482421875, -1.88519287109375, -1.770416259765625, -1.6556396484375, -1.540863037109375, -1.42608642578125, -1.311309814453125, -1.196533203125, -1.081756591796875, -0.96697998046875, -0.852203369140625, -0.7374267578125, -0.622650146484375, -0.50787353515625, -0.393096923828125, -0.2783203125, -0.163543701171875, -0.04876708984375, 0.066009521484375, 0.1807861328125, 0.295562744140625, 0.41033935546875, 0.525115966796875, 0.639892578125, 0.754669189453125, 0.86944580078125, 0.984222412109375, 1.0989990234375, 1.213775634765625, 1.32855224609375, 1.443328857421875, 1.55810546875, 1.672882080078125, 1.78765869140625, 1.902435302734375, 2.0172119140625, 2.131988525390625, 2.24676513671875, 2.361541748046875, 2.476318359375, 2.591094970703125, 2.70587158203125, 2.820648193359375, 2.9354248046875, 3.050201416015625, 3.16497802734375, 3.279754638671875, 3.39453125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 9.0, 7.0, 17.0, 16.0, 26.0, 35.0, 60.0, 62.0, 126.0, 183.0, 329.0, 494.0, 1013.0, 2399.0, 6633.0, 21911.0, 73697.0, 251660.0, 466608.0, 154978.0, 46332.0, 13836.0, 4409.0, 1760.0, 817.0, 429.0, 233.0, 152.0, 109.0, 56.0, 47.0, 34.0, 19.0, 17.0, 15.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-7.1640625, -6.986328125, -6.80859375, -6.630859375, -6.453125, -6.275390625, -6.09765625, -5.919921875, -5.7421875, -5.564453125, -5.38671875, -5.208984375, -5.03125, -4.853515625, -4.67578125, -4.498046875, -4.3203125, -4.142578125, -3.96484375, -3.787109375, -3.609375, -3.431640625, -3.25390625, -3.076171875, -2.8984375, -2.720703125, -2.54296875, -2.365234375, -2.1875, -2.009765625, -1.83203125, -1.654296875, -1.4765625, -1.298828125, -1.12109375, -0.943359375, -0.765625, -0.587890625, -0.41015625, -0.232421875, -0.0546875, 0.123046875, 0.30078125, 0.478515625, 0.65625, 0.833984375, 1.01171875, 1.189453125, 1.3671875, 1.544921875, 1.72265625, 1.900390625, 2.078125, 2.255859375, 2.43359375, 2.611328125, 2.7890625, 2.966796875, 3.14453125, 3.322265625, 3.5, 3.677734375, 3.85546875, 4.033203125, 4.2109375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 8.0, 13.0, 11.0, 14.0, 17.0, 9.0, 25.0, 28.0, 30.0, 33.0, 44.0, 37.0, 55.0, 59.0, 95.0, 203.0, 1543.0, 256.0, 106.0, 67.0, 64.0, 38.0, 53.0, 42.0, 35.0, 32.0, 32.0, 20.0, 13.0, 14.0, 9.0, 10.0, 6.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.859375, -15.400634765625, -14.94189453125, -14.483154296875, -14.0244140625, -13.565673828125, -13.10693359375, -12.648193359375, -12.189453125, -11.730712890625, -11.27197265625, -10.813232421875, -10.3544921875, -9.895751953125, -9.43701171875, -8.978271484375, -8.51953125, -8.060791015625, -7.60205078125, -7.143310546875, -6.6845703125, -6.225830078125, -5.76708984375, -5.308349609375, -4.849609375, -4.390869140625, -3.93212890625, -3.473388671875, -3.0146484375, -2.555908203125, -2.09716796875, -1.638427734375, -1.1796875, -0.720947265625, -0.26220703125, 0.196533203125, 0.6552734375, 1.114013671875, 1.57275390625, 2.031494140625, 2.490234375, 2.948974609375, 3.40771484375, 3.866455078125, 4.3251953125, 4.783935546875, 5.24267578125, 5.701416015625, 6.16015625, 6.618896484375, 7.07763671875, 7.536376953125, 7.9951171875, 8.453857421875, 8.91259765625, 9.371337890625, 9.830078125, 10.288818359375, 10.74755859375, 11.206298828125, 11.6650390625, 12.123779296875, 12.58251953125, 13.041259765625, 13.5]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 16.0, 19.0, 24.0, 42.0, 64.0, 80.0, 159.0, 289.0, 736.0, 12369.0, 3128561.0, 2291.0, 490.0, 216.0, 102.0, 89.0, 45.0, 28.0, 26.0, 14.0, 12.0, 10.0, 6.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -36.76025390625, -34.3642578125, -31.96826171875, -29.572265625, -27.17626953125, -24.7802734375, -22.38427734375, -19.98828125, -17.59228515625, -15.1962890625, -12.80029296875, -10.404296875, -8.00830078125, -5.6123046875, -3.21630859375, -0.8203125, 1.57568359375, 3.9716796875, 6.36767578125, 8.763671875, 11.15966796875, 13.5556640625, 15.95166015625, 18.34765625, 20.74365234375, 23.1396484375, 25.53564453125, 27.931640625, 30.32763671875, 32.7236328125, 35.11962890625, 37.515625, 39.91162109375, 42.3076171875, 44.70361328125, 47.099609375, 49.49560546875, 51.8916015625, 54.28759765625, 56.68359375, 59.07958984375, 61.4755859375, 63.87158203125, 66.267578125, 68.66357421875, 71.0595703125, 73.45556640625, 75.8515625, 78.24755859375, 80.6435546875, 83.03955078125, 85.435546875, 87.83154296875, 90.2275390625, 92.62353515625, 95.01953125, 97.41552734375, 99.8115234375, 102.20751953125, 104.603515625, 106.99951171875, 109.3955078125, 111.79150390625, 114.1875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 21.0, 64.0, 96.0, 139.0, 184.0, 200.0, 140.0, 80.0, 40.0, 21.0, 13.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.113792419433594, -41.10508346557617, -40.09637451171875, -39.08766555786133, -38.078956604003906, -37.070247650146484, -36.06153869628906, -35.052833557128906, -34.04412078857422, -33.0354118347168, -32.026702880859375, -31.017993927001953, -30.00928497314453, -29.00057601928711, -27.99186897277832, -26.9831600189209, -25.97445297241211, -24.965744018554688, -23.957035064697266, -22.948326110839844, -21.939617156982422, -20.930908203125, -19.92220115661621, -18.91349220275879, -17.904783248901367, -16.896074295043945, -15.887365341186523, -14.878657341003418, -13.869948387145996, -12.861239433288574, -11.852531433105469, -10.843822479248047, -9.835115432739258, -8.826406478881836, -7.817698001861572, -6.808989524841309, -5.800280570983887, -4.791571617126465, -3.782863140106201, -2.7741546630859375, -1.7654457092285156, -0.7567369937896729, 0.2519717216491699, 1.2606804370880127, 2.2693891525268555, 3.2780981063842773, 4.286806583404541, 5.295515060424805, 6.304224014282227, 7.312932968139648, 8.32164192199707, 9.330349922180176, 10.339058876037598, 11.34776782989502, 12.356475830078125, 13.365184783935547, 14.373893737792969, 15.38260269165039, 16.391311645507812, 17.400020599365234, 18.408729553222656, 19.417438507080078, 20.426145553588867, 21.43485450744629, 22.44356346130371]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 8.0, 7.0, 7.0, 10.0, 15.0, 17.0, 18.0, 24.0, 35.0, 31.0, 36.0, 45.0, 37.0, 46.0, 43.0, 42.0, 39.0, 39.0, 46.0, 42.0, 34.0, 44.0, 33.0, 27.0, 33.0, 23.0, 25.0, 27.0, 24.0, 31.0, 18.0, 17.0, 13.0, 11.0, 6.0, 13.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-44.56050109863281, -43.31117630004883, -42.06185531616211, -40.812530517578125, -39.563209533691406, -38.31388473510742, -37.0645637512207, -35.81523895263672, -34.56591796875, -33.316593170166016, -32.0672721862793, -30.817949295043945, -29.568626403808594, -28.319303512573242, -27.06998062133789, -25.820655822753906, -24.571332931518555, -23.322010040283203, -22.07268714904785, -20.8233642578125, -19.57404136657715, -18.324718475341797, -17.075393676757812, -15.826071739196777, -14.576748847961426, -13.327425956726074, -12.078103065490723, -10.828779220581055, -9.579456329345703, -8.330133438110352, -7.080810546875, -5.831487655639648, -4.582164764404297, -3.3328418731689453, -2.0835187435150146, -0.834195613861084, 0.4151272773742676, 1.6644501686096191, 2.913773536682129, 4.1630964279174805, 5.412419319152832, 6.661742210388184, 7.911065101623535, 9.160388946533203, 10.409711837768555, 11.659034729003906, 12.908357620239258, 14.15768051147461, 15.407003402709961, 16.656326293945312, 17.905649185180664, 19.154972076416016, 20.404294967651367, 21.65361785888672, 22.902942657470703, 24.152263641357422, 25.401588439941406, 26.650911331176758, 27.90023422241211, 29.14955711364746, 30.398880004882812, 31.648202896118164, 32.897525787353516, 34.1468505859375, 35.39617156982422]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 2.0, 6.0, 6.0, 3.0, 6.0, 8.0, 13.0, 14.0, 10.0, 16.0, 18.0, 25.0, 10.0, 16.0, 22.0, 23.0, 27.0, 27.0, 16.0, 26.0, 25.0, 48.0, 33.0, 44.0, 40.0, 43.0, 41.0, 26.0, 36.0, 36.0, 40.0, 34.0, 27.0, 24.0, 20.0, 20.0, 24.0, 23.0, 18.0, 20.0, 14.0, 14.0, 6.0, 8.0, 9.0, 7.0, 7.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.900390625, -3.77899169921875, -3.6575927734375, -3.53619384765625, -3.414794921875, -3.29339599609375, -3.1719970703125, -3.05059814453125, -2.92919921875, -2.80780029296875, -2.6864013671875, -2.56500244140625, -2.443603515625, -2.32220458984375, -2.2008056640625, -2.07940673828125, -1.9580078125, -1.83660888671875, -1.7152099609375, -1.59381103515625, -1.472412109375, -1.35101318359375, -1.2296142578125, -1.10821533203125, -0.98681640625, -0.86541748046875, -0.7440185546875, -0.62261962890625, -0.501220703125, -0.37982177734375, -0.2584228515625, -0.13702392578125, -0.015625, 0.10577392578125, 0.2271728515625, 0.34857177734375, 0.469970703125, 0.59136962890625, 0.7127685546875, 0.83416748046875, 0.95556640625, 1.07696533203125, 1.1983642578125, 1.31976318359375, 1.441162109375, 1.56256103515625, 1.6839599609375, 1.80535888671875, 1.9267578125, 2.04815673828125, 2.1695556640625, 2.29095458984375, 2.412353515625, 2.53375244140625, 2.6551513671875, 2.77655029296875, 2.89794921875, 3.01934814453125, 3.1407470703125, 3.26214599609375, 3.383544921875, 3.50494384765625, 3.6263427734375, 3.74774169921875, 3.869140625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 10.0, 8.0, 10.0, 15.0, 12.0, 7.0, 13.0, 22.0, 20.0, 21.0, 22.0, 27.0, 26.0, 42.0, 51.0, 86.0, 216.0, 548.0, 1941.0, 20722.0, 958425.0, 3006934.0, 196833.0, 6241.0, 1091.0, 379.0, 158.0, 82.0, 51.0, 42.0, 31.0, 26.0, 26.0, 20.0, 18.0, 19.0, 11.0, 11.0, 13.0, 8.0, 11.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.4765625, -14.0281982421875, -13.579833984375, -13.1314697265625, -12.68310546875, -12.2347412109375, -11.786376953125, -11.3380126953125, -10.8896484375, -10.4412841796875, -9.992919921875, -9.5445556640625, -9.09619140625, -8.6478271484375, -8.199462890625, -7.7510986328125, -7.302734375, -6.8543701171875, -6.406005859375, -5.9576416015625, -5.50927734375, -5.0609130859375, -4.612548828125, -4.1641845703125, -3.7158203125, -3.2674560546875, -2.819091796875, -2.3707275390625, -1.92236328125, -1.4739990234375, -1.025634765625, -0.5772705078125, -0.12890625, 0.3194580078125, 0.767822265625, 1.2161865234375, 1.66455078125, 2.1129150390625, 2.561279296875, 3.0096435546875, 3.4580078125, 3.9063720703125, 4.354736328125, 4.8031005859375, 5.25146484375, 5.6998291015625, 6.148193359375, 6.5965576171875, 7.044921875, 7.4932861328125, 7.941650390625, 8.3900146484375, 8.83837890625, 9.2867431640625, 9.735107421875, 10.1834716796875, 10.6318359375, 11.0802001953125, 11.528564453125, 11.9769287109375, 12.42529296875, 12.8736572265625, 13.322021484375, 13.7703857421875, 14.21875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 3.0, 3.0, 5.0, 7.0, 11.0, 19.0, 27.0, 41.0, 44.0, 47.0, 65.0, 95.0, 127.0, 163.0, 228.0, 311.0, 363.0, 413.0, 422.0, 425.0, 301.0, 233.0, 176.0, 142.0, 100.0, 83.0, 53.0, 45.0, 31.0, 28.0, 16.0, 10.0, 12.0, 12.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.9306640625, -7.658203125, -7.3857421875, -7.11328125, -6.8408203125, -6.568359375, -6.2958984375, -6.0234375, -5.7509765625, -5.478515625, -5.2060546875, -4.93359375, -4.6611328125, -4.388671875, -4.1162109375, -3.84375, -3.5712890625, -3.298828125, -3.0263671875, -2.75390625, -2.4814453125, -2.208984375, -1.9365234375, -1.6640625, -1.3916015625, -1.119140625, -0.8466796875, -0.57421875, -0.3017578125, -0.029296875, 0.2431640625, 0.515625, 0.7880859375, 1.060546875, 1.3330078125, 1.60546875, 1.8779296875, 2.150390625, 2.4228515625, 2.6953125, 2.9677734375, 3.240234375, 3.5126953125, 3.78515625, 4.0576171875, 4.330078125, 4.6025390625, 4.875, 5.1474609375, 5.419921875, 5.6923828125, 5.96484375, 6.2373046875, 6.509765625, 6.7822265625, 7.0546875, 7.3271484375, 7.599609375, 7.8720703125, 8.14453125, 8.4169921875, 8.689453125, 8.9619140625, 9.234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 14.0, 15.0, 13.0, 27.0, 30.0, 38.0, 44.0, 65.0, 79.0, 113.0, 145.0, 186.0, 236.0, 340.0, 627.0, 3140.0, 266331.0, 3870769.0, 48714.0, 1635.0, 509.0, 280.0, 215.0, 148.0, 135.0, 85.0, 89.0, 75.0, 42.0, 39.0, 29.0, 25.0, 16.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.75, -31.796630859375, -30.84326171875, -29.889892578125, -28.9365234375, -27.983154296875, -27.02978515625, -26.076416015625, -25.123046875, -24.169677734375, -23.21630859375, -22.262939453125, -21.3095703125, -20.356201171875, -19.40283203125, -18.449462890625, -17.49609375, -16.542724609375, -15.58935546875, -14.635986328125, -13.6826171875, -12.729248046875, -11.77587890625, -10.822509765625, -9.869140625, -8.915771484375, -7.96240234375, -7.009033203125, -6.0556640625, -5.102294921875, -4.14892578125, -3.195556640625, -2.2421875, -1.288818359375, -0.33544921875, 0.617919921875, 1.5712890625, 2.524658203125, 3.47802734375, 4.431396484375, 5.384765625, 6.338134765625, 7.29150390625, 8.244873046875, 9.1982421875, 10.151611328125, 11.10498046875, 12.058349609375, 13.01171875, 13.965087890625, 14.91845703125, 15.871826171875, 16.8251953125, 17.778564453125, 18.73193359375, 19.685302734375, 20.638671875, 21.592041015625, 22.54541015625, 23.498779296875, 24.4521484375, 25.405517578125, 26.35888671875, 27.312255859375, 28.265625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 45.0, 195.0, 380.0, 286.0, 95.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.7434844970703, -178.9963836669922, -175.24929809570312, -171.502197265625, -167.75509643554688, -164.00799560546875, -160.2609100341797, -156.51380920410156, -152.76670837402344, -149.0196075439453, -145.27252197265625, -141.52542114257812, -137.7783203125, -134.03121948242188, -130.2841339111328, -126.53703308105469, -122.78993225097656, -119.04283905029297, -115.29573822021484, -111.54864501953125, -107.80154418945312, -104.05445098876953, -100.3073501586914, -96.56025695800781, -92.81316375732422, -89.06607055664062, -85.3189697265625, -81.5718765258789, -77.82477569580078, -74.07768249511719, -70.33058166503906, -66.58348846435547, -62.83638381958008, -59.08928680419922, -55.34218978881836, -51.5950927734375, -47.84799575805664, -44.10089874267578, -40.35380554199219, -36.60670471191406, -32.85961151123047, -29.11251449584961, -25.36541748046875, -21.61832046508789, -17.87122344970703, -14.124128341674805, -10.377031326293945, -6.629934310913086, -2.8828353881835938, 0.8642613887786865, 4.611358165740967, 8.358454704284668, 12.105551719665527, 15.85264778137207, 19.59974479675293, 23.34684181213379, 27.09393882751465, 30.841035842895508, 34.588130950927734, 38.335227966308594, 42.08232498168945, 45.82942199707031, 49.57651901245117, 53.32361602783203, 57.07071304321289]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 5.0, 13.0, 8.0, 12.0, 16.0, 15.0, 17.0, 17.0, 13.0, 31.0, 33.0, 21.0, 39.0, 27.0, 30.0, 35.0, 33.0, 51.0, 41.0, 39.0, 33.0, 25.0, 29.0, 29.0, 41.0, 33.0, 41.0, 30.0, 25.0, 22.0, 28.0, 28.0, 17.0, 18.0, 22.0, 14.0, 9.0, 10.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.10993194580078, -23.26485824584961, -22.419784545898438, -21.574710845947266, -20.729637145996094, -19.884563446044922, -19.03948974609375, -18.194416046142578, -17.349342346191406, -16.504268646240234, -15.659194946289062, -14.81412124633789, -13.969047546386719, -13.123973846435547, -12.278899192810059, -11.433825492858887, -10.588750839233398, -9.743677139282227, -8.898603439331055, -8.053529739379883, -7.208455562591553, -6.363381862640381, -5.518307685852051, -4.673233985900879, -3.828160285949707, -2.983086585998535, -2.138012647628784, -1.2929387092590332, -0.44786500930786133, 0.39720869064331055, 1.2422828674316406, 2.0873565673828125, 2.9324302673339844, 3.7775039672851562, 4.622577667236328, 5.467651844024658, 6.31272554397583, 7.157799243927002, 8.002873420715332, 8.847947120666504, 9.693020820617676, 10.538094520568848, 11.38316822052002, 12.228242874145508, 13.07331657409668, 13.918390274047852, 14.763463973999023, 15.608537673950195, 16.453611373901367, 17.29868507385254, 18.14375877380371, 18.988832473754883, 19.833906173706055, 20.678979873657227, 21.52405548095703, 22.369129180908203, 23.214202880859375, 24.059276580810547, 24.90435028076172, 25.74942398071289, 26.594497680664062, 27.439571380615234, 28.284645080566406, 29.129718780517578, 29.97479248046875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 7.0, 10.0, 10.0, 9.0, 9.0, 8.0, 19.0, 23.0, 18.0, 20.0, 18.0, 17.0, 31.0, 24.0, 29.0, 42.0, 32.0, 38.0, 38.0, 36.0, 48.0, 51.0, 56.0, 49.0, 38.0, 32.0, 32.0, 25.0, 31.0, 29.0, 20.0, 33.0, 20.0, 13.0, 22.0, 15.0, 13.0, 11.0, 4.0, 6.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.76068115234375, -3.6307373046875, -3.50079345703125, -3.370849609375, -3.24090576171875, -3.1109619140625, -2.98101806640625, -2.85107421875, -2.72113037109375, -2.5911865234375, -2.46124267578125, -2.331298828125, -2.20135498046875, -2.0714111328125, -1.94146728515625, -1.8115234375, -1.68157958984375, -1.5516357421875, -1.42169189453125, -1.291748046875, -1.16180419921875, -1.0318603515625, -0.90191650390625, -0.77197265625, -0.64202880859375, -0.5120849609375, -0.38214111328125, -0.252197265625, -0.12225341796875, 0.0076904296875, 0.13763427734375, 0.267578125, 0.39752197265625, 0.5274658203125, 0.65740966796875, 0.787353515625, 0.91729736328125, 1.0472412109375, 1.17718505859375, 1.30712890625, 1.43707275390625, 1.5670166015625, 1.69696044921875, 1.826904296875, 1.95684814453125, 2.0867919921875, 2.21673583984375, 2.3466796875, 2.47662353515625, 2.6065673828125, 2.73651123046875, 2.866455078125, 2.99639892578125, 3.1263427734375, 3.25628662109375, 3.38623046875, 3.51617431640625, 3.6461181640625, 3.77606201171875, 3.906005859375, 4.03594970703125, 4.1658935546875, 4.29583740234375, 4.42578125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 14.0, 25.0, 37.0, 61.0, 86.0, 106.0, 185.0, 225.0, 376.0, 513.0, 795.0, 1142.0, 1672.0, 2312.0, 3415.0, 5095.0, 7324.0, 10500.0, 16051.0, 23769.0, 36053.0, 56112.0, 95801.0, 219123.0, 281075.0, 107063.0, 61402.0, 38884.0, 25740.0, 17101.0, 11564.0, 7904.0, 5348.0, 3637.0, 2528.0, 1704.0, 1128.0, 794.0, 601.0, 382.0, 295.0, 189.0, 145.0, 88.0, 66.0, 42.0, 20.0, 26.0, 10.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.93408203125, -0.905853271484375, -0.87762451171875, -0.849395751953125, -0.8211669921875, -0.792938232421875, -0.76470947265625, -0.736480712890625, -0.708251953125, -0.680023193359375, -0.65179443359375, -0.623565673828125, -0.5953369140625, -0.567108154296875, -0.53887939453125, -0.510650634765625, -0.482421875, -0.454193115234375, -0.42596435546875, -0.397735595703125, -0.3695068359375, -0.341278076171875, -0.31304931640625, -0.284820556640625, -0.256591796875, -0.228363037109375, -0.20013427734375, -0.171905517578125, -0.1436767578125, -0.115447998046875, -0.08721923828125, -0.058990478515625, -0.03076171875, -0.002532958984375, 0.02569580078125, 0.053924560546875, 0.0821533203125, 0.110382080078125, 0.13861083984375, 0.166839599609375, 0.195068359375, 0.223297119140625, 0.25152587890625, 0.279754638671875, 0.3079833984375, 0.336212158203125, 0.36444091796875, 0.392669677734375, 0.4208984375, 0.449127197265625, 0.47735595703125, 0.505584716796875, 0.5338134765625, 0.562042236328125, 0.59027099609375, 0.618499755859375, 0.646728515625, 0.674957275390625, 0.70318603515625, 0.731414794921875, 0.7596435546875, 0.787872314453125, 0.81610107421875, 0.844329833984375, 0.87255859375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 10.0, 8.0, 11.0, 19.0, 19.0, 31.0, 33.0, 33.0, 37.0, 51.0, 36.0, 49.0, 35.0, 45.0, 32.0, 1079.0, 52.0, 50.0, 55.0, 44.0, 39.0, 31.0, 28.0, 27.0, 25.0, 20.0, 23.0, 17.0, 13.0, 9.0, 12.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921875, -2.895782470703125, -2.79937744140625, -2.702972412109375, -2.6065673828125, -2.510162353515625, -2.41375732421875, -2.317352294921875, -2.220947265625, -2.124542236328125, -2.02813720703125, -1.931732177734375, -1.8353271484375, -1.738922119140625, -1.64251708984375, -1.546112060546875, -1.44970703125, -1.353302001953125, -1.25689697265625, -1.160491943359375, -1.0640869140625, -0.967681884765625, -0.87127685546875, -0.774871826171875, -0.678466796875, -0.582061767578125, -0.48565673828125, -0.389251708984375, -0.2928466796875, -0.196441650390625, -0.10003662109375, -0.003631591796875, 0.0927734375, 0.189178466796875, 0.28558349609375, 0.381988525390625, 0.4783935546875, 0.574798583984375, 0.67120361328125, 0.767608642578125, 0.864013671875, 0.960418701171875, 1.05682373046875, 1.153228759765625, 1.2496337890625, 1.346038818359375, 1.44244384765625, 1.538848876953125, 1.63525390625, 1.731658935546875, 1.82806396484375, 1.924468994140625, 2.0208740234375, 2.117279052734375, 2.21368408203125, 2.310089111328125, 2.406494140625, 2.502899169921875, 2.59930419921875, 2.695709228515625, 2.7921142578125, 2.888519287109375, 2.98492431640625, 3.081329345703125, 3.177734375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 20.0, 15.0, 32.0, 51.0, 77.0, 110.0, 172.0, 264.0, 432.0, 717.0, 1122.0, 1861.0, 3096.0, 5204.0, 9042.0, 16512.0, 30901.0, 60401.0, 124593.0, 1428050.0, 222574.0, 91512.0, 45276.0, 23808.0, 13167.0, 7510.0, 4246.0, 2489.0, 1444.0, 900.0, 525.0, 354.0, 219.0, 142.0, 97.0, 67.0, 39.0, 25.0, 12.0, 12.0, 13.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.245025634765625, -1.20587158203125, -1.166717529296875, -1.1275634765625, -1.088409423828125, -1.04925537109375, -1.010101318359375, -0.970947265625, -0.931793212890625, -0.89263916015625, -0.853485107421875, -0.8143310546875, -0.775177001953125, -0.73602294921875, -0.696868896484375, -0.65771484375, -0.618560791015625, -0.57940673828125, -0.540252685546875, -0.5010986328125, -0.461944580078125, -0.42279052734375, -0.383636474609375, -0.344482421875, -0.305328369140625, -0.26617431640625, -0.227020263671875, -0.1878662109375, -0.148712158203125, -0.10955810546875, -0.070404052734375, -0.03125, 0.007904052734375, 0.04705810546875, 0.086212158203125, 0.1253662109375, 0.164520263671875, 0.20367431640625, 0.242828369140625, 0.281982421875, 0.321136474609375, 0.36029052734375, 0.399444580078125, 0.4385986328125, 0.477752685546875, 0.51690673828125, 0.556060791015625, 0.59521484375, 0.634368896484375, 0.67352294921875, 0.712677001953125, 0.7518310546875, 0.790985107421875, 0.83013916015625, 0.869293212890625, 0.908447265625, 0.947601318359375, 0.98675537109375, 1.025909423828125, 1.0650634765625, 1.104217529296875, 1.14337158203125, 1.182525634765625, 1.2216796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 10.0, 9.0, 11.0, 21.0, 22.0, 35.0, 33.0, 54.0, 49.0, 76.0, 129.0, 112.0, 113.0, 60.0, 50.0, 44.0, 21.0, 31.0, 19.0, 27.0, 15.0, 10.0, 11.0, 12.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00054168701171875, -0.0005183443427085876, -0.0004950016736984253, -0.00047165900468826294, -0.0004483163356781006, -0.00042497366666793823, -0.0004016309976577759, -0.0003782883286476135, -0.00035494565963745117, -0.0003316029906272888, -0.00030826032161712646, -0.0002849176526069641, -0.00026157498359680176, -0.0002382323145866394, -0.00021488964557647705, -0.0001915469765663147, -0.00016820430755615234, -0.00014486163854599, -0.00012151896953582764, -9.817630052566528e-05, -7.483363151550293e-05, -5.1490962505340576e-05, -2.8148293495178223e-05, -4.805624485015869e-06, 1.8537044525146484e-05, 4.187971353530884e-05, 6.522238254547119e-05, 8.856505155563354e-05, 0.0001119077205657959, 0.00013525038957595825, 0.0001585930585861206, 0.00018193572759628296, 0.0002052783966064453, 0.00022862106561660767, 0.00025196373462677, 0.0002753064036369324, 0.0002986490726470947, 0.0003219917416572571, 0.00034533441066741943, 0.0003686770796775818, 0.00039201974868774414, 0.0004153624176979065, 0.00043870508670806885, 0.0004620477557182312, 0.00048539042472839355, 0.0005087330937385559, 0.0005320757627487183, 0.0005554184317588806, 0.000578761100769043, 0.0006021037697792053, 0.0006254464387893677, 0.00064878910779953, 0.0006721317768096924, 0.0006954744458198547, 0.0007188171148300171, 0.0007421597838401794, 0.0007655024528503418, 0.0007888451218605042, 0.0008121877908706665, 0.0008355304598808289, 0.0008588731288909912, 0.0008822157979011536, 0.0009055584669113159, 0.0009289011359214783, 0.0009522438049316406]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 9.0, 9.0, 20.0, 17.0, 32.0, 38.0, 48.0, 48.0, 95.0, 112.0, 208.0, 476.0, 1754.0, 550032.0, 492798.0, 1711.0, 469.0, 222.0, 114.0, 76.0, 57.0, 40.0, 34.0, 24.0, 17.0, 15.0, 16.0, 9.0, 6.0, 5.0, 6.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0165863037109375, -0.016171574592590332, -0.015756845474243164, -0.015342116355895996, -0.014927387237548828, -0.01451265811920166, -0.014097929000854492, -0.013683199882507324, -0.013268470764160156, -0.012853741645812988, -0.01243901252746582, -0.012024283409118652, -0.011609554290771484, -0.011194825172424316, -0.010780096054077148, -0.01036536693572998, -0.009950637817382812, -0.009535908699035645, -0.009121179580688477, -0.008706450462341309, -0.00829172134399414, -0.007876992225646973, -0.007462263107299805, -0.007047533988952637, -0.006632804870605469, -0.006218075752258301, -0.005803346633911133, -0.005388617515563965, -0.004973888397216797, -0.004559159278869629, -0.004144430160522461, -0.003729701042175293, -0.003314971923828125, -0.002900242805480957, -0.002485513687133789, -0.002070784568786621, -0.0016560554504394531, -0.0012413263320922852, -0.0008265972137451172, -0.0004118680953979492, 2.86102294921875e-06, 0.0004175901412963867, 0.0008323192596435547, 0.0012470483779907227, 0.0016617774963378906, 0.0020765066146850586, 0.0024912357330322266, 0.0029059648513793945, 0.0033206939697265625, 0.0037354230880737305, 0.0041501522064208984, 0.004564881324768066, 0.004979610443115234, 0.005394339561462402, 0.00580906867980957, 0.006223797798156738, 0.006638526916503906, 0.007053256034851074, 0.007467985153198242, 0.00788271427154541, 0.008297443389892578, 0.008712172508239746, 0.009126901626586914, 0.009541630744934082, 0.00995635986328125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 61.0, 210.0, 326.0, 288.0, 87.0, 29.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001050880760885775, -0.0010099856881424785, -0.0009690905571915209, -0.0009281954844482243, -0.0008873003534972668, -0.0008464052807539701, -0.0008055102080106735, -0.0007646151352673769, -0.0007237200043164194, -0.0006828249315731227, -0.0006419298006221652, -0.0006010347278788686, -0.000560139655135572, -0.0005192445241846144, -0.0004783494514413178, -0.0004374543495941907, -0.00039655924774706364, -0.00035566414589993656, -0.0003147690440528095, -0.00027387397130951285, -0.00023297886946238577, -0.0001920837676152587, -0.00015118869487196207, -0.00011029359302483499, -6.939849117770791e-05, -2.8503396606538445e-05, 1.2391697964631021e-05, 5.328678525984287e-05, 9.418188710696995e-05, 0.00013507698895409703, 0.00017597206169739366, 0.00021686716354452074, 0.00025776238180696964, 0.0002986574836540967, 0.0003395525855012238, 0.0003804476582445204, 0.0004213427600916475, 0.0004622378619387746, 0.0005031329346820712, 0.0005440280074253678, 0.0005849231383763254, 0.000625818211119622, 0.0006667133420705795, 0.0007076084148138762, 0.0007485034875571728, 0.0007893986185081303, 0.0008302936912514269, 0.0008711888222023845, 0.0009120838949456811, 0.0009529789676889777, 0.0009938740404322743, 0.0010347692295908928, 0.0010756643023341894, 0.001116559375077486, 0.0011574544478207827, 0.0011983495205640793, 0.001239244593307376, 0.0012801396660506725, 0.0013210347387939692, 0.0013619298115372658, 0.0014028250006958842, 0.0014437200734391809, 0.0014846151461824775, 0.001525510218925774, 0.0015664054080843925]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 3.0, 7.0, 10.0, 3.0, 17.0, 31.0, 13.0, 24.0, 25.0, 21.0, 33.0, 30.0, 37.0, 44.0, 36.0, 53.0, 52.0, 34.0, 32.0, 40.0, 32.0, 33.0, 46.0, 32.0, 51.0, 33.0, 34.0, 26.0, 28.0, 17.0, 16.0, 13.0, 21.0, 15.0, 11.0, 12.0, 7.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0002950429916381836, -0.00028582941740751266, -0.00027661584317684174, -0.0002674022689461708, -0.0002581886947154999, -0.00024897512048482895, -0.00023976154625415802, -0.0002305479720234871, -0.00022133439779281616, -0.00021212082356214523, -0.0002029072493314743, -0.00019369367510080338, -0.00018448010087013245, -0.00017526652663946152, -0.0001660529524087906, -0.00015683937817811966, -0.00014762580394744873, -0.0001384122297167778, -0.00012919865548610687, -0.00011998508125543594, -0.00011077150702476501, -0.00010155793279409409, -9.234435856342316e-05, -8.313078433275223e-05, -7.39172101020813e-05, -6.470363587141037e-05, -5.549006164073944e-05, -4.627648741006851e-05, -3.706291317939758e-05, -2.7849338948726654e-05, -1.8635764718055725e-05, -9.422190487384796e-06, -2.086162567138672e-07, 9.004957973957062e-06, 1.821853220462799e-05, 2.743210643529892e-05, 3.664568066596985e-05, 4.585925489664078e-05, 5.5072829127311707e-05, 6.428640335798264e-05, 7.349997758865356e-05, 8.27135518193245e-05, 9.192712604999542e-05, 0.00010114070028066635, 0.00011035427451133728, 0.00011956784874200821, 0.00012878142297267914, 0.00013799499720335007, 0.000147208571434021, 0.00015642214566469193, 0.00016563571989536285, 0.00017484929412603378, 0.0001840628683567047, 0.00019327644258737564, 0.00020249001681804657, 0.0002117035910487175, 0.00022091716527938843, 0.00023013073951005936, 0.00023934431374073029, 0.0002485578879714012, 0.00025777146220207214, 0.00026698503643274307, 0.000276198610663414, 0.00028541218489408493, 0.00029462575912475586]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 7.0, 10.0, 10.0, 9.0, 9.0, 8.0, 19.0, 23.0, 18.0, 20.0, 18.0, 17.0, 31.0, 24.0, 29.0, 42.0, 32.0, 38.0, 38.0, 36.0, 48.0, 51.0, 56.0, 49.0, 38.0, 32.0, 32.0, 25.0, 31.0, 29.0, 20.0, 33.0, 20.0, 13.0, 22.0, 15.0, 13.0, 11.0, 4.0, 6.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.76068115234375, -3.6307373046875, -3.50079345703125, -3.370849609375, -3.24090576171875, -3.1109619140625, -2.98101806640625, -2.85107421875, -2.72113037109375, -2.5911865234375, -2.46124267578125, -2.331298828125, -2.20135498046875, -2.0714111328125, -1.94146728515625, -1.8115234375, -1.68157958984375, -1.5516357421875, -1.42169189453125, -1.291748046875, -1.16180419921875, -1.0318603515625, -0.90191650390625, -0.77197265625, -0.64202880859375, -0.5120849609375, -0.38214111328125, -0.252197265625, -0.12225341796875, 0.0076904296875, 0.13763427734375, 0.267578125, 0.39752197265625, 0.5274658203125, 0.65740966796875, 0.787353515625, 0.91729736328125, 1.0472412109375, 1.17718505859375, 1.30712890625, 1.43707275390625, 1.5670166015625, 1.69696044921875, 1.826904296875, 1.95684814453125, 2.0867919921875, 2.21673583984375, 2.3466796875, 2.47662353515625, 2.6065673828125, 2.73651123046875, 2.866455078125, 2.99639892578125, 3.1263427734375, 3.25628662109375, 3.38623046875, 3.51617431640625, 3.6461181640625, 3.77606201171875, 3.906005859375, 4.03594970703125, 4.1658935546875, 4.29583740234375, 4.42578125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 5.0, 22.0, 26.0, 19.0, 33.0, 38.0, 70.0, 89.0, 132.0, 183.0, 289.0, 479.0, 834.0, 1440.0, 2923.0, 6245.0, 13893.0, 32270.0, 78282.0, 192074.0, 375377.0, 199909.0, 82389.0, 33916.0, 14408.0, 6311.0, 3031.0, 1553.0, 844.0, 503.0, 287.0, 195.0, 136.0, 96.0, 74.0, 54.0, 31.0, 24.0, 12.0, 14.0, 15.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.861328125, -3.734832763671875, -3.60833740234375, -3.481842041015625, -3.3553466796875, -3.228851318359375, -3.10235595703125, -2.975860595703125, -2.849365234375, -2.722869873046875, -2.59637451171875, -2.469879150390625, -2.3433837890625, -2.216888427734375, -2.09039306640625, -1.963897705078125, -1.83740234375, -1.710906982421875, -1.58441162109375, -1.457916259765625, -1.3314208984375, -1.204925537109375, -1.07843017578125, -0.951934814453125, -0.825439453125, -0.698944091796875, -0.57244873046875, -0.445953369140625, -0.3194580078125, -0.192962646484375, -0.06646728515625, 0.060028076171875, 0.1865234375, 0.313018798828125, 0.43951416015625, 0.566009521484375, 0.6925048828125, 0.819000244140625, 0.94549560546875, 1.071990966796875, 1.198486328125, 1.324981689453125, 1.45147705078125, 1.577972412109375, 1.7044677734375, 1.830963134765625, 1.95745849609375, 2.083953857421875, 2.21044921875, 2.336944580078125, 2.46343994140625, 2.589935302734375, 2.7164306640625, 2.842926025390625, 2.96942138671875, 3.095916748046875, 3.222412109375, 3.348907470703125, 3.47540283203125, 3.601898193359375, 3.7283935546875, 3.854888916015625, 3.98138427734375, 4.107879638671875, 4.234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 3.0, 6.0, 15.0, 10.0, 10.0, 13.0, 18.0, 24.0, 38.0, 31.0, 34.0, 46.0, 48.0, 61.0, 82.0, 150.0, 353.0, 1427.0, 172.0, 89.0, 61.0, 42.0, 58.0, 51.0, 34.0, 38.0, 26.0, 26.0, 9.0, 19.0, 12.0, 11.0, 5.0, 4.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.1527099609375, -16.649169921875, -16.1456298828125, -15.64208984375, -15.1385498046875, -14.635009765625, -14.1314697265625, -13.6279296875, -13.1243896484375, -12.620849609375, -12.1173095703125, -11.61376953125, -11.1102294921875, -10.606689453125, -10.1031494140625, -9.599609375, -9.0960693359375, -8.592529296875, -8.0889892578125, -7.58544921875, -7.0819091796875, -6.578369140625, -6.0748291015625, -5.5712890625, -5.0677490234375, -4.564208984375, -4.0606689453125, -3.55712890625, -3.0535888671875, -2.550048828125, -2.0465087890625, -1.54296875, -1.0394287109375, -0.535888671875, -0.0323486328125, 0.47119140625, 0.9747314453125, 1.478271484375, 1.9818115234375, 2.4853515625, 2.9888916015625, 3.492431640625, 3.9959716796875, 4.49951171875, 5.0030517578125, 5.506591796875, 6.0101318359375, 6.513671875, 7.0172119140625, 7.520751953125, 8.0242919921875, 8.52783203125, 9.0313720703125, 9.534912109375, 10.0384521484375, 10.5419921875, 11.0455322265625, 11.549072265625, 12.0526123046875, 12.55615234375, 13.0596923828125, 13.563232421875, 14.0667724609375, 14.5703125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 6.0, 6.0, 9.0, 13.0, 16.0, 17.0, 25.0, 35.0, 63.0, 94.0, 146.0, 254.0, 467.0, 1335.0, 512714.0, 2627833.0, 1453.0, 467.0, 273.0, 151.0, 96.0, 63.0, 42.0, 27.0, 19.0, 11.0, 12.0, 9.0, 9.0, 10.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-87.0625, -84.7744140625, -82.486328125, -80.1982421875, -77.91015625, -75.6220703125, -73.333984375, -71.0458984375, -68.7578125, -66.4697265625, -64.181640625, -61.8935546875, -59.60546875, -57.3173828125, -55.029296875, -52.7412109375, -50.453125, -48.1650390625, -45.876953125, -43.5888671875, -41.30078125, -39.0126953125, -36.724609375, -34.4365234375, -32.1484375, -29.8603515625, -27.572265625, -25.2841796875, -22.99609375, -20.7080078125, -18.419921875, -16.1318359375, -13.84375, -11.5556640625, -9.267578125, -6.9794921875, -4.69140625, -2.4033203125, -0.115234375, 2.1728515625, 4.4609375, 6.7490234375, 9.037109375, 11.3251953125, 13.61328125, 15.9013671875, 18.189453125, 20.4775390625, 22.765625, 25.0537109375, 27.341796875, 29.6298828125, 31.91796875, 34.2060546875, 36.494140625, 38.7822265625, 41.0703125, 43.3583984375, 45.646484375, 47.9345703125, 50.22265625, 52.5107421875, 54.798828125, 57.0869140625, 59.375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.0, 962.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-452.3536376953125, -444.18548583984375, -436.0173034667969, -427.84912109375, -419.68096923828125, -411.5128173828125, -403.3446350097656, -395.17645263671875, -387.00830078125, -378.84014892578125, -370.6719665527344, -362.5037841796875, -354.33563232421875, -346.16748046875, -337.9992980957031, -329.83111572265625, -321.6629638671875, -313.49481201171875, -305.3266296386719, -297.158447265625, -288.99029541015625, -280.8221435546875, -272.6539611816406, -264.48577880859375, -256.317626953125, -248.1494598388672, -239.98129272460938, -231.81312561035156, -223.64495849609375, -215.47679138183594, -207.30862426757812, -199.1404571533203, -190.9722900390625, -182.8041229248047, -174.63595581054688, -166.46778869628906, -158.29962158203125, -150.13145446777344, -141.96328735351562, -133.7951202392578, -125.626953125, -117.45878601074219, -109.29061889648438, -101.12245178222656, -92.95428466796875, -84.78611755371094, -76.61795043945312, -68.44978332519531, -60.2816162109375, -52.11344909667969, -43.945281982421875, -35.77711486816406, -27.60894775390625, -19.440780639648438, -11.272613525390625, -3.1044464111328125, 5.063720703125, 13.231887817382812, 21.400054931640625, 29.568222045898438, 37.73638916015625, 45.90455627441406, 54.072723388671875, 62.24089050292969, 70.4090576171875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 5.0, 6.0, 10.0, 13.0, 20.0, 21.0, 20.0, 18.0, 22.0, 22.0, 24.0, 30.0, 20.0, 27.0, 41.0, 47.0, 25.0, 36.0, 38.0, 48.0, 32.0, 36.0, 49.0, 37.0, 35.0, 38.0, 34.0, 34.0, 32.0, 28.0, 15.0, 21.0, 13.0, 11.0, 17.0, 11.0, 9.0, 7.0, 10.0, 5.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0], "bins": [-37.644283294677734, -36.58751678466797, -35.5307502746582, -34.47398376464844, -33.41721725463867, -32.360450744628906, -31.30368423461914, -30.246917724609375, -29.19015121459961, -28.133384704589844, -27.076618194580078, -26.019851684570312, -24.963085174560547, -23.90631866455078, -22.849552154541016, -21.79278564453125, -20.736019134521484, -19.67925262451172, -18.622486114501953, -17.565719604492188, -16.508953094482422, -15.452186584472656, -14.39542007446289, -13.338653564453125, -12.28188705444336, -11.225120544433594, -10.168354034423828, -9.111587524414062, -8.054821014404297, -6.998054504394531, -5.941287994384766, -4.884521484375, -3.8277549743652344, -2.7709884643554688, -1.7142219543457031, -0.6574554443359375, 0.3993110656738281, 1.4560775756835938, 2.5128440856933594, 3.569610595703125, 4.626377105712891, 5.683143615722656, 6.739910125732422, 7.7966766357421875, 8.853443145751953, 9.910209655761719, 10.966976165771484, 12.02374267578125, 13.080509185791016, 14.137275695800781, 15.194042205810547, 16.250808715820312, 17.307575225830078, 18.364341735839844, 19.42110824584961, 20.477874755859375, 21.53464126586914, 22.591407775878906, 23.648174285888672, 24.704940795898438, 25.761707305908203, 26.81847381591797, 27.875240325927734, 28.9320068359375, 29.988773345947266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 9.0, 4.0, 7.0, 10.0, 10.0, 18.0, 9.0, 15.0, 17.0, 26.0, 16.0, 21.0, 23.0, 21.0, 35.0, 29.0, 41.0, 31.0, 44.0, 51.0, 38.0, 41.0, 54.0, 50.0, 46.0, 42.0, 33.0, 38.0, 25.0, 22.0, 26.0, 27.0, 20.0, 12.0, 18.0, 17.0, 9.0, 12.0, 9.0, 5.0, 4.0, 8.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.3214111328125, -4.174072265625, -4.0267333984375, -3.87939453125, -3.7320556640625, -3.584716796875, -3.4373779296875, -3.2900390625, -3.1427001953125, -2.995361328125, -2.8480224609375, -2.70068359375, -2.5533447265625, -2.406005859375, -2.2586669921875, -2.111328125, -1.9639892578125, -1.816650390625, -1.6693115234375, -1.52197265625, -1.3746337890625, -1.227294921875, -1.0799560546875, -0.9326171875, -0.7852783203125, -0.637939453125, -0.4906005859375, -0.34326171875, -0.1959228515625, -0.048583984375, 0.0987548828125, 0.24609375, 0.3934326171875, 0.540771484375, 0.6881103515625, 0.83544921875, 0.9827880859375, 1.130126953125, 1.2774658203125, 1.4248046875, 1.5721435546875, 1.719482421875, 1.8668212890625, 2.01416015625, 2.1614990234375, 2.308837890625, 2.4561767578125, 2.603515625, 2.7508544921875, 2.898193359375, 3.0455322265625, 3.19287109375, 3.3402099609375, 3.487548828125, 3.6348876953125, 3.7822265625, 3.9295654296875, 4.076904296875, 4.2242431640625, 4.37158203125, 4.5189208984375, 4.666259765625, 4.8135986328125, 4.9609375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 2.0, 6.0, 3.0, 12.0, 9.0, 13.0, 19.0, 16.0, 19.0, 20.0, 32.0, 20.0, 63.0, 77.0, 108.0, 224.0, 370.0, 977.0, 5220.0, 98294.0, 1869728.0, 2086873.0, 124052.0, 6013.0, 1037.0, 431.0, 198.0, 115.0, 68.0, 62.0, 42.0, 20.0, 34.0, 16.0, 18.0, 19.0, 9.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.8671875, -12.4776611328125, -12.088134765625, -11.6986083984375, -11.30908203125, -10.9195556640625, -10.530029296875, -10.1405029296875, -9.7509765625, -9.3614501953125, -8.971923828125, -8.5823974609375, -8.19287109375, -7.8033447265625, -7.413818359375, -7.0242919921875, -6.634765625, -6.2452392578125, -5.855712890625, -5.4661865234375, -5.07666015625, -4.6871337890625, -4.297607421875, -3.9080810546875, -3.5185546875, -3.1290283203125, -2.739501953125, -2.3499755859375, -1.96044921875, -1.5709228515625, -1.181396484375, -0.7918701171875, -0.40234375, -0.0128173828125, 0.376708984375, 0.7662353515625, 1.15576171875, 1.5452880859375, 1.934814453125, 2.3243408203125, 2.7138671875, 3.1033935546875, 3.492919921875, 3.8824462890625, 4.27197265625, 4.6614990234375, 5.051025390625, 5.4405517578125, 5.830078125, 6.2196044921875, 6.609130859375, 6.9986572265625, 7.38818359375, 7.7777099609375, 8.167236328125, 8.5567626953125, 8.9462890625, 9.3358154296875, 9.725341796875, 10.1148681640625, 10.50439453125, 10.8939208984375, 11.283447265625, 11.6729736328125, 12.0625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 3.0, 9.0, 7.0, 15.0, 16.0, 19.0, 24.0, 42.0, 39.0, 48.0, 91.0, 101.0, 123.0, 180.0, 221.0, 279.0, 344.0, 444.0, 390.0, 389.0, 320.0, 256.0, 173.0, 140.0, 101.0, 71.0, 61.0, 50.0, 31.0, 26.0, 12.0, 14.0, 8.0, 8.0, 7.0, 5.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.523193359375, -8.25732421875, -7.991455078125, -7.7255859375, -7.459716796875, -7.19384765625, -6.927978515625, -6.662109375, -6.396240234375, -6.13037109375, -5.864501953125, -5.5986328125, -5.332763671875, -5.06689453125, -4.801025390625, -4.53515625, -4.269287109375, -4.00341796875, -3.737548828125, -3.4716796875, -3.205810546875, -2.93994140625, -2.674072265625, -2.408203125, -2.142333984375, -1.87646484375, -1.610595703125, -1.3447265625, -1.078857421875, -0.81298828125, -0.547119140625, -0.28125, -0.015380859375, 0.25048828125, 0.516357421875, 0.7822265625, 1.048095703125, 1.31396484375, 1.579833984375, 1.845703125, 2.111572265625, 2.37744140625, 2.643310546875, 2.9091796875, 3.175048828125, 3.44091796875, 3.706787109375, 3.97265625, 4.238525390625, 4.50439453125, 4.770263671875, 5.0361328125, 5.302001953125, 5.56787109375, 5.833740234375, 6.099609375, 6.365478515625, 6.63134765625, 6.897216796875, 7.1630859375, 7.428955078125, 7.69482421875, 7.960693359375, 8.2265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 8.0, 11.0, 14.0, 21.0, 29.0, 33.0, 47.0, 60.0, 95.0, 101.0, 134.0, 202.0, 258.0, 363.0, 680.0, 5480.0, 1759094.0, 2418456.0, 7071.0, 669.0, 376.0, 255.0, 194.0, 160.0, 106.0, 93.0, 70.0, 49.0, 38.0, 35.0, 14.0, 19.0, 15.0, 4.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.315185546875, -29.27099609375, -28.226806640625, -27.1826171875, -26.138427734375, -25.09423828125, -24.050048828125, -23.005859375, -21.961669921875, -20.91748046875, -19.873291015625, -18.8291015625, -17.784912109375, -16.74072265625, -15.696533203125, -14.65234375, -13.608154296875, -12.56396484375, -11.519775390625, -10.4755859375, -9.431396484375, -8.38720703125, -7.343017578125, -6.298828125, -5.254638671875, -4.21044921875, -3.166259765625, -2.1220703125, -1.077880859375, -0.03369140625, 1.010498046875, 2.0546875, 3.098876953125, 4.14306640625, 5.187255859375, 6.2314453125, 7.275634765625, 8.31982421875, 9.364013671875, 10.408203125, 11.452392578125, 12.49658203125, 13.540771484375, 14.5849609375, 15.629150390625, 16.67333984375, 17.717529296875, 18.76171875, 19.805908203125, 20.85009765625, 21.894287109375, 22.9384765625, 23.982666015625, 25.02685546875, 26.071044921875, 27.115234375, 28.159423828125, 29.20361328125, 30.247802734375, 31.2919921875, 32.336181640625, 33.38037109375, 34.424560546875, 35.46875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 14.0, 31.0, 64.0, 121.0, 179.0, 178.0, 188.0, 114.0, 65.0, 34.0, 13.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.81599044799805, -40.04401397705078, -38.27203369140625, -36.50005340576172, -34.72807693481445, -32.95610046386719, -31.184120178222656, -29.412141799926758, -27.64016342163086, -25.86818504333496, -24.096206665039062, -22.324228286743164, -20.552249908447266, -18.780271530151367, -17.00829315185547, -15.23631477355957, -13.464336395263672, -11.692358016967773, -9.920379638671875, -8.148401260375977, -6.376422882080078, -4.60444450378418, -2.8324661254882812, -1.0604877471923828, 0.7114906311035156, 2.483469009399414, 4.2554473876953125, 6.027425765991211, 7.799404144287109, 9.571382522583008, 11.343360900878906, 13.115339279174805, 14.887313842773438, 16.659292221069336, 18.431270599365234, 20.203248977661133, 21.97522735595703, 23.74720573425293, 25.519184112548828, 27.291162490844727, 29.063140869140625, 30.835119247436523, 32.60709762573242, 34.37907409667969, 36.15105438232422, 37.92303466796875, 39.695011138916016, 41.46698760986328, 43.23896789550781, 45.010948181152344, 46.78292465209961, 48.554901123046875, 50.326881408691406, 52.09886169433594, 53.8708381652832, 55.64281463623047, 57.414794921875, 59.18677520751953, 60.9587516784668, 62.73072814941406, 64.5027084350586, 66.27468872070312, 68.04666137695312, 69.81864166259766, 71.59062194824219]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 5.0, 11.0, 8.0, 12.0, 15.0, 24.0, 27.0, 21.0, 29.0, 33.0, 32.0, 30.0, 24.0, 41.0, 46.0, 39.0, 36.0, 43.0, 37.0, 32.0, 47.0, 38.0, 36.0, 37.0, 37.0, 28.0, 38.0, 34.0, 20.0, 20.0, 15.0, 20.0, 22.0, 10.0, 5.0, 18.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.399795532226562, -28.469858169555664, -27.539920806884766, -26.6099853515625, -25.6800479888916, -24.750110626220703, -23.820175170898438, -22.89023780822754, -21.96030044555664, -21.030363082885742, -20.100425720214844, -19.170490264892578, -18.24055290222168, -17.31061553955078, -16.380680084228516, -15.450742721557617, -14.520805358886719, -13.59086799621582, -12.660931587219238, -11.730995178222656, -10.801057815551758, -9.87112045288086, -8.941184043884277, -8.011247634887695, -7.081310272216797, -6.151373386383057, -5.221436500549316, -4.291499614715576, -3.361562728881836, -2.4316258430480957, -1.5016889572143555, -0.5717520713806152, 0.358184814453125, 1.2881217002868652, 2.2180585861206055, 3.1479954719543457, 4.077932357788086, 5.007869243621826, 5.937806129455566, 6.867743015289307, 7.797679901123047, 8.727617263793945, 9.657553672790527, 10.58749008178711, 11.517427444458008, 12.447364807128906, 13.377301216125488, 14.30723762512207, 15.237174987792969, 16.167112350463867, 17.097049713134766, 18.02698516845703, 18.95692253112793, 19.886859893798828, 20.816795349121094, 21.746732711791992, 22.67667007446289, 23.60660743713379, 24.536544799804688, 25.466480255126953, 26.39641761779785, 27.32635498046875, 28.256290435791016, 29.186227798461914, 30.116165161132812]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 9.0, 5.0, 5.0, 9.0, 10.0, 4.0, 12.0, 11.0, 14.0, 11.0, 8.0, 17.0, 39.0, 41.0, 26.0, 22.0, 29.0, 25.0, 41.0, 34.0, 34.0, 47.0, 35.0, 36.0, 43.0, 46.0, 44.0, 35.0, 34.0, 30.0, 40.0, 24.0, 38.0, 18.0, 18.0, 13.0, 17.0, 9.0, 12.0, 11.0, 8.0, 11.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.728546142578125, -3.59576416015625, -3.462982177734375, -3.3302001953125, -3.197418212890625, -3.06463623046875, -2.931854248046875, -2.799072265625, -2.666290283203125, -2.53350830078125, -2.400726318359375, -2.2679443359375, -2.135162353515625, -2.00238037109375, -1.869598388671875, -1.73681640625, -1.604034423828125, -1.47125244140625, -1.338470458984375, -1.2056884765625, -1.072906494140625, -0.94012451171875, -0.807342529296875, -0.674560546875, -0.541778564453125, -0.40899658203125, -0.276214599609375, -0.1434326171875, -0.010650634765625, 0.12213134765625, 0.254913330078125, 0.3876953125, 0.520477294921875, 0.65325927734375, 0.786041259765625, 0.9188232421875, 1.051605224609375, 1.18438720703125, 1.317169189453125, 1.449951171875, 1.582733154296875, 1.71551513671875, 1.848297119140625, 1.9810791015625, 2.113861083984375, 2.24664306640625, 2.379425048828125, 2.51220703125, 2.644989013671875, 2.77777099609375, 2.910552978515625, 3.0433349609375, 3.176116943359375, 3.30889892578125, 3.441680908203125, 3.574462890625, 3.707244873046875, 3.84002685546875, 3.972808837890625, 4.1055908203125, 4.238372802734375, 4.37115478515625, 4.503936767578125, 4.63671875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 13.0, 25.0, 39.0, 59.0, 83.0, 111.0, 155.0, 250.0, 350.0, 467.0, 703.0, 1000.0, 1347.0, 2019.0, 2722.0, 3922.0, 5713.0, 8270.0, 12410.0, 19051.0, 28639.0, 44799.0, 73694.0, 137419.0, 310961.0, 165824.0, 83009.0, 50037.0, 31513.0, 20614.0, 13564.0, 9198.0, 6257.0, 4246.0, 2952.0, 2065.0, 1465.0, 1015.0, 786.0, 547.0, 379.0, 263.0, 202.0, 129.0, 100.0, 60.0, 32.0, 24.0, 15.0, 11.0, 12.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.87744140625, -0.8487777709960938, -0.8201141357421875, -0.7914505004882812, -0.762786865234375, -0.7341232299804688, -0.7054595947265625, -0.6767959594726562, -0.64813232421875, -0.6194686889648438, -0.5908050537109375, -0.5621414184570312, -0.533477783203125, -0.5048141479492188, -0.4761505126953125, -0.44748687744140625, -0.4188232421875, -0.39015960693359375, -0.3614959716796875, -0.33283233642578125, -0.304168701171875, -0.27550506591796875, -0.2468414306640625, -0.21817779541015625, -0.18951416015625, -0.16085052490234375, -0.1321868896484375, -0.10352325439453125, -0.074859619140625, -0.04619598388671875, -0.0175323486328125, 0.01113128662109375, 0.039794921875, 0.06845855712890625, 0.0971221923828125, 0.12578582763671875, 0.154449462890625, 0.18311309814453125, 0.2117767333984375, 0.24044036865234375, 0.26910400390625, 0.29776763916015625, 0.3264312744140625, 0.35509490966796875, 0.383758544921875, 0.41242218017578125, 0.4410858154296875, 0.46974945068359375, 0.4984130859375, 0.5270767211914062, 0.5557403564453125, 0.5844039916992188, 0.613067626953125, 0.6417312622070312, 0.6703948974609375, 0.6990585327148438, 0.72772216796875, 0.7563858032226562, 0.7850494384765625, 0.8137130737304688, 0.842376708984375, 0.8710403442382812, 0.8997039794921875, 0.9283676147460938, 0.95703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 3.0, 8.0, 10.0, 7.0, 9.0, 24.0, 17.0, 22.0, 26.0, 31.0, 28.0, 34.0, 30.0, 34.0, 40.0, 36.0, 39.0, 47.0, 1057.0, 42.0, 32.0, 34.0, 41.0, 44.0, 34.0, 32.0, 34.0, 27.0, 34.0, 19.0, 17.0, 17.0, 18.0, 12.0, 12.0, 22.0, 12.0, 9.0, 3.0, 1.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.998046875, -2.909332275390625, -2.82061767578125, -2.731903076171875, -2.6431884765625, -2.554473876953125, -2.46575927734375, -2.377044677734375, -2.288330078125, -2.199615478515625, -2.11090087890625, -2.022186279296875, -1.9334716796875, -1.844757080078125, -1.75604248046875, -1.667327880859375, -1.57861328125, -1.489898681640625, -1.40118408203125, -1.312469482421875, -1.2237548828125, -1.135040283203125, -1.04632568359375, -0.957611083984375, -0.868896484375, -0.780181884765625, -0.69146728515625, -0.602752685546875, -0.5140380859375, -0.425323486328125, -0.33660888671875, -0.247894287109375, -0.1591796875, -0.070465087890625, 0.01824951171875, 0.106964111328125, 0.1956787109375, 0.284393310546875, 0.37310791015625, 0.461822509765625, 0.550537109375, 0.639251708984375, 0.72796630859375, 0.816680908203125, 0.9053955078125, 0.994110107421875, 1.08282470703125, 1.171539306640625, 1.26025390625, 1.348968505859375, 1.43768310546875, 1.526397705078125, 1.6151123046875, 1.703826904296875, 1.79254150390625, 1.881256103515625, 1.969970703125, 2.058685302734375, 2.14739990234375, 2.236114501953125, 2.3248291015625, 2.413543701171875, 2.50225830078125, 2.590972900390625, 2.6796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 11.0, 5.0, 22.0, 17.0, 31.0, 51.0, 87.0, 100.0, 159.0, 243.0, 327.0, 578.0, 816.0, 1274.0, 1870.0, 2927.0, 4654.0, 7543.0, 12751.0, 21658.0, 37212.0, 66674.0, 126885.0, 1393476.0, 201651.0, 93263.0, 50274.0, 28609.0, 16714.0, 10304.0, 6235.0, 3988.0, 2446.0, 1475.0, 981.0, 581.0, 408.0, 290.0, 172.0, 109.0, 89.0, 44.0, 36.0, 28.0, 22.0, 12.0, 15.0, 5.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0693359375, -1.033416748046875, -0.99749755859375, -0.961578369140625, -0.9256591796875, -0.889739990234375, -0.85382080078125, -0.817901611328125, -0.781982421875, -0.746063232421875, -0.71014404296875, -0.674224853515625, -0.6383056640625, -0.602386474609375, -0.56646728515625, -0.530548095703125, -0.49462890625, -0.458709716796875, -0.42279052734375, -0.386871337890625, -0.3509521484375, -0.315032958984375, -0.27911376953125, -0.243194580078125, -0.207275390625, -0.171356201171875, -0.13543701171875, -0.099517822265625, -0.0635986328125, -0.027679443359375, 0.00823974609375, 0.044158935546875, 0.080078125, 0.115997314453125, 0.15191650390625, 0.187835693359375, 0.2237548828125, 0.259674072265625, 0.29559326171875, 0.331512451171875, 0.367431640625, 0.403350830078125, 0.43927001953125, 0.475189208984375, 0.5111083984375, 0.547027587890625, 0.58294677734375, 0.618865966796875, 0.65478515625, 0.690704345703125, 0.72662353515625, 0.762542724609375, 0.7984619140625, 0.834381103515625, 0.87030029296875, 0.906219482421875, 0.942138671875, 0.978057861328125, 1.01397705078125, 1.049896240234375, 1.0858154296875, 1.121734619140625, 1.15765380859375, 1.193572998046875, 1.2294921875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 10.0, 17.0, 16.0, 19.0, 19.0, 28.0, 31.0, 45.0, 58.0, 71.0, 62.0, 65.0, 69.0, 79.0, 63.0, 55.0, 36.0, 40.0, 28.0, 23.0, 21.0, 12.0, 19.0, 13.0, 18.0, 8.0, 7.0, 6.0, 1.0, 4.0, 5.0, 4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.0004944801330566406, -0.00047635287046432495, -0.0004582256078720093, -0.0004400983452796936, -0.00042197108268737793, -0.00040384382009506226, -0.0003857165575027466, -0.0003675892949104309, -0.00034946203231811523, -0.00033133476972579956, -0.0003132075071334839, -0.0002950802445411682, -0.00027695298194885254, -0.00025882571935653687, -0.0002406984567642212, -0.00022257119417190552, -0.00020444393157958984, -0.00018631666898727417, -0.0001681894063949585, -0.00015006214380264282, -0.00013193488121032715, -0.00011380761861801147, -9.56803560256958e-05, -7.755309343338013e-05, -5.942583084106445e-05, -4.129856824874878e-05, -2.3171305656433105e-05, -5.044043064117432e-06, 1.3083219528198242e-05, 3.1210482120513916e-05, 4.933774471282959e-05, 6.746500730514526e-05, 8.559226989746094e-05, 0.00010371953248977661, 0.00012184679508209229, 0.00013997405767440796, 0.00015810132026672363, 0.0001762285828590393, 0.00019435584545135498, 0.00021248310804367065, 0.00023061037063598633, 0.000248737633228302, 0.0002668648958206177, 0.00028499215841293335, 0.000303119421005249, 0.0003212466835975647, 0.00033937394618988037, 0.00035750120878219604, 0.0003756284713745117, 0.0003937557339668274, 0.00041188299655914307, 0.00043001025915145874, 0.0004481375217437744, 0.0004662647843360901, 0.00048439204692840576, 0.0005025193095207214, 0.0005206465721130371, 0.0005387738347053528, 0.0005569010972976685, 0.0005750283598899841, 0.0005931556224822998, 0.0006112828850746155, 0.0006294101476669312, 0.0006475374102592468, 0.0006656646728515625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 4.0, 9.0, 12.0, 17.0, 17.0, 23.0, 26.0, 36.0, 63.0, 78.0, 119.0, 221.0, 604.0, 6864.0, 1019553.0, 19406.0, 743.0, 287.0, 129.0, 88.0, 53.0, 54.0, 29.0, 28.0, 14.0, 12.0, 9.0, 7.0, 6.0, 5.0, 1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.01690673828125, -0.016456961631774902, -0.016007184982299805, -0.015557408332824707, -0.01510763168334961, -0.014657855033874512, -0.014208078384399414, -0.013758301734924316, -0.013308525085449219, -0.012858748435974121, -0.012408971786499023, -0.011959195137023926, -0.011509418487548828, -0.01105964183807373, -0.010609865188598633, -0.010160088539123535, -0.009710311889648438, -0.00926053524017334, -0.008810758590698242, -0.008360981941223145, -0.007911205291748047, -0.007461428642272949, -0.0070116519927978516, -0.006561875343322754, -0.006112098693847656, -0.005662322044372559, -0.005212545394897461, -0.004762768745422363, -0.004312992095947266, -0.003863215446472168, -0.0034134387969970703, -0.0029636621475219727, -0.002513885498046875, -0.0020641088485717773, -0.0016143321990966797, -0.001164555549621582, -0.0007147789001464844, -0.0002650022506713867, 0.00018477439880371094, 0.0006345510482788086, 0.0010843276977539062, 0.001534104347229004, 0.0019838809967041016, 0.0024336576461791992, 0.002883434295654297, 0.0033332109451293945, 0.003782987594604492, 0.00423276424407959, 0.0046825408935546875, 0.005132317543029785, 0.005582094192504883, 0.0060318708419799805, 0.006481647491455078, 0.006931424140930176, 0.0073812007904052734, 0.007830977439880371, 0.008280754089355469, 0.008730530738830566, 0.009180307388305664, 0.009630084037780762, 0.01007986068725586, 0.010529637336730957, 0.010979413986206055, 0.011429190635681152, 0.01187896728515625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 11.0, 55.0, 130.0, 179.0, 256.0, 196.0, 113.0, 48.0, 14.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020932972256559879, -0.0001813946000766009, -0.00015345949213951826, -0.0001255243842024356, -9.758926171343774e-05, -6.965415377635509e-05, -4.171903128735721e-05, -1.3783908798359334e-05, 1.4151199138723314e-05, 4.2086314351763576e-05, 7.002142956480384e-05, 9.79565447778441e-05, 0.00012589165999088436, 0.000153826767927967, 0.0001817618904169649, 0.00020969701290596277, 0.0002376321208430454, 0.0002655672433320433, 0.00029350235126912594, 0.0003214374592062086, 0.00034937256714329123, 0.00037730770418420434, 0.000405242812121287, 0.00043317792005836964, 0.00046111305709928274, 0.0004890481941401958, 0.000516983272973448, 0.0005449184100143611, 0.0005728534888476133, 0.0006007886258885264, 0.0006287237629294395, 0.0006566588999703526, 0.0006845939205959439, 0.000712529057636857, 0.0007404641364701092, 0.0007683992735110223, 0.0007963343523442745, 0.0008242694893851876, 0.0008522046264261007, 0.0008801397634670138, 0.000908074842300266, 0.0009360099793411791, 0.0009639450581744313, 0.0009918801952153444, 0.0010198153322562575, 0.0010477504692971706, 0.001075685489922762, 0.001103620626963675, 0.0011315557640045881, 0.0011594909010455012, 0.0011874260380864143, 0.0012153610587120056, 0.0012432961957529187, 0.0012712313327938318, 0.001299166469834745, 0.001327101606875658, 0.0013550366275012493, 0.0013829717645421624, 0.0014109069015830755, 0.0014388419222086668, 0.00146677705924958, 0.001494712196290493, 0.0015226473333314061, 0.0015505824703723192, 0.0015785176074132323]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 7.0, 7.0, 4.0, 8.0, 10.0, 12.0, 13.0, 15.0, 24.0, 24.0, 28.0, 29.0, 34.0, 33.0, 34.0, 29.0, 37.0, 40.0, 39.0, 42.0, 51.0, 45.0, 46.0, 41.0, 34.0, 36.0, 33.0, 35.0, 29.0, 26.0, 21.0, 26.0, 12.0, 14.0, 12.0, 19.0, 17.0, 8.0, 11.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002823472023010254, -0.00027278438210487366, -0.0002632215619087219, -0.0002536587417125702, -0.00024409592151641846, -0.00023453310132026672, -0.000224970281124115, -0.00021540746092796326, -0.00020584464073181152, -0.0001962818205356598, -0.00018671900033950806, -0.00017715618014335632, -0.0001675933599472046, -0.00015803053975105286, -0.00014846771955490112, -0.0001389048993587494, -0.00012934207916259766, -0.00011977925896644592, -0.00011021643877029419, -0.00010065361857414246, -9.109079837799072e-05, -8.152797818183899e-05, -7.196515798568726e-05, -6.240233778953552e-05, -5.283951759338379e-05, -4.3276697397232056e-05, -3.371387720108032e-05, -2.415105700492859e-05, -1.4588236808776855e-05, -5.025416612625122e-06, 4.537403583526611e-06, 1.4100223779678345e-05, 2.3663043975830078e-05, 3.322586417198181e-05, 4.2788684368133545e-05, 5.235150456428528e-05, 6.191432476043701e-05, 7.147714495658875e-05, 8.103996515274048e-05, 9.060278534889221e-05, 0.00010016560554504395, 0.00010972842574119568, 0.00011929124593734741, 0.00012885406613349915, 0.00013841688632965088, 0.0001479797065258026, 0.00015754252672195435, 0.00016710534691810608, 0.0001766681671142578, 0.00018623098731040955, 0.00019579380750656128, 0.000205356627702713, 0.00021491944789886475, 0.00022448226809501648, 0.0002340450882911682, 0.00024360790848731995, 0.0002531707286834717, 0.0002627335488796234, 0.00027229636907577515, 0.0002818591892719269, 0.0002914220094680786, 0.00030098482966423035, 0.0003105476498603821, 0.0003201104700565338, 0.00032967329025268555]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 9.0, 5.0, 5.0, 9.0, 10.0, 4.0, 12.0, 11.0, 14.0, 11.0, 8.0, 17.0, 39.0, 41.0, 26.0, 22.0, 29.0, 25.0, 41.0, 34.0, 34.0, 47.0, 35.0, 36.0, 43.0, 46.0, 44.0, 35.0, 34.0, 30.0, 40.0, 24.0, 38.0, 18.0, 18.0, 13.0, 17.0, 9.0, 12.0, 11.0, 8.0, 11.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.728546142578125, -3.59576416015625, -3.462982177734375, -3.3302001953125, -3.197418212890625, -3.06463623046875, -2.931854248046875, -2.799072265625, -2.666290283203125, -2.53350830078125, -2.400726318359375, -2.2679443359375, -2.135162353515625, -2.00238037109375, -1.869598388671875, -1.73681640625, -1.604034423828125, -1.47125244140625, -1.338470458984375, -1.2056884765625, -1.072906494140625, -0.94012451171875, -0.807342529296875, -0.674560546875, -0.541778564453125, -0.40899658203125, -0.276214599609375, -0.1434326171875, -0.010650634765625, 0.12213134765625, 0.254913330078125, 0.3876953125, 0.520477294921875, 0.65325927734375, 0.786041259765625, 0.9188232421875, 1.051605224609375, 1.18438720703125, 1.317169189453125, 1.449951171875, 1.582733154296875, 1.71551513671875, 1.848297119140625, 1.9810791015625, 2.113861083984375, 2.24664306640625, 2.379425048828125, 2.51220703125, 2.644989013671875, 2.77777099609375, 2.910552978515625, 3.0433349609375, 3.176116943359375, 3.30889892578125, 3.441680908203125, 3.574462890625, 3.707244873046875, 3.84002685546875, 3.972808837890625, 4.1055908203125, 4.238372802734375, 4.37115478515625, 4.503936767578125, 4.63671875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 13.0, 13.0, 11.0, 32.0, 29.0, 42.0, 51.0, 84.0, 89.0, 142.0, 257.0, 426.0, 852.0, 1909.0, 4649.0, 12598.0, 37491.0, 111973.0, 343340.0, 357805.0, 116041.0, 38558.0, 13209.0, 4871.0, 1981.0, 865.0, 435.0, 270.0, 158.0, 91.0, 73.0, 47.0, 46.0, 24.0, 26.0, 15.0, 12.0, 5.0, 11.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.25274658203125, -4.0953369140625, -3.93792724609375, -3.780517578125, -3.62310791015625, -3.4656982421875, -3.30828857421875, -3.15087890625, -2.99346923828125, -2.8360595703125, -2.67864990234375, -2.521240234375, -2.36383056640625, -2.2064208984375, -2.04901123046875, -1.8916015625, -1.73419189453125, -1.5767822265625, -1.41937255859375, -1.261962890625, -1.10455322265625, -0.9471435546875, -0.78973388671875, -0.63232421875, -0.47491455078125, -0.3175048828125, -0.16009521484375, -0.002685546875, 0.15472412109375, 0.3121337890625, 0.46954345703125, 0.626953125, 0.78436279296875, 0.9417724609375, 1.09918212890625, 1.256591796875, 1.41400146484375, 1.5714111328125, 1.72882080078125, 1.88623046875, 2.04364013671875, 2.2010498046875, 2.35845947265625, 2.515869140625, 2.67327880859375, 2.8306884765625, 2.98809814453125, 3.1455078125, 3.30291748046875, 3.4603271484375, 3.61773681640625, 3.775146484375, 3.93255615234375, 4.0899658203125, 4.24737548828125, 4.40478515625, 4.56219482421875, 4.7196044921875, 4.87701416015625, 5.034423828125, 5.19183349609375, 5.3492431640625, 5.50665283203125, 5.6640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 3.0, 8.0, 8.0, 7.0, 16.0, 18.0, 23.0, 22.0, 26.0, 25.0, 41.0, 39.0, 39.0, 49.0, 55.0, 84.0, 203.0, 1519.0, 299.0, 113.0, 64.0, 40.0, 44.0, 42.0, 42.0, 29.0, 27.0, 35.0, 24.0, 22.0, 12.0, 18.0, 11.0, 9.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.522705078125, -14.98291015625, -14.443115234375, -13.9033203125, -13.363525390625, -12.82373046875, -12.283935546875, -11.744140625, -11.204345703125, -10.66455078125, -10.124755859375, -9.5849609375, -9.045166015625, -8.50537109375, -7.965576171875, -7.42578125, -6.885986328125, -6.34619140625, -5.806396484375, -5.2666015625, -4.726806640625, -4.18701171875, -3.647216796875, -3.107421875, -2.567626953125, -2.02783203125, -1.488037109375, -0.9482421875, -0.408447265625, 0.13134765625, 0.671142578125, 1.2109375, 1.750732421875, 2.29052734375, 2.830322265625, 3.3701171875, 3.909912109375, 4.44970703125, 4.989501953125, 5.529296875, 6.069091796875, 6.60888671875, 7.148681640625, 7.6884765625, 8.228271484375, 8.76806640625, 9.307861328125, 9.84765625, 10.387451171875, 10.92724609375, 11.467041015625, 12.0068359375, 12.546630859375, 13.08642578125, 13.626220703125, 14.166015625, 14.705810546875, 15.24560546875, 15.785400390625, 16.3251953125, 16.864990234375, 17.40478515625, 17.944580078125, 18.484375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 21.0, 17.0, 18.0, 27.0, 46.0, 64.0, 105.0, 176.0, 315.0, 888.0, 9105.0, 3129714.0, 3889.0, 626.0, 276.0, 133.0, 93.0, 52.0, 34.0, 28.0, 20.0, 15.0, 8.0, 13.0, 8.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.875, -105.1357421875, -102.396484375, -99.6572265625, -96.91796875, -94.1787109375, -91.439453125, -88.7001953125, -85.9609375, -83.2216796875, -80.482421875, -77.7431640625, -75.00390625, -72.2646484375, -69.525390625, -66.7861328125, -64.046875, -61.3076171875, -58.568359375, -55.8291015625, -53.08984375, -50.3505859375, -47.611328125, -44.8720703125, -42.1328125, -39.3935546875, -36.654296875, -33.9150390625, -31.17578125, -28.4365234375, -25.697265625, -22.9580078125, -20.21875, -17.4794921875, -14.740234375, -12.0009765625, -9.26171875, -6.5224609375, -3.783203125, -1.0439453125, 1.6953125, 4.4345703125, 7.173828125, 9.9130859375, 12.65234375, 15.3916015625, 18.130859375, 20.8701171875, 23.609375, 26.3486328125, 29.087890625, 31.8271484375, 34.56640625, 37.3056640625, 40.044921875, 42.7841796875, 45.5234375, 48.2626953125, 51.001953125, 53.7412109375, 56.48046875, 59.2197265625, 61.958984375, 64.6982421875, 67.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 12.0, 42.0, 97.0, 232.0, 274.0, 225.0, 94.0, 25.0, 8.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.21437072753906, -65.99598693847656, -64.77759552001953, -63.559207916259766, -62.3408203125, -61.1224365234375, -59.90404510498047, -58.68566131591797, -57.4672737121582, -56.24888610839844, -55.03049850463867, -53.812110900878906, -52.59372329711914, -51.375335693359375, -50.156951904296875, -48.93856430053711, -47.720176696777344, -46.50178909301758, -45.28340148925781, -44.06501388549805, -42.84662628173828, -41.62824249267578, -40.40985107421875, -39.19146728515625, -37.97307586669922, -36.75468826293945, -35.53630065917969, -34.31791305541992, -33.099525451660156, -31.881139755249023, -30.662752151489258, -29.444366455078125, -28.225975036621094, -27.007587432861328, -25.789199829101562, -24.570812225341797, -23.352426528930664, -22.1340389251709, -20.915651321411133, -19.697265625, -18.478878021240234, -17.26049041748047, -16.042102813720703, -14.823716163635254, -13.605329513549805, -12.386941909790039, -11.168554306030273, -9.950167655944824, -8.731780052185059, -7.513392925262451, -6.295005798339844, -5.076618194580078, -3.8582310676574707, -2.6398439407348633, -1.4214563369750977, -0.20306968688964844, 1.0153179168701172, 2.2337050437927246, 3.452092409133911, 4.670479774475098, 5.888866901397705, 7.1072540283203125, 8.325641632080078, 9.544028282165527, 10.762415885925293]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 11.0, 11.0, 13.0, 6.0, 16.0, 18.0, 22.0, 15.0, 21.0, 17.0, 30.0, 37.0, 28.0, 39.0, 38.0, 27.0, 33.0, 34.0, 38.0, 34.0, 40.0, 44.0, 31.0, 35.0, 33.0, 31.0, 31.0, 32.0, 30.0, 19.0, 27.0, 25.0, 19.0, 22.0, 14.0, 15.0, 14.0, 11.0, 6.0, 7.0, 2.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-37.522613525390625, -36.37358474731445, -35.22455596923828, -34.075531005859375, -32.9265022277832, -31.77747344970703, -30.628446578979492, -29.479419708251953, -28.33039093017578, -27.18136215209961, -26.03233528137207, -24.88330841064453, -23.73427963256836, -22.585250854492188, -21.43622398376465, -20.28719711303711, -19.138168334960938, -17.989139556884766, -16.840112686157227, -15.691084861755371, -14.542057037353516, -13.39302921295166, -12.244001388549805, -11.09497356414795, -9.945945739746094, -8.796917915344238, -7.647890090942383, -6.498862266540527, -5.349834442138672, -4.200806617736816, -3.051778793334961, -1.9027509689331055, -0.75372314453125, 0.39530467987060547, 1.544332504272461, 2.6933603286743164, 3.842388153076172, 4.991415977478027, 6.140443801879883, 7.289471626281738, 8.438499450683594, 9.58752727508545, 10.736555099487305, 11.88558292388916, 13.034610748291016, 14.183638572692871, 15.332666397094727, 16.481693267822266, 17.630722045898438, 18.77975082397461, 19.92877769470215, 21.077804565429688, 22.22683334350586, 23.37586212158203, 24.52488899230957, 25.67391586303711, 26.82294464111328, 27.971973419189453, 29.121000289916992, 30.27002716064453, 31.419055938720703, 32.568084716796875, 33.71710968017578, 34.86613845825195, 36.015167236328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 2.0, 8.0, 6.0, 8.0, 10.0, 12.0, 15.0, 6.0, 18.0, 17.0, 16.0, 24.0, 26.0, 30.0, 33.0, 29.0, 26.0, 40.0, 49.0, 40.0, 35.0, 38.0, 35.0, 40.0, 40.0, 35.0, 47.0, 29.0, 33.0, 34.0, 40.0, 21.0, 17.0, 17.0, 22.0, 16.0, 18.0, 9.0, 4.0, 7.0, 9.0, 9.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.1077880859375, -3.965576171875, -3.8233642578125, -3.68115234375, -3.5389404296875, -3.396728515625, -3.2545166015625, -3.1123046875, -2.9700927734375, -2.827880859375, -2.6856689453125, -2.54345703125, -2.4012451171875, -2.259033203125, -2.1168212890625, -1.974609375, -1.8323974609375, -1.690185546875, -1.5479736328125, -1.40576171875, -1.2635498046875, -1.121337890625, -0.9791259765625, -0.8369140625, -0.6947021484375, -0.552490234375, -0.4102783203125, -0.26806640625, -0.1258544921875, 0.016357421875, 0.1585693359375, 0.30078125, 0.4429931640625, 0.585205078125, 0.7274169921875, 0.86962890625, 1.0118408203125, 1.154052734375, 1.2962646484375, 1.4384765625, 1.5806884765625, 1.722900390625, 1.8651123046875, 2.00732421875, 2.1495361328125, 2.291748046875, 2.4339599609375, 2.576171875, 2.7183837890625, 2.860595703125, 3.0028076171875, 3.14501953125, 3.2872314453125, 3.429443359375, 3.5716552734375, 3.7138671875, 3.8560791015625, 3.998291015625, 4.1405029296875, 4.28271484375, 4.4249267578125, 4.567138671875, 4.7093505859375, 4.8515625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 6.0, 12.0, 7.0, 12.0, 11.0, 10.0, 21.0, 19.0, 22.0, 33.0, 38.0, 38.0, 30.0, 48.0, 65.0, 91.0, 123.0, 180.0, 339.0, 646.0, 2158.0, 16028.0, 250781.0, 2046555.0, 1691085.0, 170778.0, 11605.0, 1862.0, 605.0, 299.0, 185.0, 115.0, 77.0, 71.0, 57.0, 48.0, 31.0, 32.0, 25.0, 22.0, 24.0, 16.0, 11.0, 12.0, 10.0, 9.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.4921875, -10.16357421875, -9.8349609375, -9.50634765625, -9.177734375, -8.84912109375, -8.5205078125, -8.19189453125, -7.86328125, -7.53466796875, -7.2060546875, -6.87744140625, -6.548828125, -6.22021484375, -5.8916015625, -5.56298828125, -5.234375, -4.90576171875, -4.5771484375, -4.24853515625, -3.919921875, -3.59130859375, -3.2626953125, -2.93408203125, -2.60546875, -2.27685546875, -1.9482421875, -1.61962890625, -1.291015625, -0.96240234375, -0.6337890625, -0.30517578125, 0.0234375, 0.35205078125, 0.6806640625, 1.00927734375, 1.337890625, 1.66650390625, 1.9951171875, 2.32373046875, 2.65234375, 2.98095703125, 3.3095703125, 3.63818359375, 3.966796875, 4.29541015625, 4.6240234375, 4.95263671875, 5.28125, 5.60986328125, 5.9384765625, 6.26708984375, 6.595703125, 6.92431640625, 7.2529296875, 7.58154296875, 7.91015625, 8.23876953125, 8.5673828125, 8.89599609375, 9.224609375, 9.55322265625, 9.8818359375, 10.21044921875, 10.5390625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 16.0, 20.0, 28.0, 29.0, 31.0, 53.0, 48.0, 74.0, 81.0, 122.0, 161.0, 202.0, 273.0, 339.0, 391.0, 398.0, 389.0, 301.0, 254.0, 203.0, 170.0, 118.0, 74.0, 52.0, 51.0, 29.0, 39.0, 21.0, 23.0, 15.0, 17.0, 6.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0234375, -8.76068115234375, -8.4979248046875, -8.23516845703125, -7.972412109375, -7.70965576171875, -7.4468994140625, -7.18414306640625, -6.92138671875, -6.65863037109375, -6.3958740234375, -6.13311767578125, -5.870361328125, -5.60760498046875, -5.3448486328125, -5.08209228515625, -4.8193359375, -4.55657958984375, -4.2938232421875, -4.03106689453125, -3.768310546875, -3.50555419921875, -3.2427978515625, -2.98004150390625, -2.71728515625, -2.45452880859375, -2.1917724609375, -1.92901611328125, -1.666259765625, -1.40350341796875, -1.1407470703125, -0.87799072265625, -0.615234375, -0.35247802734375, -0.0897216796875, 0.17303466796875, 0.435791015625, 0.69854736328125, 0.9613037109375, 1.22406005859375, 1.48681640625, 1.74957275390625, 2.0123291015625, 2.27508544921875, 2.537841796875, 2.80059814453125, 3.0633544921875, 3.32611083984375, 3.5888671875, 3.85162353515625, 4.1143798828125, 4.37713623046875, 4.639892578125, 4.90264892578125, 5.1654052734375, 5.42816162109375, 5.69091796875, 5.95367431640625, 6.2164306640625, 6.47918701171875, 6.741943359375, 7.00469970703125, 7.2674560546875, 7.53021240234375, 7.79296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 8.0, 17.0, 21.0, 28.0, 31.0, 40.0, 52.0, 64.0, 87.0, 122.0, 182.0, 219.0, 304.0, 422.0, 1140.0, 69319.0, 4082015.0, 37622.0, 1007.0, 405.0, 302.0, 210.0, 164.0, 102.0, 86.0, 70.0, 55.0, 53.0, 30.0, 18.0, 25.0, 13.0, 5.0, 12.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.15625, -36.86083984375, -35.5654296875, -34.27001953125, -32.974609375, -31.67919921875, -30.3837890625, -29.08837890625, -27.79296875, -26.49755859375, -25.2021484375, -23.90673828125, -22.611328125, -21.31591796875, -20.0205078125, -18.72509765625, -17.4296875, -16.13427734375, -14.8388671875, -13.54345703125, -12.248046875, -10.95263671875, -9.6572265625, -8.36181640625, -7.06640625, -5.77099609375, -4.4755859375, -3.18017578125, -1.884765625, -0.58935546875, 0.7060546875, 2.00146484375, 3.296875, 4.59228515625, 5.8876953125, 7.18310546875, 8.478515625, 9.77392578125, 11.0693359375, 12.36474609375, 13.66015625, 14.95556640625, 16.2509765625, 17.54638671875, 18.841796875, 20.13720703125, 21.4326171875, 22.72802734375, 24.0234375, 25.31884765625, 26.6142578125, 27.90966796875, 29.205078125, 30.50048828125, 31.7958984375, 33.09130859375, 34.38671875, 35.68212890625, 36.9775390625, 38.27294921875, 39.568359375, 40.86376953125, 42.1591796875, 43.45458984375, 44.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 24.0, 336.0, 531.0, 118.0, 7.0, 1.0, 1.0], "bins": [-378.9446716308594, -372.55291748046875, -366.1611328125, -359.7693786621094, -353.3775939941406, -346.98583984375, -340.59405517578125, -334.2023010253906, -327.8105163574219, -321.41876220703125, -315.0269775390625, -308.6352233886719, -302.2434387207031, -295.8516845703125, -289.45989990234375, -283.0681457519531, -276.6763916015625, -270.2846374511719, -263.8928527832031, -257.5010986328125, -251.10931396484375, -244.71755981445312, -238.32577514648438, -231.93402099609375, -225.542236328125, -219.1504669189453, -212.75869750976562, -206.36692810058594, -199.97515869140625, -193.58340454101562, -187.19161987304688, -180.79986572265625, -174.40809631347656, -168.01632690429688, -161.6245574951172, -155.2327880859375, -148.8410186767578, -142.44924926757812, -136.0574951171875, -129.6657257080078, -123.27395629882812, -116.88218688964844, -110.49041748046875, -104.09864807128906, -97.7068862915039, -91.31511688232422, -84.92334747314453, -78.53158569335938, -72.13980865478516, -65.74803924560547, -59.35627365112305, -52.96450424194336, -46.57273864746094, -40.18096923828125, -33.78919982910156, -27.39743423461914, -21.005666732788086, -14.613899230957031, -8.22213077545166, -1.830362319946289, 4.561405181884766, 10.95317268371582, 17.344942092895508, 23.73670768737793, 30.128477096557617]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 1.0, 6.0, 2.0, 12.0, 4.0, 15.0, 21.0, 19.0, 17.0, 16.0, 24.0, 24.0, 32.0, 35.0, 30.0, 33.0, 31.0, 47.0, 44.0, 42.0, 39.0, 32.0, 41.0, 36.0, 36.0, 34.0, 39.0, 21.0, 30.0, 25.0, 24.0, 26.0, 22.0, 29.0, 16.0, 15.0, 17.0, 14.0, 10.0, 4.0, 7.0, 3.0, 5.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.848724365234375, -25.951616287231445, -25.054508209228516, -24.157400131225586, -23.260292053222656, -22.363182067871094, -21.466073989868164, -20.568965911865234, -19.671857833862305, -18.774749755859375, -17.877641677856445, -16.980533599853516, -16.083423614501953, -15.18631649017334, -14.289207458496094, -13.392099380493164, -12.494991302490234, -11.597883224487305, -10.700775146484375, -9.803666114807129, -8.9065580368042, -8.00944995880127, -7.112341403961182, -6.215232849121094, -5.318124771118164, -4.421016693115234, -3.5239081382751465, -2.6267998218536377, -1.729691505432129, -0.8325834274291992, 0.06452512741088867, 0.9616336822509766, 1.8587398529052734, 2.7558481693267822, 3.652956485748291, 4.550065040588379, 5.447173118591309, 6.344281196594238, 7.241389751434326, 8.138498306274414, 9.035606384277344, 9.932714462280273, 10.829822540283203, 11.72693157196045, 12.624039649963379, 13.521147727966309, 14.418256759643555, 15.315364837646484, 16.212472915649414, 17.109580993652344, 18.006689071655273, 18.903797149658203, 19.800907135009766, 20.698013305664062, 21.595123291015625, 22.492231369018555, 23.389339447021484, 24.286447525024414, 25.183555603027344, 26.080663681030273, 26.977771759033203, 27.874881744384766, 28.771989822387695, 29.669097900390625, 30.566205978393555]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 0.0, 8.0, 4.0, 5.0, 9.0, 7.0, 6.0, 21.0, 16.0, 17.0, 14.0, 29.0, 32.0, 13.0, 34.0, 31.0, 26.0, 35.0, 40.0, 38.0, 38.0, 46.0, 36.0, 43.0, 34.0, 42.0, 39.0, 41.0, 29.0, 31.0, 21.0, 27.0, 26.0, 15.0, 22.0, 18.0, 13.0, 24.0, 11.0, 12.0, 8.0, 4.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.13812255859375, -4.0028076171875, -3.86749267578125, -3.732177734375, -3.59686279296875, -3.4615478515625, -3.32623291015625, -3.19091796875, -3.05560302734375, -2.9202880859375, -2.78497314453125, -2.649658203125, -2.51434326171875, -2.3790283203125, -2.24371337890625, -2.1083984375, -1.97308349609375, -1.8377685546875, -1.70245361328125, -1.567138671875, -1.43182373046875, -1.2965087890625, -1.16119384765625, -1.02587890625, -0.89056396484375, -0.7552490234375, -0.61993408203125, -0.484619140625, -0.34930419921875, -0.2139892578125, -0.07867431640625, 0.056640625, 0.19195556640625, 0.3272705078125, 0.46258544921875, 0.597900390625, 0.73321533203125, 0.8685302734375, 1.00384521484375, 1.13916015625, 1.27447509765625, 1.4097900390625, 1.54510498046875, 1.680419921875, 1.81573486328125, 1.9510498046875, 2.08636474609375, 2.2216796875, 2.35699462890625, 2.4923095703125, 2.62762451171875, 2.762939453125, 2.89825439453125, 3.0335693359375, 3.16888427734375, 3.30419921875, 3.43951416015625, 3.5748291015625, 3.71014404296875, 3.845458984375, 3.98077392578125, 4.1160888671875, 4.25140380859375, 4.38671875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 19.0, 11.0, 12.0, 23.0, 47.0, 59.0, 100.0, 140.0, 219.0, 344.0, 516.0, 785.0, 993.0, 1494.0, 2012.0, 3019.0, 4289.0, 6326.0, 9165.0, 13504.0, 20023.0, 29779.0, 45681.0, 72373.0, 127180.0, 301559.0, 163407.0, 86381.0, 53174.0, 34220.0, 22848.0, 15329.0, 10178.0, 7284.0, 4927.0, 3419.0, 2320.0, 1674.0, 1203.0, 840.0, 593.0, 365.0, 242.0, 187.0, 93.0, 66.0, 49.0, 33.0, 16.0, 12.0, 13.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9111328125, -0.8823623657226562, -0.8535919189453125, -0.8248214721679688, -0.796051025390625, -0.7672805786132812, -0.7385101318359375, -0.7097396850585938, -0.68096923828125, -0.6521987915039062, -0.6234283447265625, -0.5946578979492188, -0.565887451171875, -0.5371170043945312, -0.5083465576171875, -0.47957611083984375, -0.4508056640625, -0.42203521728515625, -0.3932647705078125, -0.36449432373046875, -0.335723876953125, -0.30695343017578125, -0.2781829833984375, -0.24941253662109375, -0.22064208984375, -0.19187164306640625, -0.1631011962890625, -0.13433074951171875, -0.105560302734375, -0.07678985595703125, -0.0480194091796875, -0.01924896240234375, 0.009521484375, 0.03829193115234375, 0.0670623779296875, 0.09583282470703125, 0.124603271484375, 0.15337371826171875, 0.1821441650390625, 0.21091461181640625, 0.23968505859375, 0.26845550537109375, 0.2972259521484375, 0.32599639892578125, 0.354766845703125, 0.38353729248046875, 0.4123077392578125, 0.44107818603515625, 0.4698486328125, 0.49861907958984375, 0.5273895263671875, 0.5561599731445312, 0.584930419921875, 0.6137008666992188, 0.6424713134765625, 0.6712417602539062, 0.70001220703125, 0.7287826538085938, 0.7575531005859375, 0.7863235473632812, 0.815093994140625, 0.8438644409179688, 0.8726348876953125, 0.9014053344726562, 0.93017578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 10.0, 8.0, 10.0, 18.0, 24.0, 20.0, 27.0, 30.0, 27.0, 29.0, 25.0, 40.0, 42.0, 35.0, 36.0, 38.0, 32.0, 1066.0, 37.0, 48.0, 37.0, 32.0, 35.0, 36.0, 46.0, 30.0, 31.0, 35.0, 19.0, 24.0, 14.0, 14.0, 12.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.9296875, -2.8397216796875, -2.749755859375, -2.6597900390625, -2.56982421875, -2.4798583984375, -2.389892578125, -2.2999267578125, -2.2099609375, -2.1199951171875, -2.030029296875, -1.9400634765625, -1.85009765625, -1.7601318359375, -1.670166015625, -1.5802001953125, -1.490234375, -1.4002685546875, -1.310302734375, -1.2203369140625, -1.13037109375, -1.0404052734375, -0.950439453125, -0.8604736328125, -0.7705078125, -0.6805419921875, -0.590576171875, -0.5006103515625, -0.41064453125, -0.3206787109375, -0.230712890625, -0.1407470703125, -0.05078125, 0.0391845703125, 0.129150390625, 0.2191162109375, 0.30908203125, 0.3990478515625, 0.489013671875, 0.5789794921875, 0.6689453125, 0.7589111328125, 0.848876953125, 0.9388427734375, 1.02880859375, 1.1187744140625, 1.208740234375, 1.2987060546875, 1.388671875, 1.4786376953125, 1.568603515625, 1.6585693359375, 1.74853515625, 1.8385009765625, 1.928466796875, 2.0184326171875, 2.1083984375, 2.1983642578125, 2.288330078125, 2.3782958984375, 2.46826171875, 2.5582275390625, 2.648193359375, 2.7381591796875, 2.828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 11.0, 22.0, 22.0, 34.0, 59.0, 70.0, 104.0, 165.0, 232.0, 377.0, 457.0, 819.0, 1242.0, 1934.0, 3176.0, 5300.0, 8866.0, 15227.0, 26460.0, 46965.0, 86744.0, 178607.0, 1411779.0, 140190.0, 73051.0, 40221.0, 22204.0, 12837.0, 7478.0, 4599.0, 2800.0, 1797.0, 1148.0, 722.0, 465.0, 326.0, 219.0, 125.0, 83.0, 60.0, 36.0, 21.0, 21.0, 15.0, 12.0, 10.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1435546875, -1.107086181640625, -1.07061767578125, -1.034149169921875, -0.9976806640625, -0.961212158203125, -0.92474365234375, -0.888275146484375, -0.851806640625, -0.815338134765625, -0.77886962890625, -0.742401123046875, -0.7059326171875, -0.669464111328125, -0.63299560546875, -0.596527099609375, -0.56005859375, -0.523590087890625, -0.48712158203125, -0.450653076171875, -0.4141845703125, -0.377716064453125, -0.34124755859375, -0.304779052734375, -0.268310546875, -0.231842041015625, -0.19537353515625, -0.158905029296875, -0.1224365234375, -0.085968017578125, -0.04949951171875, -0.013031005859375, 0.0234375, 0.059906005859375, 0.09637451171875, 0.132843017578125, 0.1693115234375, 0.205780029296875, 0.24224853515625, 0.278717041015625, 0.315185546875, 0.351654052734375, 0.38812255859375, 0.424591064453125, 0.4610595703125, 0.497528076171875, 0.53399658203125, 0.570465087890625, 0.60693359375, 0.643402099609375, 0.67987060546875, 0.716339111328125, 0.7528076171875, 0.789276123046875, 0.82574462890625, 0.862213134765625, 0.898681640625, 0.935150146484375, 0.97161865234375, 1.008087158203125, 1.0445556640625, 1.081024169921875, 1.11749267578125, 1.153961181640625, 1.1904296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 7.0, 5.0, 9.0, 11.0, 7.0, 12.0, 15.0, 23.0, 24.0, 22.0, 37.0, 38.0, 35.0, 58.0, 67.0, 58.0, 55.0, 50.0, 50.0, 53.0, 47.0, 44.0, 39.0, 37.0, 19.0, 19.0, 19.0, 18.0, 13.0, 11.0, 13.0, 11.0, 10.0, 6.0, 8.0, 7.0, 6.0, 0.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005254745483398438, -0.0005093887448310852, -0.0004933029413223267, -0.0004772171378135681, -0.00046113133430480957, -0.000445045530796051, -0.0004289597272872925, -0.00041287392377853394, -0.0003967881202697754, -0.00038070231676101685, -0.0003646165132522583, -0.00034853070974349976, -0.0003324449062347412, -0.00031635910272598267, -0.0003002732992172241, -0.0002841874957084656, -0.00026810169219970703, -0.0002520158886909485, -0.00023593008518218994, -0.0002198442816734314, -0.00020375847816467285, -0.0001876726746559143, -0.00017158687114715576, -0.00015550106763839722, -0.00013941526412963867, -0.00012332946062088013, -0.00010724365711212158, -9.115785360336304e-05, -7.507205009460449e-05, -5.898624658584595e-05, -4.29004430770874e-05, -2.6814639568328857e-05, -1.0728836059570312e-05, 5.356967449188232e-06, 2.1442770957946777e-05, 3.752857446670532e-05, 5.361437797546387e-05, 6.970018148422241e-05, 8.578598499298096e-05, 0.0001018717885017395, 0.00011795759201049805, 0.0001340433955192566, 0.00015012919902801514, 0.00016621500253677368, 0.00018230080604553223, 0.00019838660955429077, 0.00021447241306304932, 0.00023055821657180786, 0.0002466440200805664, 0.00026272982358932495, 0.0002788156270980835, 0.00029490143060684204, 0.0003109872341156006, 0.00032707303762435913, 0.0003431588411331177, 0.0003592446446418762, 0.00037533044815063477, 0.0003914162516593933, 0.00040750205516815186, 0.0004235878586769104, 0.00043967366218566895, 0.0004557594656944275, 0.00047184526920318604, 0.0004879310727119446, 0.0005040168762207031]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 3.0, 7.0, 6.0, 8.0, 9.0, 6.0, 12.0, 20.0, 22.0, 24.0, 23.0, 36.0, 51.0, 58.0, 67.0, 121.0, 180.0, 432.0, 1523.0, 582451.0, 461018.0, 1471.0, 405.0, 176.0, 116.0, 57.0, 53.0, 38.0, 31.0, 25.0, 18.0, 18.0, 12.0, 8.0, 9.0, 6.0, 7.0, 6.0, 4.0, 0.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01116943359375, -0.010770320892333984, -0.010371208190917969, -0.009972095489501953, -0.009572982788085938, -0.009173870086669922, -0.008774757385253906, -0.00837564468383789, -0.007976531982421875, -0.007577419281005859, -0.007178306579589844, -0.006779193878173828, -0.0063800811767578125, -0.005980968475341797, -0.005581855773925781, -0.005182743072509766, -0.00478363037109375, -0.004384517669677734, -0.003985404968261719, -0.003586292266845703, -0.0031871795654296875, -0.002788066864013672, -0.0023889541625976562, -0.0019898414611816406, -0.001590728759765625, -0.0011916160583496094, -0.0007925033569335938, -0.0003933906555175781, 5.7220458984375e-06, 0.0004048347473144531, 0.0008039474487304688, 0.0012030601501464844, 0.0016021728515625, 0.0020012855529785156, 0.0024003982543945312, 0.002799510955810547, 0.0031986236572265625, 0.003597736358642578, 0.003996849060058594, 0.004395961761474609, 0.004795074462890625, 0.005194187164306641, 0.005593299865722656, 0.005992412567138672, 0.0063915252685546875, 0.006790637969970703, 0.007189750671386719, 0.007588863372802734, 0.00798797607421875, 0.008387088775634766, 0.008786201477050781, 0.009185314178466797, 0.009584426879882812, 0.009983539581298828, 0.010382652282714844, 0.01078176498413086, 0.011180877685546875, 0.01157999038696289, 0.011979103088378906, 0.012378215789794922, 0.012777328491210938, 0.013176441192626953, 0.013575553894042969, 0.013974666595458984, 0.014373779296875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 12.0, 26.0, 161.0, 399.0, 314.0, 89.0, 16.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0024153057020157576, -0.0023727656807750463, -0.002330225659534335, -0.002287685638293624, -0.0022451456170529127, -0.002202605362981558, -0.0021600653417408466, -0.0021175253205001354, -0.002074985299259424, -0.002032445278018713, -0.001989905256778002, -0.0019473651191219687, -0.0019048250978812575, -0.0018622850766405463, -0.0018197450553998351, -0.001777204917743802, -0.0017346648965030909, -0.0016921248752623796, -0.0016495848540216684, -0.0016070447163656354, -0.0015645046951249242, -0.001521964673884213, -0.0014794246526435018, -0.0014368845149874687, -0.0013943446101620793, -0.0013518045889213681, -0.001309264567680657, -0.0012667244300246239, -0.0012241844087839127, -0.0011816443875432014, -0.0011391043663024902, -0.001096564345061779, -0.001054024207405746, -0.0010114841861650348, -0.0009689441067166626, -0.0009264040854759514, -0.0008838640060275793, -0.0008413239847868681, -0.0007987839635461569, -0.0007562438840977848, -0.0007137038046494126, -0.0006711637834087014, -0.0006286237039603293, -0.0005860836827196181, -0.000543543603271246, -0.0005010035820305347, -0.0004584635316859931, -0.0004159234813414514, -0.0003733834601007402, -0.0003308434097561985, -0.00028830335941165686, -0.00024576333817094564, -0.00020322327327448875, -0.00016068322292994708, -0.00011814318713732064, -7.560313679277897e-05, -3.30630864482373e-05, 9.476960258325562e-06, 5.2017006964888424e-05, 9.455705003347248e-05, 0.00013709710037801415, 0.00017963715072255582, 0.00022217718651518226, 0.0002647172368597239, 0.0003072572872042656]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 8.0, 4.0, 9.0, 5.0, 7.0, 13.0, 15.0, 13.0, 16.0, 18.0, 28.0, 36.0, 44.0, 45.0, 41.0, 50.0, 48.0, 43.0, 43.0, 41.0, 46.0, 49.0, 49.0, 48.0, 40.0, 27.0, 35.0, 30.0, 24.0, 32.0, 18.0, 16.0, 17.0, 15.0, 9.0, 11.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036776065826416016, -0.0003566090017557144, -0.0003454573452472687, -0.00033430568873882294, -0.0003231540322303772, -0.00031200237572193146, -0.0003008507192134857, -0.00028969906270504, -0.00027854740619659424, -0.0002673957496881485, -0.00025624409317970276, -0.000245092436671257, -0.00023394078016281128, -0.00022278912365436554, -0.0002116374671459198, -0.00020048581063747406, -0.00018933415412902832, -0.00017818249762058258, -0.00016703084111213684, -0.0001558791846036911, -0.00014472752809524536, -0.00013357587158679962, -0.00012242421507835388, -0.00011127255856990814, -0.0001001209020614624, -8.896924555301666e-05, -7.781758904457092e-05, -6.666593253612518e-05, -5.551427602767944e-05, -4.4362619519233704e-05, -3.3210963010787964e-05, -2.2059306502342224e-05, -1.0907649993896484e-05, 2.4400651454925537e-07, 1.1395663022994995e-05, 2.2547319531440735e-05, 3.3698976039886475e-05, 4.4850632548332214e-05, 5.6002289056777954e-05, 6.71539455652237e-05, 7.830560207366943e-05, 8.945725858211517e-05, 0.00010060891509056091, 0.00011176057159900665, 0.0001229122281074524, 0.00013406388461589813, 0.00014521554112434387, 0.0001563671976327896, 0.00016751885414123535, 0.0001786705106496811, 0.00018982216715812683, 0.00020097382366657257, 0.0002121254801750183, 0.00022327713668346405, 0.0002344287931919098, 0.00024558044970035553, 0.00025673210620880127, 0.000267883762717247, 0.00027903541922569275, 0.0002901870757341385, 0.00030133873224258423, 0.00031249038875102997, 0.0003236420452594757, 0.00033479370176792145, 0.0003459453582763672]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 0.0, 8.0, 4.0, 5.0, 9.0, 7.0, 6.0, 21.0, 16.0, 17.0, 14.0, 29.0, 32.0, 13.0, 34.0, 31.0, 26.0, 35.0, 40.0, 38.0, 38.0, 46.0, 36.0, 43.0, 34.0, 42.0, 39.0, 41.0, 29.0, 31.0, 21.0, 27.0, 26.0, 15.0, 22.0, 18.0, 13.0, 24.0, 11.0, 12.0, 8.0, 4.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.13812255859375, -4.0028076171875, -3.86749267578125, -3.732177734375, -3.59686279296875, -3.4615478515625, -3.32623291015625, -3.19091796875, -3.05560302734375, -2.9202880859375, -2.78497314453125, -2.649658203125, -2.51434326171875, -2.3790283203125, -2.24371337890625, -2.1083984375, -1.97308349609375, -1.8377685546875, -1.70245361328125, -1.567138671875, -1.43182373046875, -1.2965087890625, -1.16119384765625, -1.02587890625, -0.89056396484375, -0.7552490234375, -0.61993408203125, -0.484619140625, -0.34930419921875, -0.2139892578125, -0.07867431640625, 0.056640625, 0.19195556640625, 0.3272705078125, 0.46258544921875, 0.597900390625, 0.73321533203125, 0.8685302734375, 1.00384521484375, 1.13916015625, 1.27447509765625, 1.4097900390625, 1.54510498046875, 1.680419921875, 1.81573486328125, 1.9510498046875, 2.08636474609375, 2.2216796875, 2.35699462890625, 2.4923095703125, 2.62762451171875, 2.762939453125, 2.89825439453125, 3.0335693359375, 3.16888427734375, 3.30419921875, 3.43951416015625, 3.5748291015625, 3.71014404296875, 3.845458984375, 3.98077392578125, 4.1160888671875, 4.25140380859375, 4.38671875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 10.0, 9.0, 11.0, 10.0, 12.0, 20.0, 18.0, 26.0, 50.0, 52.0, 118.0, 192.0, 353.0, 660.0, 1270.0, 2552.0, 4955.0, 9991.0, 20287.0, 44634.0, 108413.0, 275024.0, 334703.0, 139969.0, 55966.0, 24545.0, 12240.0, 6169.0, 2960.0, 1540.0, 797.0, 411.0, 203.0, 123.0, 73.0, 44.0, 21.0, 27.0, 17.0, 21.0, 11.0, 10.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.87530517578125, -3.7467041015625, -3.61810302734375, -3.489501953125, -3.36090087890625, -3.2322998046875, -3.10369873046875, -2.97509765625, -2.84649658203125, -2.7178955078125, -2.58929443359375, -2.460693359375, -2.33209228515625, -2.2034912109375, -2.07489013671875, -1.9462890625, -1.81768798828125, -1.6890869140625, -1.56048583984375, -1.431884765625, -1.30328369140625, -1.1746826171875, -1.04608154296875, -0.91748046875, -0.78887939453125, -0.6602783203125, -0.53167724609375, -0.403076171875, -0.27447509765625, -0.1458740234375, -0.01727294921875, 0.111328125, 0.23992919921875, 0.3685302734375, 0.49713134765625, 0.625732421875, 0.75433349609375, 0.8829345703125, 1.01153564453125, 1.14013671875, 1.26873779296875, 1.3973388671875, 1.52593994140625, 1.654541015625, 1.78314208984375, 1.9117431640625, 2.04034423828125, 2.1689453125, 2.29754638671875, 2.4261474609375, 2.55474853515625, 2.683349609375, 2.81195068359375, 2.9405517578125, 3.06915283203125, 3.19775390625, 3.32635498046875, 3.4549560546875, 3.58355712890625, 3.712158203125, 3.84075927734375, 3.9693603515625, 4.09796142578125, 4.2265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 14.0, 17.0, 17.0, 17.0, 32.0, 31.0, 35.0, 40.0, 39.0, 47.0, 67.0, 101.0, 175.0, 1529.0, 344.0, 108.0, 63.0, 61.0, 45.0, 43.0, 39.0, 32.0, 22.0, 24.0, 16.0, 17.0, 13.0, 8.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.76904296875, -19.1474609375, -18.52587890625, -17.904296875, -17.28271484375, -16.6611328125, -16.03955078125, -15.41796875, -14.79638671875, -14.1748046875, -13.55322265625, -12.931640625, -12.31005859375, -11.6884765625, -11.06689453125, -10.4453125, -9.82373046875, -9.2021484375, -8.58056640625, -7.958984375, -7.33740234375, -6.7158203125, -6.09423828125, -5.47265625, -4.85107421875, -4.2294921875, -3.60791015625, -2.986328125, -2.36474609375, -1.7431640625, -1.12158203125, -0.5, 0.12158203125, 0.7431640625, 1.36474609375, 1.986328125, 2.60791015625, 3.2294921875, 3.85107421875, 4.47265625, 5.09423828125, 5.7158203125, 6.33740234375, 6.958984375, 7.58056640625, 8.2021484375, 8.82373046875, 9.4453125, 10.06689453125, 10.6884765625, 11.31005859375, 11.931640625, 12.55322265625, 13.1748046875, 13.79638671875, 14.41796875, 15.03955078125, 15.6611328125, 16.28271484375, 16.904296875, 17.52587890625, 18.1474609375, 18.76904296875, 19.390625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 7.0, 12.0, 19.0, 24.0, 27.0, 37.0, 54.0, 53.0, 104.0, 143.0, 248.0, 400.0, 940.0, 67395.0, 3071819.0, 2850.0, 592.0, 327.0, 213.0, 131.0, 78.0, 54.0, 34.0, 36.0, 29.0, 17.0, 13.0, 11.0, 7.0, 5.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.9375, -60.01611328125, -58.0947265625, -56.17333984375, -54.251953125, -52.33056640625, -50.4091796875, -48.48779296875, -46.56640625, -44.64501953125, -42.7236328125, -40.80224609375, -38.880859375, -36.95947265625, -35.0380859375, -33.11669921875, -31.1953125, -29.27392578125, -27.3525390625, -25.43115234375, -23.509765625, -21.58837890625, -19.6669921875, -17.74560546875, -15.82421875, -13.90283203125, -11.9814453125, -10.06005859375, -8.138671875, -6.21728515625, -4.2958984375, -2.37451171875, -0.453125, 1.46826171875, 3.3896484375, 5.31103515625, 7.232421875, 9.15380859375, 11.0751953125, 12.99658203125, 14.91796875, 16.83935546875, 18.7607421875, 20.68212890625, 22.603515625, 24.52490234375, 26.4462890625, 28.36767578125, 30.2890625, 32.21044921875, 34.1318359375, 36.05322265625, 37.974609375, 39.89599609375, 41.8173828125, 43.73876953125, 45.66015625, 47.58154296875, 49.5029296875, 51.42431640625, 53.345703125, 55.26708984375, 57.1884765625, 59.10986328125, 61.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 14.0, 411.0, 564.0, 27.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-211.0338134765625, -207.33335876464844, -203.6328887939453, -199.93243408203125, -196.2319793701172, -192.53152465820312, -188.8310546875, -185.13059997558594, -181.43014526367188, -177.7296905517578, -174.0292205810547, -170.32876586914062, -166.62831115722656, -162.9278564453125, -159.22738647460938, -155.5269317626953, -151.8264617919922, -148.12600708007812, -144.425537109375, -140.72508239746094, -137.02462768554688, -133.32415771484375, -129.6237030029297, -125.92324829101562, -122.22279357910156, -118.52233123779297, -114.8218765258789, -111.12141418457031, -107.42095947265625, -103.72049713134766, -100.02003479003906, -96.319580078125, -92.61911010742188, -88.91864776611328, -85.21819305419922, -81.51773071289062, -77.81727600097656, -74.11681365966797, -70.41635131835938, -66.71589660644531, -63.01544189453125, -59.31498336791992, -55.614524841308594, -51.9140625, -48.21360397338867, -44.513145446777344, -40.812686920166016, -37.11222839355469, -33.411766052246094, -29.711307525634766, -26.010847091674805, -22.310388565063477, -18.609928131103516, -14.909469604492188, -11.20901107788086, -7.508550643920898, -3.8080921173095703, -0.10763287544250488, 3.5928263664245605, 7.293285369873047, 10.993744850158691, 14.694204330444336, 18.394662857055664, 22.095123291015625, 25.795581817626953]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 2.0, 9.0, 1.0, 12.0, 13.0, 12.0, 7.0, 22.0, 22.0, 19.0, 23.0, 28.0, 30.0, 25.0, 34.0, 36.0, 29.0, 50.0, 58.0, 42.0, 38.0, 47.0, 47.0, 50.0, 48.0, 31.0, 29.0, 27.0, 23.0, 24.0, 20.0, 28.0, 17.0, 13.0, 21.0, 8.0, 14.0, 7.0, 11.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.97172546386719, -39.65695571899414, -38.342185974121094, -37.02741622924805, -35.712646484375, -34.39787673950195, -33.083106994628906, -31.768339157104492, -30.453569412231445, -29.1387996673584, -27.82402992248535, -26.509260177612305, -25.19449234008789, -23.879722595214844, -22.564952850341797, -21.25018310546875, -19.935413360595703, -18.620643615722656, -17.30587387084961, -15.991105079650879, -14.676335334777832, -13.361565589904785, -12.046796798706055, -10.732027053833008, -9.417257308959961, -8.102487564086914, -6.787718296051025, -5.472949028015137, -4.15817928314209, -2.843409538269043, -1.5286402702331543, -0.21387100219726562, 1.1008987426757812, 2.415668249130249, 3.730437755584717, 5.0452070236206055, 6.359976768493652, 7.674746513366699, 8.98951530456543, 10.304285049438477, 11.619054794311523, 12.93382453918457, 14.248594284057617, 15.563363075256348, 16.878131866455078, 18.192901611328125, 19.507671356201172, 20.82244110107422, 22.137210845947266, 23.451980590820312, 24.76675033569336, 26.081520080566406, 27.396289825439453, 28.7110595703125, 30.025827407836914, 31.34059715270996, 32.655364990234375, 33.97013473510742, 35.28490447998047, 36.599674224853516, 37.91444396972656, 39.22921371459961, 40.543983459472656, 41.85874938964844, 43.17352294921875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 6.0, 1.0, 9.0, 6.0, 6.0, 4.0, 10.0, 18.0, 11.0, 23.0, 18.0, 20.0, 17.0, 24.0, 31.0, 25.0, 27.0, 32.0, 39.0, 37.0, 42.0, 31.0, 41.0, 42.0, 45.0, 40.0, 37.0, 39.0, 28.0, 28.0, 26.0, 31.0, 21.0, 16.0, 23.0, 23.0, 14.0, 18.0, 13.0, 21.0, 8.0, 7.0, 11.0, 9.0, 4.0, 3.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.73046875, -4.5848388671875, -4.439208984375, -4.2935791015625, -4.14794921875, -4.0023193359375, -3.856689453125, -3.7110595703125, -3.5654296875, -3.4197998046875, -3.274169921875, -3.1285400390625, -2.98291015625, -2.8372802734375, -2.691650390625, -2.5460205078125, -2.400390625, -2.2547607421875, -2.109130859375, -1.9635009765625, -1.81787109375, -1.6722412109375, -1.526611328125, -1.3809814453125, -1.2353515625, -1.0897216796875, -0.944091796875, -0.7984619140625, -0.65283203125, -0.5072021484375, -0.361572265625, -0.2159423828125, -0.0703125, 0.0753173828125, 0.220947265625, 0.3665771484375, 0.51220703125, 0.6578369140625, 0.803466796875, 0.9490966796875, 1.0947265625, 1.2403564453125, 1.385986328125, 1.5316162109375, 1.67724609375, 1.8228759765625, 1.968505859375, 2.1141357421875, 2.259765625, 2.4053955078125, 2.551025390625, 2.6966552734375, 2.84228515625, 2.9879150390625, 3.133544921875, 3.2791748046875, 3.4248046875, 3.5704345703125, 3.716064453125, 3.8616943359375, 4.00732421875, 4.1529541015625, 4.298583984375, 4.4442138671875, 4.58984375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 7.0, 7.0, 11.0, 10.0, 8.0, 16.0, 13.0, 18.0, 26.0, 36.0, 54.0, 54.0, 67.0, 100.0, 130.0, 220.0, 474.0, 1466.0, 8941.0, 306519.0, 3096792.0, 756071.0, 19471.0, 2190.0, 662.0, 288.0, 152.0, 77.0, 77.0, 64.0, 51.0, 43.0, 25.0, 25.0, 24.0, 20.0, 11.0, 10.0, 9.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-16.359375, -15.886962890625, -15.41455078125, -14.942138671875, -14.4697265625, -13.997314453125, -13.52490234375, -13.052490234375, -12.580078125, -12.107666015625, -11.63525390625, -11.162841796875, -10.6904296875, -10.218017578125, -9.74560546875, -9.273193359375, -8.80078125, -8.328369140625, -7.85595703125, -7.383544921875, -6.9111328125, -6.438720703125, -5.96630859375, -5.493896484375, -5.021484375, -4.549072265625, -4.07666015625, -3.604248046875, -3.1318359375, -2.659423828125, -2.18701171875, -1.714599609375, -1.2421875, -0.769775390625, -0.29736328125, 0.175048828125, 0.6474609375, 1.119873046875, 1.59228515625, 2.064697265625, 2.537109375, 3.009521484375, 3.48193359375, 3.954345703125, 4.4267578125, 4.899169921875, 5.37158203125, 5.843994140625, 6.31640625, 6.788818359375, 7.26123046875, 7.733642578125, 8.2060546875, 8.678466796875, 9.15087890625, 9.623291015625, 10.095703125, 10.568115234375, 11.04052734375, 11.512939453125, 11.9853515625, 12.457763671875, 12.93017578125, 13.402587890625, 13.875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 12.0, 21.0, 36.0, 51.0, 58.0, 81.0, 149.0, 193.0, 289.0, 449.0, 603.0, 624.0, 488.0, 353.0, 243.0, 125.0, 98.0, 70.0, 33.0, 24.0, 23.0, 21.0, 9.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.9769287109375, -13.555419921875, -13.1339111328125, -12.71240234375, -12.2908935546875, -11.869384765625, -11.4478759765625, -11.0263671875, -10.6048583984375, -10.183349609375, -9.7618408203125, -9.34033203125, -8.9188232421875, -8.497314453125, -8.0758056640625, -7.654296875, -7.2327880859375, -6.811279296875, -6.3897705078125, -5.96826171875, -5.5467529296875, -5.125244140625, -4.7037353515625, -4.2822265625, -3.8607177734375, -3.439208984375, -3.0177001953125, -2.59619140625, -2.1746826171875, -1.753173828125, -1.3316650390625, -0.91015625, -0.4886474609375, -0.067138671875, 0.3543701171875, 0.77587890625, 1.1973876953125, 1.618896484375, 2.0404052734375, 2.4619140625, 2.8834228515625, 3.304931640625, 3.7264404296875, 4.14794921875, 4.5694580078125, 4.990966796875, 5.4124755859375, 5.833984375, 6.2554931640625, 6.677001953125, 7.0985107421875, 7.52001953125, 7.9415283203125, 8.363037109375, 8.7845458984375, 9.2060546875, 9.6275634765625, 10.049072265625, 10.4705810546875, 10.89208984375, 11.3135986328125, 11.735107421875, 12.1566162109375, 12.578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 12.0, 21.0, 21.0, 34.0, 46.0, 84.0, 124.0, 165.0, 325.0, 477.0, 1199.0, 681665.0, 3506683.0, 1905.0, 545.0, 317.0, 237.0, 137.0, 106.0, 70.0, 38.0, 33.0, 12.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.5, -56.556640625, -54.61328125, -52.669921875, -50.7265625, -48.783203125, -46.83984375, -44.896484375, -42.953125, -41.009765625, -39.06640625, -37.123046875, -35.1796875, -33.236328125, -31.29296875, -29.349609375, -27.40625, -25.462890625, -23.51953125, -21.576171875, -19.6328125, -17.689453125, -15.74609375, -13.802734375, -11.859375, -9.916015625, -7.97265625, -6.029296875, -4.0859375, -2.142578125, -0.19921875, 1.744140625, 3.6875, 5.630859375, 7.57421875, 9.517578125, 11.4609375, 13.404296875, 15.34765625, 17.291015625, 19.234375, 21.177734375, 23.12109375, 25.064453125, 27.0078125, 28.951171875, 30.89453125, 32.837890625, 34.78125, 36.724609375, 38.66796875, 40.611328125, 42.5546875, 44.498046875, 46.44140625, 48.384765625, 50.328125, 52.271484375, 54.21484375, 56.158203125, 58.1015625, 60.044921875, 61.98828125, 63.931640625, 65.875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 29.0, 184.0, 480.0, 268.0, 53.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.27511596679688, -171.4671173095703, -166.65911865234375, -161.85110473632812, -157.04310607910156, -152.235107421875, -147.42709350585938, -142.6190948486328, -137.81109619140625, -133.0030975341797, -128.19509887695312, -123.3870849609375, -118.57908630371094, -113.77108764648438, -108.96308135986328, -104.15507507324219, -99.34707641601562, -94.53907775878906, -89.73107147216797, -84.92306518554688, -80.11506652832031, -75.30706787109375, -70.49906158447266, -65.69105529785156, -60.883056640625, -56.07505416870117, -51.267051696777344, -46.459049224853516, -41.65104675292969, -36.84304428100586, -32.03504180908203, -27.227039337158203, -22.419036865234375, -17.611034393310547, -12.803031921386719, -7.995029449462891, -3.1870269775390625, 1.6209754943847656, 6.428977966308594, 11.236980438232422, 16.04498291015625, 20.852985382080078, 25.660987854003906, 30.468990325927734, 35.27699279785156, 40.08499526977539, 44.89299774169922, 49.70100021362305, 54.509002685546875, 59.3170051574707, 64.12500762939453, 68.93301391601562, 73.74101257324219, 78.54901123046875, 83.35701751708984, 88.16502380371094, 92.9730224609375, 97.78102111816406, 102.58902740478516, 107.39703369140625, 112.20503234863281, 117.01303100585938, 121.82103729248047, 126.62904357910156, 131.43704223632812]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 11.0, 13.0, 13.0, 13.0, 17.0, 15.0, 24.0, 24.0, 21.0, 18.0, 28.0, 42.0, 39.0, 38.0, 43.0, 32.0, 40.0, 39.0, 48.0, 41.0, 34.0, 50.0, 43.0, 39.0, 20.0, 22.0, 21.0, 22.0, 27.0, 26.0, 14.0, 15.0, 19.0, 13.0, 9.0, 3.0, 15.0, 5.0, 3.0, 6.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.30865478515625, -28.362224578857422, -27.415794372558594, -26.469364166259766, -25.52293586730957, -24.576505661010742, -23.630075454711914, -22.683645248413086, -21.73721694946289, -20.790786743164062, -19.844356536865234, -18.897926330566406, -17.95149803161621, -17.005067825317383, -16.058637619018555, -15.112207412719727, -14.165777206420898, -13.21934700012207, -12.272917747497559, -11.32648754119873, -10.380058288574219, -9.43362808227539, -8.487197875976562, -7.540768146514893, -6.594338417053223, -5.647908687591553, -4.701478958129883, -3.7550487518310547, -2.8086190223693848, -1.8621892929077148, -0.9157590866088867, 0.030670642852783203, 0.9770984649658203, 1.9235283136367798, 2.8699581623077393, 3.8163881301879883, 4.762817859649658, 5.709247589111328, 6.655677795410156, 7.602107524871826, 8.548537254333496, 9.494967460632324, 10.441396713256836, 11.387826919555664, 12.334257125854492, 13.280686378479004, 14.227116584777832, 15.173545837402344, 16.119976043701172, 17.06640625, 18.012836456298828, 18.959266662597656, 19.90569496154785, 20.85212516784668, 21.798555374145508, 22.744985580444336, 23.69141387939453, 24.63784408569336, 25.584274291992188, 26.530704498291016, 27.47713279724121, 28.42356300354004, 29.369993209838867, 30.316423416137695, 31.262853622436523]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 10.0, 8.0, 12.0, 11.0, 15.0, 14.0, 8.0, 20.0, 25.0, 18.0, 23.0, 34.0, 33.0, 45.0, 34.0, 37.0, 48.0, 45.0, 44.0, 37.0, 50.0, 42.0, 40.0, 38.0, 34.0, 29.0, 26.0, 23.0, 30.0, 27.0, 22.0, 14.0, 17.0, 15.0, 8.0, 16.0, 11.0, 3.0, 7.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.65191650390625, -4.4991455078125, -4.34637451171875, -4.193603515625, -4.04083251953125, -3.8880615234375, -3.73529052734375, -3.58251953125, -3.42974853515625, -3.2769775390625, -3.12420654296875, -2.971435546875, -2.81866455078125, -2.6658935546875, -2.51312255859375, -2.3603515625, -2.20758056640625, -2.0548095703125, -1.90203857421875, -1.749267578125, -1.59649658203125, -1.4437255859375, -1.29095458984375, -1.13818359375, -0.98541259765625, -0.8326416015625, -0.67987060546875, -0.527099609375, -0.37432861328125, -0.2215576171875, -0.06878662109375, 0.083984375, 0.23675537109375, 0.3895263671875, 0.54229736328125, 0.695068359375, 0.84783935546875, 1.0006103515625, 1.15338134765625, 1.30615234375, 1.45892333984375, 1.6116943359375, 1.76446533203125, 1.917236328125, 2.07000732421875, 2.2227783203125, 2.37554931640625, 2.5283203125, 2.68109130859375, 2.8338623046875, 2.98663330078125, 3.139404296875, 3.29217529296875, 3.4449462890625, 3.59771728515625, 3.75048828125, 3.90325927734375, 4.0560302734375, 4.20880126953125, 4.361572265625, 4.51434326171875, 4.6671142578125, 4.81988525390625, 4.97265625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 13.0, 10.0, 28.0, 26.0, 45.0, 58.0, 91.0, 136.0, 197.0, 293.0, 411.0, 585.0, 861.0, 1189.0, 1926.0, 2695.0, 3892.0, 5897.0, 8567.0, 12585.0, 19038.0, 28899.0, 45479.0, 76641.0, 149381.0, 330459.0, 149140.0, 76622.0, 46023.0, 29030.0, 18845.0, 12611.0, 8791.0, 5801.0, 3905.0, 2580.0, 1881.0, 1250.0, 830.0, 604.0, 404.0, 281.0, 183.0, 120.0, 92.0, 57.0, 34.0, 28.0, 12.0, 14.0, 8.0, 7.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0498046875, -1.0175018310546875, -0.985198974609375, -0.9528961181640625, -0.92059326171875, -0.8882904052734375, -0.855987548828125, -0.8236846923828125, -0.7913818359375, -0.7590789794921875, -0.726776123046875, -0.6944732666015625, -0.66217041015625, -0.6298675537109375, -0.597564697265625, -0.5652618408203125, -0.532958984375, -0.5006561279296875, -0.468353271484375, -0.4360504150390625, -0.40374755859375, -0.3714447021484375, -0.339141845703125, -0.3068389892578125, -0.2745361328125, -0.2422332763671875, -0.209930419921875, -0.1776275634765625, -0.14532470703125, -0.1130218505859375, -0.080718994140625, -0.0484161376953125, -0.01611328125, 0.0161895751953125, 0.048492431640625, 0.0807952880859375, 0.11309814453125, 0.1454010009765625, 0.177703857421875, 0.2100067138671875, 0.2423095703125, 0.2746124267578125, 0.306915283203125, 0.3392181396484375, 0.37152099609375, 0.4038238525390625, 0.436126708984375, 0.4684295654296875, 0.500732421875, 0.5330352783203125, 0.565338134765625, 0.5976409912109375, 0.62994384765625, 0.6622467041015625, 0.694549560546875, 0.7268524169921875, 0.7591552734375, 0.7914581298828125, 0.823760986328125, 0.8560638427734375, 0.88836669921875, 0.9206695556640625, 0.952972412109375, 0.9852752685546875, 1.017578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 9.0, 15.0, 14.0, 18.0, 15.0, 16.0, 34.0, 24.0, 32.0, 31.0, 32.0, 22.0, 47.0, 25.0, 33.0, 38.0, 44.0, 1054.0, 33.0, 51.0, 40.0, 31.0, 38.0, 34.0, 36.0, 23.0, 32.0, 30.0, 21.0, 24.0, 19.0, 16.0, 20.0, 12.0, 8.0, 11.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03515625, -2.94207763671875, -2.8489990234375, -2.75592041015625, -2.662841796875, -2.56976318359375, -2.4766845703125, -2.38360595703125, -2.29052734375, -2.19744873046875, -2.1043701171875, -2.01129150390625, -1.918212890625, -1.82513427734375, -1.7320556640625, -1.63897705078125, -1.5458984375, -1.45281982421875, -1.3597412109375, -1.26666259765625, -1.173583984375, -1.08050537109375, -0.9874267578125, -0.89434814453125, -0.80126953125, -0.70819091796875, -0.6151123046875, -0.52203369140625, -0.428955078125, -0.33587646484375, -0.2427978515625, -0.14971923828125, -0.056640625, 0.03643798828125, 0.1295166015625, 0.22259521484375, 0.315673828125, 0.40875244140625, 0.5018310546875, 0.59490966796875, 0.68798828125, 0.78106689453125, 0.8741455078125, 0.96722412109375, 1.060302734375, 1.15338134765625, 1.2464599609375, 1.33953857421875, 1.4326171875, 1.52569580078125, 1.6187744140625, 1.71185302734375, 1.804931640625, 1.89801025390625, 1.9910888671875, 2.08416748046875, 2.17724609375, 2.27032470703125, 2.3634033203125, 2.45648193359375, 2.549560546875, 2.64263916015625, 2.7357177734375, 2.82879638671875, 2.921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 1.0, 11.0, 8.0, 16.0, 28.0, 30.0, 71.0, 100.0, 147.0, 226.0, 341.0, 569.0, 876.0, 1391.0, 2254.0, 3658.0, 6073.0, 10034.0, 16960.0, 29203.0, 50523.0, 89955.0, 190686.0, 1396222.0, 130625.0, 70013.0, 39556.0, 23064.0, 13701.0, 7990.0, 4979.0, 2904.0, 1817.0, 1129.0, 718.0, 427.0, 275.0, 185.0, 113.0, 86.0, 55.0, 34.0, 30.0, 16.0, 12.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1962890625, -1.158050537109375, -1.11981201171875, -1.081573486328125, -1.0433349609375, -1.005096435546875, -0.96685791015625, -0.928619384765625, -0.890380859375, -0.852142333984375, -0.81390380859375, -0.775665283203125, -0.7374267578125, -0.699188232421875, -0.66094970703125, -0.622711181640625, -0.58447265625, -0.546234130859375, -0.50799560546875, -0.469757080078125, -0.4315185546875, -0.393280029296875, -0.35504150390625, -0.316802978515625, -0.278564453125, -0.240325927734375, -0.20208740234375, -0.163848876953125, -0.1256103515625, -0.087371826171875, -0.04913330078125, -0.010894775390625, 0.02734375, 0.065582275390625, 0.10382080078125, 0.142059326171875, 0.1802978515625, 0.218536376953125, 0.25677490234375, 0.295013427734375, 0.333251953125, 0.371490478515625, 0.40972900390625, 0.447967529296875, 0.4862060546875, 0.524444580078125, 0.56268310546875, 0.600921630859375, 0.63916015625, 0.677398681640625, 0.71563720703125, 0.753875732421875, 0.7921142578125, 0.830352783203125, 0.86859130859375, 0.906829833984375, 0.945068359375, 0.983306884765625, 1.02154541015625, 1.059783935546875, 1.0980224609375, 1.136260986328125, 1.17449951171875, 1.212738037109375, 1.2509765625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 1.0, 5.0, 6.0, 9.0, 8.0, 13.0, 18.0, 20.0, 31.0, 26.0, 43.0, 74.0, 96.0, 126.0, 121.0, 105.0, 70.0, 48.0, 40.0, 27.0, 25.0, 19.0, 11.0, 12.0, 8.0, 5.0, 5.0, 4.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010460317134857178, -0.001014411449432373, -0.0009827911853790283, -0.0009511709213256836, -0.0009195506572723389, -0.0008879303932189941, -0.0008563101291656494, -0.0008246898651123047, -0.00079306960105896, -0.0007614493370056152, -0.0007298290729522705, -0.0006982088088989258, -0.0006665885448455811, -0.0006349682807922363, -0.0006033480167388916, -0.0005717277526855469, -0.0005401074886322021, -0.0005084872245788574, -0.0004768669605255127, -0.00044524669647216797, -0.00041362643241882324, -0.0003820061683654785, -0.0003503859043121338, -0.00031876564025878906, -0.00028714537620544434, -0.0002555251121520996, -0.00022390484809875488, -0.00019228458404541016, -0.00016066431999206543, -0.0001290440559387207, -9.742379188537598e-05, -6.580352783203125e-05, -3.4183263778686523e-05, -2.562999725341797e-06, 2.905726432800293e-05, 6.0677528381347656e-05, 9.229779243469238e-05, 0.0001239180564880371, 0.00015553832054138184, 0.00018715858459472656, 0.0002187788486480713, 0.000250399112701416, 0.00028201937675476074, 0.00031363964080810547, 0.0003452599048614502, 0.0003768801689147949, 0.00040850043296813965, 0.0004401206970214844, 0.0004717409610748291, 0.0005033612251281738, 0.0005349814891815186, 0.0005666017532348633, 0.000598222017288208, 0.0006298422813415527, 0.0006614625453948975, 0.0006930828094482422, 0.0007247030735015869, 0.0007563233375549316, 0.0007879436016082764, 0.0008195638656616211, 0.0008511841297149658, 0.0008828043937683105, 0.0009144246578216553, 0.000946044921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 7.0, 16.0, 19.0, 19.0, 22.0, 27.0, 46.0, 77.0, 112.0, 168.0, 394.0, 1831.0, 1027074.0, 17498.0, 567.0, 230.0, 144.0, 79.0, 45.0, 37.0, 26.0, 22.0, 12.0, 9.0, 10.0, 6.0, 8.0, 9.0, 2.0, 1.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0209197998046875, -0.020259857177734375, -0.01959991455078125, -0.018939971923828125, -0.018280029296875, -0.017620086669921875, -0.01696014404296875, -0.016300201416015625, -0.0156402587890625, -0.014980316162109375, -0.01432037353515625, -0.013660430908203125, -0.01300048828125, -0.012340545654296875, -0.01168060302734375, -0.011020660400390625, -0.0103607177734375, -0.009700775146484375, -0.00904083251953125, -0.008380889892578125, -0.007720947265625, -0.007061004638671875, -0.00640106201171875, -0.005741119384765625, -0.0050811767578125, -0.004421234130859375, -0.00376129150390625, -0.003101348876953125, -0.00244140625, -0.001781463623046875, -0.00112152099609375, -0.000461578369140625, 0.0001983642578125, 0.000858306884765625, 0.00151824951171875, 0.002178192138671875, 0.002838134765625, 0.003498077392578125, 0.00415802001953125, 0.004817962646484375, 0.0054779052734375, 0.006137847900390625, 0.00679779052734375, 0.007457733154296875, 0.00811767578125, 0.008777618408203125, 0.00943756103515625, 0.010097503662109375, 0.0107574462890625, 0.011417388916015625, 0.01207733154296875, 0.012737274169921875, 0.013397216796875, 0.014057159423828125, 0.01471710205078125, 0.015377044677734375, 0.0160369873046875, 0.016696929931640625, 0.01735687255859375, 0.018016815185546875, 0.0186767578125, 0.019336700439453125, 0.01999664306640625, 0.020656585693359375, 0.0213165283203125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 17.0, 19.0, 36.0, 35.0, 56.0, 76.0, 99.0, 146.0, 150.0, 114.0, 85.0, 54.0, 31.0, 36.0, 19.0, 14.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005531213246285915, -0.0005389315774664283, -0.000524741830304265, -0.0005105520831421018, -0.0004963623359799385, -0.00048217258881777525, -0.000467982841655612, -0.00045379309449344873, -0.0004396033473312855, -0.0004254136001691222, -0.00041122385300695896, -0.0003970341058447957, -0.00038284435868263245, -0.0003686546115204692, -0.00035446486435830593, -0.0003402751171961427, -0.0003260853700339794, -0.00031189562287181616, -0.0002977058757096529, -0.00028351612854748964, -0.0002693263813853264, -0.00025513663422316313, -0.00024094688706099987, -0.0002267571398988366, -0.0002125673636328429, -0.00019837761647067964, -0.00018418786930851638, -0.00016999812214635313, -0.00015580837498418987, -0.0001416186278220266, -0.00012742888065986335, -0.00011323912622174248, -9.904938633553684e-05, -8.485963917337358e-05, -7.066989201121032e-05, -5.648014121106826e-05, -4.2290394048905e-05, -2.8100643248762935e-05, -1.3910896086599678e-05, 2.788510755635798e-07, 1.4468598237726837e-05, 2.8658345399890095e-05, 4.284809256205335e-05, 5.703784336219542e-05, 7.122759416233748e-05, 8.541734132450074e-05, 9.9607088486664e-05, 0.00011379683564882725, 0.0001279865828109905, 0.00014217632997315377, 0.00015636607713531703, 0.00017055582429748029, 0.00018474557145964354, 0.00019893533317372203, 0.00021312508033588529, 0.00022731482749804854, 0.0002415045746602118, 0.00025569432182237506, 0.0002698840689845383, 0.0002840738161467016, 0.00029826356330886483, 0.0003124533104710281, 0.00032664305763319135, 0.0003408328047953546, 0.00035502255195751786]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 9.0, 7.0, 3.0, 5.0, 10.0, 16.0, 16.0, 14.0, 15.0, 16.0, 19.0, 17.0, 24.0, 25.0, 31.0, 23.0, 29.0, 39.0, 29.0, 38.0, 47.0, 44.0, 30.0, 44.0, 41.0, 30.0, 39.0, 35.0, 36.0, 41.0, 31.0, 35.0, 24.0, 25.0, 16.0, 15.0, 21.0, 12.0, 11.0, 7.0, 9.0, 7.0, 8.0, 2.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003560185432434082, -0.00034403055906295776, -0.0003320425748825073, -0.0003200545907020569, -0.00030806660652160645, -0.000296078622341156, -0.00028409063816070557, -0.0002721026539802551, -0.0002601146697998047, -0.00024812668561935425, -0.0002361387014389038, -0.00022415071725845337, -0.00021216273307800293, -0.0002001747488975525, -0.00018818676471710205, -0.0001761987805366516, -0.00016421079635620117, -0.00015222281217575073, -0.0001402348279953003, -0.00012824684381484985, -0.00011625885963439941, -0.00010427087545394897, -9.228289127349854e-05, -8.02949070930481e-05, -6.830692291259766e-05, -5.631893873214722e-05, -4.433095455169678e-05, -3.234297037124634e-05, -2.03549861907959e-05, -8.367002010345459e-06, 3.6209821701049805e-06, 1.560896635055542e-05, 2.759695053100586e-05, 3.95849347114563e-05, 5.157291889190674e-05, 6.356090307235718e-05, 7.554888725280762e-05, 8.753687143325806e-05, 9.95248556137085e-05, 0.00011151283979415894, 0.00012350082397460938, 0.00013548880815505981, 0.00014747679233551025, 0.0001594647765159607, 0.00017145276069641113, 0.00018344074487686157, 0.000195428729057312, 0.00020741671323776245, 0.0002194046974182129, 0.00023139268159866333, 0.00024338066577911377, 0.0002553686499595642, 0.00026735663414001465, 0.0002793446183204651, 0.00029133260250091553, 0.00030332058668136597, 0.0003153085708618164, 0.00032729655504226685, 0.0003392845392227173, 0.0003512725234031677, 0.00036326050758361816, 0.0003752484917640686, 0.00038723647594451904, 0.0003992244601249695, 0.0004112124443054199]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 10.0, 8.0, 12.0, 11.0, 15.0, 14.0, 8.0, 20.0, 25.0, 18.0, 23.0, 34.0, 33.0, 45.0, 34.0, 37.0, 48.0, 45.0, 44.0, 37.0, 50.0, 42.0, 40.0, 38.0, 34.0, 29.0, 26.0, 23.0, 30.0, 27.0, 22.0, 14.0, 17.0, 15.0, 8.0, 16.0, 11.0, 3.0, 7.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.65191650390625, -4.4991455078125, -4.34637451171875, -4.193603515625, -4.04083251953125, -3.8880615234375, -3.73529052734375, -3.58251953125, -3.42974853515625, -3.2769775390625, -3.12420654296875, -2.971435546875, -2.81866455078125, -2.6658935546875, -2.51312255859375, -2.3603515625, -2.20758056640625, -2.0548095703125, -1.90203857421875, -1.749267578125, -1.59649658203125, -1.4437255859375, -1.29095458984375, -1.13818359375, -0.98541259765625, -0.8326416015625, -0.67987060546875, -0.527099609375, -0.37432861328125, -0.2215576171875, -0.06878662109375, 0.083984375, 0.23675537109375, 0.3895263671875, 0.54229736328125, 0.695068359375, 0.84783935546875, 1.0006103515625, 1.15338134765625, 1.30615234375, 1.45892333984375, 1.6116943359375, 1.76446533203125, 1.917236328125, 2.07000732421875, 2.2227783203125, 2.37554931640625, 2.5283203125, 2.68109130859375, 2.8338623046875, 2.98663330078125, 3.139404296875, 3.29217529296875, 3.4449462890625, 3.59771728515625, 3.75048828125, 3.90325927734375, 4.0560302734375, 4.20880126953125, 4.361572265625, 4.51434326171875, 4.6671142578125, 4.81988525390625, 4.97265625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 10.0, 13.0, 22.0, 30.0, 27.0, 37.0, 40.0, 57.0, 74.0, 102.0, 140.0, 205.0, 397.0, 909.0, 2095.0, 5471.0, 14438.0, 39633.0, 106753.0, 284194.0, 368092.0, 141546.0, 52319.0, 19559.0, 7141.0, 2733.0, 1144.0, 478.0, 253.0, 178.0, 82.0, 80.0, 58.0, 58.0, 35.0, 33.0, 27.0, 15.0, 20.0, 14.0, 9.0, 5.0, 7.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.9490966796875, -4.784912109375, -4.6207275390625, -4.45654296875, -4.2923583984375, -4.128173828125, -3.9639892578125, -3.7998046875, -3.6356201171875, -3.471435546875, -3.3072509765625, -3.14306640625, -2.9788818359375, -2.814697265625, -2.6505126953125, -2.486328125, -2.3221435546875, -2.157958984375, -1.9937744140625, -1.82958984375, -1.6654052734375, -1.501220703125, -1.3370361328125, -1.1728515625, -1.0086669921875, -0.844482421875, -0.6802978515625, -0.51611328125, -0.3519287109375, -0.187744140625, -0.0235595703125, 0.140625, 0.3048095703125, 0.468994140625, 0.6331787109375, 0.79736328125, 0.9615478515625, 1.125732421875, 1.2899169921875, 1.4541015625, 1.6182861328125, 1.782470703125, 1.9466552734375, 2.11083984375, 2.2750244140625, 2.439208984375, 2.6033935546875, 2.767578125, 2.9317626953125, 3.095947265625, 3.2601318359375, 3.42431640625, 3.5885009765625, 3.752685546875, 3.9168701171875, 4.0810546875, 4.2452392578125, 4.409423828125, 4.5736083984375, 4.73779296875, 4.9019775390625, 5.066162109375, 5.2303466796875, 5.39453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 10.0, 18.0, 19.0, 23.0, 20.0, 23.0, 27.0, 26.0, 33.0, 31.0, 39.0, 36.0, 47.0, 90.0, 149.0, 1531.0, 341.0, 117.0, 73.0, 45.0, 39.0, 50.0, 44.0, 26.0, 39.0, 27.0, 15.0, 17.0, 17.0, 16.0, 10.0, 7.0, 6.0, 2.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.171875, -14.662353515625, -14.15283203125, -13.643310546875, -13.1337890625, -12.624267578125, -12.11474609375, -11.605224609375, -11.095703125, -10.586181640625, -10.07666015625, -9.567138671875, -9.0576171875, -8.548095703125, -8.03857421875, -7.529052734375, -7.01953125, -6.510009765625, -6.00048828125, -5.490966796875, -4.9814453125, -4.471923828125, -3.96240234375, -3.452880859375, -2.943359375, -2.433837890625, -1.92431640625, -1.414794921875, -0.9052734375, -0.395751953125, 0.11376953125, 0.623291015625, 1.1328125, 1.642333984375, 2.15185546875, 2.661376953125, 3.1708984375, 3.680419921875, 4.18994140625, 4.699462890625, 5.208984375, 5.718505859375, 6.22802734375, 6.737548828125, 7.2470703125, 7.756591796875, 8.26611328125, 8.775634765625, 9.28515625, 9.794677734375, 10.30419921875, 10.813720703125, 11.3232421875, 11.832763671875, 12.34228515625, 12.851806640625, 13.361328125, 13.870849609375, 14.38037109375, 14.889892578125, 15.3994140625, 15.908935546875, 16.41845703125, 16.927978515625, 17.4375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 10.0, 8.0, 13.0, 17.0, 34.0, 34.0, 63.0, 80.0, 146.0, 263.0, 664.0, 2211.0, 3052158.0, 87672.0, 1258.0, 428.0, 228.0, 134.0, 101.0, 49.0, 35.0, 20.0, 20.0, 11.0, 9.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.4375, -76.048828125, -73.66015625, -71.271484375, -68.8828125, -66.494140625, -64.10546875, -61.716796875, -59.328125, -56.939453125, -54.55078125, -52.162109375, -49.7734375, -47.384765625, -44.99609375, -42.607421875, -40.21875, -37.830078125, -35.44140625, -33.052734375, -30.6640625, -28.275390625, -25.88671875, -23.498046875, -21.109375, -18.720703125, -16.33203125, -13.943359375, -11.5546875, -9.166015625, -6.77734375, -4.388671875, -2.0, 0.388671875, 2.77734375, 5.166015625, 7.5546875, 9.943359375, 12.33203125, 14.720703125, 17.109375, 19.498046875, 21.88671875, 24.275390625, 26.6640625, 29.052734375, 31.44140625, 33.830078125, 36.21875, 38.607421875, 40.99609375, 43.384765625, 45.7734375, 48.162109375, 50.55078125, 52.939453125, 55.328125, 57.716796875, 60.10546875, 62.494140625, 64.8828125, 67.271484375, 69.66015625, 72.048828125, 74.4375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 12.0, 43.0, 177.0, 315.0, 282.0, 141.0, 35.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.007919311523438, -26.525442123413086, -25.042964935302734, -23.560487747192383, -22.07801055908203, -20.59553337097168, -19.113056182861328, -17.63058090209961, -16.148101806640625, -14.665624618530273, -13.183147430419922, -11.70067024230957, -10.218193054199219, -8.735715866088867, -7.253239631652832, -5.7707624435424805, -4.288286209106445, -2.8058090209960938, -1.3233320713043213, 0.15914487838745117, 1.6416220664978027, 3.1240992546081543, 4.606575965881348, 6.089053153991699, 7.571530342102051, 9.054007530212402, 10.536484718322754, 12.018960952758789, 13.50143814086914, 14.983915328979492, 16.466392517089844, 17.948869705200195, 19.431346893310547, 20.9138240814209, 22.39630126953125, 23.8787784576416, 25.361255645751953, 26.843732833862305, 28.326210021972656, 29.808685302734375, 31.29116439819336, 32.77363967895508, 34.25611877441406, 35.73859405517578, 37.221073150634766, 38.703548431396484, 40.18602752685547, 41.66850280761719, 43.150978088378906, 44.633453369140625, 46.11593246459961, 47.59840774536133, 49.08088684082031, 50.56336212158203, 52.045841217041016, 53.528316497802734, 55.01079559326172, 56.49327087402344, 57.97574996948242, 59.45822525024414, 60.940704345703125, 62.423179626464844, 63.90565872192383, 65.38813781738281, 66.87061309814453]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 6.0, 14.0, 12.0, 16.0, 16.0, 17.0, 22.0, 29.0, 23.0, 19.0, 31.0, 36.0, 26.0, 40.0, 42.0, 41.0, 39.0, 45.0, 46.0, 44.0, 35.0, 41.0, 40.0, 36.0, 20.0, 31.0, 29.0, 33.0, 17.0, 24.0, 29.0, 13.0, 4.0, 12.0, 15.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.497459411621094, -36.32136917114258, -35.14528274536133, -33.96919250488281, -32.79310607910156, -31.617015838623047, -30.44092559814453, -29.26483726501465, -28.088748931884766, -26.912660598754883, -25.736572265625, -24.560482025146484, -23.3843936920166, -22.20830535888672, -21.032215118408203, -19.85612678527832, -18.680038452148438, -17.503950119018555, -16.327861785888672, -15.151771545410156, -13.975683212280273, -12.79959487915039, -11.623505592346191, -10.447416305541992, -9.27132797241211, -8.095239639282227, -6.919150352478027, -5.743061542510986, -4.566972732543945, -3.3908839225769043, -2.2147951126098633, -1.038705825805664, 0.13738250732421875, 1.3134713172912598, 2.489560127258301, 3.665648937225342, 4.841737747192383, 6.017826557159424, 7.193915367126465, 8.370004653930664, 9.546092987060547, 10.72218132019043, 11.898270606994629, 13.074359893798828, 14.250448226928711, 15.426536560058594, 16.60262680053711, 17.778715133666992, 18.954803466796875, 20.130891799926758, 21.30698013305664, 22.483070373535156, 23.65915870666504, 24.835247039794922, 26.011337280273438, 27.18742561340332, 28.363513946533203, 29.539602279663086, 30.71569061279297, 31.891780853271484, 33.06787109375, 34.24395751953125, 35.420047760009766, 36.59613800048828, 37.77222442626953]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 6.0, 10.0, 10.0, 12.0, 14.0, 11.0, 17.0, 18.0, 23.0, 29.0, 34.0, 22.0, 37.0, 29.0, 32.0, 34.0, 42.0, 43.0, 40.0, 41.0, 39.0, 27.0, 38.0, 39.0, 29.0, 32.0, 27.0, 23.0, 24.0, 28.0, 19.0, 25.0, 25.0, 14.0, 19.0, 11.0, 10.0, 6.0, 8.0, 7.0, 1.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.953125, -4.79815673828125, -4.6431884765625, -4.48822021484375, -4.333251953125, -4.17828369140625, -4.0233154296875, -3.86834716796875, -3.71337890625, -3.55841064453125, -3.4034423828125, -3.24847412109375, -3.093505859375, -2.93853759765625, -2.7835693359375, -2.62860107421875, -2.4736328125, -2.31866455078125, -2.1636962890625, -2.00872802734375, -1.853759765625, -1.69879150390625, -1.5438232421875, -1.38885498046875, -1.23388671875, -1.07891845703125, -0.9239501953125, -0.76898193359375, -0.614013671875, -0.45904541015625, -0.3040771484375, -0.14910888671875, 0.005859375, 0.16082763671875, 0.3157958984375, 0.47076416015625, 0.625732421875, 0.78070068359375, 0.9356689453125, 1.09063720703125, 1.24560546875, 1.40057373046875, 1.5555419921875, 1.71051025390625, 1.865478515625, 2.02044677734375, 2.1754150390625, 2.33038330078125, 2.4853515625, 2.64031982421875, 2.7952880859375, 2.95025634765625, 3.105224609375, 3.26019287109375, 3.4151611328125, 3.57012939453125, 3.72509765625, 3.88006591796875, 4.0350341796875, 4.19000244140625, 4.344970703125, 4.49993896484375, 4.6549072265625, 4.80987548828125, 4.96484375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 4.0, 7.0, 14.0, 13.0, 14.0, 21.0, 18.0, 42.0, 31.0, 34.0, 58.0, 72.0, 62.0, 96.0, 120.0, 148.0, 248.0, 647.0, 3751.0, 81023.0, 2138497.0, 1905398.0, 58982.0, 3386.0, 625.0, 218.0, 130.0, 119.0, 80.0, 57.0, 56.0, 41.0, 48.0, 41.0, 30.0, 22.0, 25.0, 21.0, 19.0, 4.0, 8.0, 5.0, 6.0, 10.0, 7.0, 1.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0], "bins": [-16.125, -15.6358642578125, -15.146728515625, -14.6575927734375, -14.16845703125, -13.6793212890625, -13.190185546875, -12.7010498046875, -12.2119140625, -11.7227783203125, -11.233642578125, -10.7445068359375, -10.25537109375, -9.7662353515625, -9.277099609375, -8.7879638671875, -8.298828125, -7.8096923828125, -7.320556640625, -6.8314208984375, -6.34228515625, -5.8531494140625, -5.364013671875, -4.8748779296875, -4.3857421875, -3.8966064453125, -3.407470703125, -2.9183349609375, -2.42919921875, -1.9400634765625, -1.450927734375, -0.9617919921875, -0.47265625, 0.0164794921875, 0.505615234375, 0.9947509765625, 1.48388671875, 1.9730224609375, 2.462158203125, 2.9512939453125, 3.4404296875, 3.9295654296875, 4.418701171875, 4.9078369140625, 5.39697265625, 5.8861083984375, 6.375244140625, 6.8643798828125, 7.353515625, 7.8426513671875, 8.331787109375, 8.8209228515625, 9.31005859375, 9.7991943359375, 10.288330078125, 10.7774658203125, 11.2666015625, 11.7557373046875, 12.244873046875, 12.7340087890625, 13.22314453125, 13.7122802734375, 14.201416015625, 14.6905517578125, 15.1796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 11.0, 8.0, 18.0, 21.0, 34.0, 51.0, 48.0, 70.0, 103.0, 165.0, 220.0, 313.0, 406.0, 490.0, 536.0, 415.0, 314.0, 219.0, 175.0, 126.0, 69.0, 61.0, 40.0, 40.0, 26.0, 16.0, 20.0, 9.0, 5.0, 8.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0], "bins": [-13.6796875, -13.3472900390625, -13.014892578125, -12.6824951171875, -12.35009765625, -12.0177001953125, -11.685302734375, -11.3529052734375, -11.0205078125, -10.6881103515625, -10.355712890625, -10.0233154296875, -9.69091796875, -9.3585205078125, -9.026123046875, -8.6937255859375, -8.361328125, -8.0289306640625, -7.696533203125, -7.3641357421875, -7.03173828125, -6.6993408203125, -6.366943359375, -6.0345458984375, -5.7021484375, -5.3697509765625, -5.037353515625, -4.7049560546875, -4.37255859375, -4.0401611328125, -3.707763671875, -3.3753662109375, -3.04296875, -2.7105712890625, -2.378173828125, -2.0457763671875, -1.71337890625, -1.3809814453125, -1.048583984375, -0.7161865234375, -0.3837890625, -0.0513916015625, 0.281005859375, 0.6134033203125, 0.94580078125, 1.2781982421875, 1.610595703125, 1.9429931640625, 2.275390625, 2.6077880859375, 2.940185546875, 3.2725830078125, 3.60498046875, 3.9373779296875, 4.269775390625, 4.6021728515625, 4.9345703125, 5.2669677734375, 5.599365234375, 5.9317626953125, 6.26416015625, 6.5965576171875, 6.928955078125, 7.2613525390625, 7.59375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 9.0, 1.0, 12.0, 12.0, 14.0, 19.0, 15.0, 49.0, 58.0, 73.0, 106.0, 154.0, 219.0, 349.0, 469.0, 1420.0, 970654.0, 3216737.0, 2201.0, 537.0, 351.0, 262.0, 168.0, 124.0, 73.0, 60.0, 34.0, 37.0, 18.0, 14.0, 8.0, 12.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.875, -42.052734375, -40.23046875, -38.408203125, -36.5859375, -34.763671875, -32.94140625, -31.119140625, -29.296875, -27.474609375, -25.65234375, -23.830078125, -22.0078125, -20.185546875, -18.36328125, -16.541015625, -14.71875, -12.896484375, -11.07421875, -9.251953125, -7.4296875, -5.607421875, -3.78515625, -1.962890625, -0.140625, 1.681640625, 3.50390625, 5.326171875, 7.1484375, 8.970703125, 10.79296875, 12.615234375, 14.4375, 16.259765625, 18.08203125, 19.904296875, 21.7265625, 23.548828125, 25.37109375, 27.193359375, 29.015625, 30.837890625, 32.66015625, 34.482421875, 36.3046875, 38.126953125, 39.94921875, 41.771484375, 43.59375, 45.416015625, 47.23828125, 49.060546875, 50.8828125, 52.705078125, 54.52734375, 56.349609375, 58.171875, 59.994140625, 61.81640625, 63.638671875, 65.4609375, 67.283203125, 69.10546875, 70.927734375, 72.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 5.0, 37.0, 73.0, 142.0, 174.0, 195.0, 149.0, 102.0, 72.0, 28.0, 18.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.84767532348633, -57.087432861328125, -55.32719039916992, -53.56694793701172, -51.80670928955078, -50.04646682739258, -48.286224365234375, -46.52598190307617, -44.76573944091797, -43.005496978759766, -41.24525451660156, -39.485015869140625, -37.72477340698242, -35.96453094482422, -34.204288482666016, -32.44404602050781, -30.683805465698242, -28.92356300354004, -27.16332244873047, -25.403079986572266, -23.642837524414062, -21.88259506225586, -20.12235450744629, -18.362112045288086, -16.601871490478516, -14.841629981994629, -13.081387519836426, -11.321146011352539, -9.560903549194336, -7.800662040710449, -6.0404205322265625, -4.280178070068359, -2.5199356079101562, -0.7596937417984009, 1.0005481243133545, 2.7607898712158203, 4.521031856536865, 6.28127384185791, 8.041515350341797, 9.8017578125, 11.561999320983887, 13.322240829467773, 15.082483291625977, 16.842723846435547, 18.60296630859375, 20.363208770751953, 22.123451232910156, 23.88369369506836, 25.64393424987793, 27.404176712036133, 29.164417266845703, 30.924659729003906, 32.68490219116211, 34.44514465332031, 36.20538330078125, 37.96562957763672, 39.725868225097656, 41.48611068725586, 43.24635314941406, 45.006591796875, 46.7668342590332, 48.527076721191406, 50.28731918334961, 52.04756164550781, 53.807804107666016]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 3.0, 6.0, 8.0, 5.0, 6.0, 14.0, 14.0, 19.0, 23.0, 18.0, 19.0, 35.0, 22.0, 43.0, 29.0, 49.0, 38.0, 38.0, 45.0, 39.0, 43.0, 43.0, 44.0, 49.0, 40.0, 32.0, 26.0, 24.0, 35.0, 28.0, 27.0, 14.0, 22.0, 19.0, 15.0, 16.0, 8.0, 7.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.35517883300781, -31.319854736328125, -30.284530639648438, -29.24920654296875, -28.213882446289062, -27.178558349609375, -26.143234252929688, -25.10791015625, -24.072586059570312, -23.037261962890625, -22.001937866210938, -20.96661376953125, -19.931289672851562, -18.895965576171875, -17.860641479492188, -16.8253173828125, -15.78999137878418, -14.754667282104492, -13.719343185424805, -12.684019088745117, -11.64869499206543, -10.613370895385742, -9.578045845031738, -8.54272174835205, -7.507397651672363, -6.472073554992676, -5.436749458312988, -4.401424884796143, -3.366100788116455, -2.3307766914367676, -1.2954521179199219, -0.2601280212402344, 0.7751960754394531, 1.8105202913284302, 2.8458445072174072, 3.881168842315674, 4.916492938995361, 5.951817035675049, 6.9871416091918945, 8.022465705871582, 9.05778980255127, 10.093113899230957, 11.128437995910645, 12.163763046264648, 13.199087142944336, 14.234411239624023, 15.269735336303711, 16.3050594329834, 17.340383529663086, 18.375707626342773, 19.41103172302246, 20.44635581970215, 21.481679916381836, 22.517004013061523, 23.552330017089844, 24.58765411376953, 25.62297821044922, 26.658302307128906, 27.693626403808594, 28.72895050048828, 29.76427459716797, 30.799598693847656, 31.834922790527344, 32.87024688720703, 33.90557098388672]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 16.0, 15.0, 15.0, 17.0, 20.0, 23.0, 32.0, 31.0, 33.0, 29.0, 48.0, 47.0, 39.0, 55.0, 35.0, 64.0, 44.0, 41.0, 44.0, 34.0, 32.0, 22.0, 38.0, 29.0, 21.0, 19.0, 19.0, 23.0, 13.0, 17.0, 20.0, 9.0, 7.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.71435546875, -5.5263671875, -5.33837890625, -5.150390625, -4.96240234375, -4.7744140625, -4.58642578125, -4.3984375, -4.21044921875, -4.0224609375, -3.83447265625, -3.646484375, -3.45849609375, -3.2705078125, -3.08251953125, -2.89453125, -2.70654296875, -2.5185546875, -2.33056640625, -2.142578125, -1.95458984375, -1.7666015625, -1.57861328125, -1.390625, -1.20263671875, -1.0146484375, -0.82666015625, -0.638671875, -0.45068359375, -0.2626953125, -0.07470703125, 0.11328125, 0.30126953125, 0.4892578125, 0.67724609375, 0.865234375, 1.05322265625, 1.2412109375, 1.42919921875, 1.6171875, 1.80517578125, 1.9931640625, 2.18115234375, 2.369140625, 2.55712890625, 2.7451171875, 2.93310546875, 3.12109375, 3.30908203125, 3.4970703125, 3.68505859375, 3.873046875, 4.06103515625, 4.2490234375, 4.43701171875, 4.625, 4.81298828125, 5.0009765625, 5.18896484375, 5.376953125, 5.56494140625, 5.7529296875, 5.94091796875, 6.12890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 16.0, 21.0, 30.0, 38.0, 75.0, 89.0, 148.0, 207.0, 333.0, 476.0, 735.0, 1115.0, 1641.0, 2467.0, 3497.0, 5220.0, 7608.0, 11087.0, 16476.0, 24441.0, 37919.0, 61873.0, 109091.0, 269082.0, 225652.0, 101573.0, 58652.0, 36025.0, 23784.0, 15793.0, 10618.0, 7294.0, 5023.0, 3407.0, 2305.0, 1556.0, 1032.0, 722.0, 487.0, 312.0, 199.0, 140.0, 97.0, 65.0, 45.0, 24.0, 19.0, 20.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.1767578125, -1.139923095703125, -1.10308837890625, -1.066253662109375, -1.0294189453125, -0.992584228515625, -0.95574951171875, -0.918914794921875, -0.882080078125, -0.845245361328125, -0.80841064453125, -0.771575927734375, -0.7347412109375, -0.697906494140625, -0.66107177734375, -0.624237060546875, -0.58740234375, -0.550567626953125, -0.51373291015625, -0.476898193359375, -0.4400634765625, -0.403228759765625, -0.36639404296875, -0.329559326171875, -0.292724609375, -0.255889892578125, -0.21905517578125, -0.182220458984375, -0.1453857421875, -0.108551025390625, -0.07171630859375, -0.034881591796875, 0.001953125, 0.038787841796875, 0.07562255859375, 0.112457275390625, 0.1492919921875, 0.186126708984375, 0.22296142578125, 0.259796142578125, 0.296630859375, 0.333465576171875, 0.37030029296875, 0.407135009765625, 0.4439697265625, 0.480804443359375, 0.51763916015625, 0.554473876953125, 0.59130859375, 0.628143310546875, 0.66497802734375, 0.701812744140625, 0.7386474609375, 0.775482177734375, 0.81231689453125, 0.849151611328125, 0.885986328125, 0.922821044921875, 0.95965576171875, 0.996490478515625, 1.0333251953125, 1.070159912109375, 1.10699462890625, 1.143829345703125, 1.1806640625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 11.0, 11.0, 6.0, 15.0, 12.0, 19.0, 20.0, 19.0, 24.0, 23.0, 32.0, 36.0, 24.0, 36.0, 27.0, 28.0, 21.0, 36.0, 44.0, 1061.0, 31.0, 39.0, 45.0, 30.0, 38.0, 26.0, 37.0, 29.0, 22.0, 18.0, 27.0, 26.0, 16.0, 16.0, 16.0, 12.0, 8.0, 9.0, 11.0, 8.0, 8.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-3.189453125, -3.0904541015625, -2.991455078125, -2.8924560546875, -2.79345703125, -2.6944580078125, -2.595458984375, -2.4964599609375, -2.3974609375, -2.2984619140625, -2.199462890625, -2.1004638671875, -2.00146484375, -1.9024658203125, -1.803466796875, -1.7044677734375, -1.60546875, -1.5064697265625, -1.407470703125, -1.3084716796875, -1.20947265625, -1.1104736328125, -1.011474609375, -0.9124755859375, -0.8134765625, -0.7144775390625, -0.615478515625, -0.5164794921875, -0.41748046875, -0.3184814453125, -0.219482421875, -0.1204833984375, -0.021484375, 0.0775146484375, 0.176513671875, 0.2755126953125, 0.37451171875, 0.4735107421875, 0.572509765625, 0.6715087890625, 0.7705078125, 0.8695068359375, 0.968505859375, 1.0675048828125, 1.16650390625, 1.2655029296875, 1.364501953125, 1.4635009765625, 1.5625, 1.6614990234375, 1.760498046875, 1.8594970703125, 1.95849609375, 2.0574951171875, 2.156494140625, 2.2554931640625, 2.3544921875, 2.4534912109375, 2.552490234375, 2.6514892578125, 2.75048828125, 2.8494873046875, 2.948486328125, 3.0474853515625, 3.146484375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 12.0, 13.0, 18.0, 32.0, 40.0, 52.0, 66.0, 100.0, 145.0, 225.0, 329.0, 490.0, 710.0, 1110.0, 1573.0, 2559.0, 3764.0, 5677.0, 8988.0, 14009.0, 22290.0, 37018.0, 62319.0, 108298.0, 1323308.0, 244511.0, 104416.0, 59297.0, 35363.0, 21661.0, 13663.0, 8726.0, 5518.0, 3579.0, 2458.0, 1590.0, 1019.0, 707.0, 475.0, 335.0, 220.0, 137.0, 94.0, 72.0, 49.0, 20.0, 32.0, 12.0, 13.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.28125, -1.2411651611328125, -1.201080322265625, -1.1609954833984375, -1.12091064453125, -1.0808258056640625, -1.040740966796875, -1.0006561279296875, -0.9605712890625, -0.9204864501953125, -0.880401611328125, -0.8403167724609375, -0.80023193359375, -0.7601470947265625, -0.720062255859375, -0.6799774169921875, -0.639892578125, -0.5998077392578125, -0.559722900390625, -0.5196380615234375, -0.47955322265625, -0.4394683837890625, -0.399383544921875, -0.3592987060546875, -0.3192138671875, -0.2791290283203125, -0.239044189453125, -0.1989593505859375, -0.15887451171875, -0.1187896728515625, -0.078704833984375, -0.0386199951171875, 0.00146484375, 0.0415496826171875, 0.081634521484375, 0.1217193603515625, 0.16180419921875, 0.2018890380859375, 0.241973876953125, 0.2820587158203125, 0.3221435546875, 0.3622283935546875, 0.402313232421875, 0.4423980712890625, 0.48248291015625, 0.5225677490234375, 0.562652587890625, 0.6027374267578125, 0.642822265625, 0.6829071044921875, 0.722991943359375, 0.7630767822265625, 0.80316162109375, 0.8432464599609375, 0.883331298828125, 0.9234161376953125, 0.9635009765625, 1.0035858154296875, 1.043670654296875, 1.0837554931640625, 1.12384033203125, 1.1639251708984375, 1.204010009765625, 1.2440948486328125, 1.2841796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 11.0, 4.0, 5.0, 10.0, 7.0, 14.0, 10.0, 23.0, 13.0, 30.0, 24.0, 31.0, 32.0, 36.0, 53.0, 72.0, 74.0, 73.0, 75.0, 65.0, 60.0, 51.0, 29.0, 21.0, 36.0, 18.0, 22.0, 21.0, 6.0, 5.0, 15.0, 9.0, 7.0, 11.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.000698089599609375, -0.0006785765290260315, -0.000659063458442688, -0.0006395503878593445, -0.000620037317276001, -0.0006005242466926575, -0.000581011176109314, -0.0005614981055259705, -0.000541985034942627, -0.0005224719643592834, -0.0005029588937759399, -0.00048344582319259644, -0.00046393275260925293, -0.0004444196820259094, -0.0004249066114425659, -0.0004053935408592224, -0.0003858804702758789, -0.0003663673996925354, -0.0003468543291091919, -0.0003273412585258484, -0.0003078281879425049, -0.0002883151173591614, -0.00026880204677581787, -0.00024928897619247437, -0.00022977590560913086, -0.00021026283502578735, -0.00019074976444244385, -0.00017123669385910034, -0.00015172362327575684, -0.00013221055269241333, -0.00011269748210906982, -9.318441152572632e-05, -7.367134094238281e-05, -5.415827035903931e-05, -3.46451997756958e-05, -1.5132129192352295e-05, 4.380941390991211e-06, 2.3894011974334717e-05, 4.340708255767822e-05, 6.292015314102173e-05, 8.243322372436523e-05, 0.00010194629430770874, 0.00012145936489105225, 0.00014097243547439575, 0.00016048550605773926, 0.00017999857664108276, 0.00019951164722442627, 0.00021902471780776978, 0.00023853778839111328, 0.0002580508589744568, 0.0002775639295578003, 0.0002970770001411438, 0.0003165900707244873, 0.0003361031413078308, 0.0003556162118911743, 0.0003751292824745178, 0.00039464235305786133, 0.00041415542364120483, 0.00043366849422454834, 0.00045318156480789185, 0.00047269463539123535, 0.0004922077059745789, 0.0005117207765579224, 0.0005312338471412659, 0.0005507469177246094]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 7.0, 10.0, 4.0, 14.0, 6.0, 17.0, 12.0, 9.0, 18.0, 32.0, 29.0, 38.0, 43.0, 71.0, 88.0, 119.0, 210.0, 351.0, 1068.0, 50831.0, 988123.0, 5881.0, 604.0, 287.0, 188.0, 114.0, 88.0, 54.0, 56.0, 33.0, 27.0, 31.0, 18.0, 16.0, 16.0, 7.0, 10.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01131439208984375, -0.010900020599365234, -0.010485649108886719, -0.010071277618408203, -0.009656906127929688, -0.009242534637451172, -0.008828163146972656, -0.00841379165649414, -0.007999420166015625, -0.007585048675537109, -0.007170677185058594, -0.006756305694580078, -0.0063419342041015625, -0.005927562713623047, -0.005513191223144531, -0.005098819732666016, -0.0046844482421875, -0.004270076751708984, -0.0038557052612304688, -0.003441333770751953, -0.0030269622802734375, -0.002612590789794922, -0.0021982192993164062, -0.0017838478088378906, -0.001369476318359375, -0.0009551048278808594, -0.0005407333374023438, -0.00012636184692382812, 0.0002880096435546875, 0.0007023811340332031, 0.0011167526245117188, 0.0015311241149902344, 0.00194549560546875, 0.0023598670959472656, 0.0027742385864257812, 0.003188610076904297, 0.0036029815673828125, 0.004017353057861328, 0.004431724548339844, 0.004846096038818359, 0.005260467529296875, 0.005674839019775391, 0.006089210510253906, 0.006503582000732422, 0.0069179534912109375, 0.007332324981689453, 0.007746696472167969, 0.008161067962646484, 0.008575439453125, 0.008989810943603516, 0.009404182434082031, 0.009818553924560547, 0.010232925415039062, 0.010647296905517578, 0.011061668395996094, 0.01147603988647461, 0.011890411376953125, 0.01230478286743164, 0.012719154357910156, 0.013133525848388672, 0.013547897338867188, 0.013962268829345703, 0.014376640319824219, 0.014791011810302734, 0.01520538330078125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 13.0, 59.0, 255.0, 403.0, 209.0, 58.0, 13.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000501918257214129, -0.0004538766806945205, -0.000405835104174912, -0.00035779355675913393, -0.00030975198023952544, -0.00026171040371991694, -0.0002136688563041389, -0.0001656272797845304, -0.0001175857032649219, -6.954413402127102e-05, -2.1502564777620137e-05, 2.6538997190073133e-05, 7.458057370968163e-05, 0.00012262215022929013, 0.00017066369764506817, 0.00021870527416467667, 0.00026674685068428516, 0.00031478842720389366, 0.00036283000372350216, 0.0004108715511392802, 0.0004589131276588887, 0.0005069547332823277, 0.0005549962515942752, 0.0006030378281138837, 0.0006510794046334922, 0.0006991209811531007, 0.0007471625576727092, 0.0007952040759846568, 0.0008432456525042653, 0.0008912872290238738, 0.0009393288055434823, 0.0009873703820630908, 0.0010354118421673775, 0.001083453418686986, 0.0011314949952065945, 0.001179536571726203, 0.0012275781482458115, 0.00127561972476542, 0.0013236613012850285, 0.001371702877804637, 0.0014197444543242455, 0.001467786030843854, 0.0015158276073634624, 0.001563869183883071, 0.0016119107604026794, 0.001659952336922288, 0.0017079939134418964, 0.001756035489961505, 0.0018040769500657916, 0.0018521185265854, 0.0019001601031050086, 0.001948201679624617, 0.0019962431397289038, 0.0020442847162485123, 0.0020923262927681208, 0.0021403678692877293, 0.0021884094458073378, 0.0022364510223269463, 0.0022844925988465548, 0.0023325341753661633, 0.0023805757518857718, 0.0024286173284053802, 0.0024766589049249887, 0.0025247004814445972, 0.0025727420579642057]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 12.0, 11.0, 19.0, 15.0, 20.0, 17.0, 28.0, 21.0, 23.0, 32.0, 33.0, 47.0, 48.0, 40.0, 34.0, 47.0, 44.0, 37.0, 43.0, 42.0, 42.0, 46.0, 40.0, 44.0, 34.0, 25.0, 25.0, 22.0, 16.0, 15.0, 14.0, 8.0, 13.0, 8.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003611445426940918, -0.00034975167363882065, -0.0003383588045835495, -0.00032696593552827835, -0.0003155730664730072, -0.00030418019741773605, -0.0002927873283624649, -0.00028139445930719376, -0.0002700015902519226, -0.00025860872119665146, -0.0002472158521413803, -0.00023582298308610916, -0.000224430114030838, -0.00021303724497556686, -0.00020164437592029572, -0.00019025150686502457, -0.00017885863780975342, -0.00016746576875448227, -0.00015607289969921112, -0.00014468003064393997, -0.00013328716158866882, -0.00012189429253339767, -0.00011050142347812653, -9.910855442285538e-05, -8.771568536758423e-05, -7.632281631231308e-05, -6.492994725704193e-05, -5.353707820177078e-05, -4.2144209146499634e-05, -3.0751340091228485e-05, -1.9358471035957336e-05, -7.965601980686188e-06, 3.427267074584961e-06, 1.482013612985611e-05, 2.6213005185127258e-05, 3.760587424039841e-05, 4.8998743295669556e-05, 6.0391612350940704e-05, 7.178448140621185e-05, 8.3177350461483e-05, 9.457021951675415e-05, 0.0001059630885720253, 0.00011735595762729645, 0.0001287488266825676, 0.00014014169573783875, 0.0001515345647931099, 0.00016292743384838104, 0.0001743203029036522, 0.00018571317195892334, 0.0001971060410141945, 0.00020849891006946564, 0.00021989177912473679, 0.00023128464818000793, 0.00024267751723527908, 0.00025407038629055023, 0.0002654632553458214, 0.00027685612440109253, 0.0002882489934563637, 0.0002996418625116348, 0.000311034731566906, 0.0003224276006221771, 0.00033382046967744827, 0.0003452133387327194, 0.00035660620778799057, 0.0003679990768432617]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 16.0, 15.0, 15.0, 17.0, 20.0, 23.0, 32.0, 31.0, 33.0, 29.0, 48.0, 47.0, 39.0, 55.0, 35.0, 64.0, 44.0, 41.0, 44.0, 34.0, 32.0, 22.0, 38.0, 29.0, 21.0, 19.0, 19.0, 23.0, 13.0, 17.0, 20.0, 9.0, 7.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.71435546875, -5.5263671875, -5.33837890625, -5.150390625, -4.96240234375, -4.7744140625, -4.58642578125, -4.3984375, -4.21044921875, -4.0224609375, -3.83447265625, -3.646484375, -3.45849609375, -3.2705078125, -3.08251953125, -2.89453125, -2.70654296875, -2.5185546875, -2.33056640625, -2.142578125, -1.95458984375, -1.7666015625, -1.57861328125, -1.390625, -1.20263671875, -1.0146484375, -0.82666015625, -0.638671875, -0.45068359375, -0.2626953125, -0.07470703125, 0.11328125, 0.30126953125, 0.4892578125, 0.67724609375, 0.865234375, 1.05322265625, 1.2412109375, 1.42919921875, 1.6171875, 1.80517578125, 1.9931640625, 2.18115234375, 2.369140625, 2.55712890625, 2.7451171875, 2.93310546875, 3.12109375, 3.30908203125, 3.4970703125, 3.68505859375, 3.873046875, 4.06103515625, 4.2490234375, 4.43701171875, 4.625, 4.81298828125, 5.0009765625, 5.18896484375, 5.376953125, 5.56494140625, 5.7529296875, 5.94091796875, 6.12890625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 14.0, 14.0, 15.0, 23.0, 30.0, 37.0, 49.0, 71.0, 93.0, 149.0, 190.0, 335.0, 560.0, 1276.0, 6148.0, 54057.0, 604802.0, 341368.0, 32927.0, 3951.0, 1046.0, 470.0, 292.0, 154.0, 116.0, 87.0, 63.0, 45.0, 33.0, 29.0, 23.0, 19.0, 15.0, 9.0, 10.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.234375, -11.8507080078125, -11.467041015625, -11.0833740234375, -10.69970703125, -10.3160400390625, -9.932373046875, -9.5487060546875, -9.1650390625, -8.7813720703125, -8.397705078125, -8.0140380859375, -7.63037109375, -7.2467041015625, -6.863037109375, -6.4793701171875, -6.095703125, -5.7120361328125, -5.328369140625, -4.9447021484375, -4.56103515625, -4.1773681640625, -3.793701171875, -3.4100341796875, -3.0263671875, -2.6427001953125, -2.259033203125, -1.8753662109375, -1.49169921875, -1.1080322265625, -0.724365234375, -0.3406982421875, 0.04296875, 0.4266357421875, 0.810302734375, 1.1939697265625, 1.57763671875, 1.9613037109375, 2.344970703125, 2.7286376953125, 3.1123046875, 3.4959716796875, 3.879638671875, 4.2633056640625, 4.64697265625, 5.0306396484375, 5.414306640625, 5.7979736328125, 6.181640625, 6.5653076171875, 6.948974609375, 7.3326416015625, 7.71630859375, 8.0999755859375, 8.483642578125, 8.8673095703125, 9.2509765625, 9.6346435546875, 10.018310546875, 10.4019775390625, 10.78564453125, 11.1693115234375, 11.552978515625, 11.9366455078125, 12.3203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 9.0, 2.0, 6.0, 13.0, 8.0, 10.0, 12.0, 7.0, 15.0, 23.0, 24.0, 35.0, 28.0, 27.0, 39.0, 38.0, 65.0, 82.0, 129.0, 270.0, 1522.0, 198.0, 87.0, 63.0, 47.0, 39.0, 29.0, 32.0, 28.0, 25.0, 24.0, 18.0, 21.0, 18.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.896484375, -16.27734375, -15.658203125, -15.0390625, -14.419921875, -13.80078125, -13.181640625, -12.5625, -11.943359375, -11.32421875, -10.705078125, -10.0859375, -9.466796875, -8.84765625, -8.228515625, -7.609375, -6.990234375, -6.37109375, -5.751953125, -5.1328125, -4.513671875, -3.89453125, -3.275390625, -2.65625, -2.037109375, -1.41796875, -0.798828125, -0.1796875, 0.439453125, 1.05859375, 1.677734375, 2.296875, 2.916015625, 3.53515625, 4.154296875, 4.7734375, 5.392578125, 6.01171875, 6.630859375, 7.25, 7.869140625, 8.48828125, 9.107421875, 9.7265625, 10.345703125, 10.96484375, 11.583984375, 12.203125, 12.822265625, 13.44140625, 14.060546875, 14.6796875, 15.298828125, 15.91796875, 16.537109375, 17.15625, 17.775390625, 18.39453125, 19.013671875, 19.6328125, 20.251953125, 20.87109375, 21.490234375, 22.109375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 7.0, 13.0, 8.0, 14.0, 18.0, 26.0, 28.0, 36.0, 40.0, 48.0, 55.0, 60.0, 102.0, 161.0, 314.0, 702.0, 2784.0, 2777525.0, 360385.0, 1916.0, 549.0, 259.0, 165.0, 89.0, 74.0, 62.0, 57.0, 38.0, 30.0, 24.0, 14.0, 12.0, 23.0, 14.0, 14.0, 4.0, 5.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.8125, -62.90087890625, -60.9892578125, -59.07763671875, -57.166015625, -55.25439453125, -53.3427734375, -51.43115234375, -49.51953125, -47.60791015625, -45.6962890625, -43.78466796875, -41.873046875, -39.96142578125, -38.0498046875, -36.13818359375, -34.2265625, -32.31494140625, -30.4033203125, -28.49169921875, -26.580078125, -24.66845703125, -22.7568359375, -20.84521484375, -18.93359375, -17.02197265625, -15.1103515625, -13.19873046875, -11.287109375, -9.37548828125, -7.4638671875, -5.55224609375, -3.640625, -1.72900390625, 0.1826171875, 2.09423828125, 4.005859375, 5.91748046875, 7.8291015625, 9.74072265625, 11.65234375, 13.56396484375, 15.4755859375, 17.38720703125, 19.298828125, 21.21044921875, 23.1220703125, 25.03369140625, 26.9453125, 28.85693359375, 30.7685546875, 32.68017578125, 34.591796875, 36.50341796875, 38.4150390625, 40.32666015625, 42.23828125, 44.14990234375, 46.0615234375, 47.97314453125, 49.884765625, 51.79638671875, 53.7080078125, 55.61962890625, 57.53125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 10.0, 62.0, 220.0, 342.0, 266.0, 88.0, 21.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.037247657775879, -7.4186272621154785, -5.800006866455078, -4.181386947631836, -2.5627665519714355, -0.9441461563110352, 0.674473762512207, 2.2930946350097656, 3.911714553833008, 5.530334949493408, 7.148955345153809, 8.76757526397705, 10.38619613647461, 12.004816055297852, 13.623435974121094, 15.242056846618652, 16.860675811767578, 18.47929573059082, 20.097915649414062, 21.716537475585938, 23.33515739440918, 24.953777313232422, 26.572397232055664, 28.191017150878906, 29.80963897705078, 31.428258895874023, 33.046878814697266, 34.66550064086914, 36.28411865234375, 37.902740478515625, 39.5213623046875, 41.13998031616211, 42.758602142333984, 44.37722396850586, 45.99584197998047, 47.614463806152344, 49.23308181762695, 50.85170364379883, 52.47032165527344, 54.08894348144531, 55.70756530761719, 57.32618713378906, 58.94480514526367, 60.56342697143555, 62.182044982910156, 63.80066680908203, 65.4192886352539, 67.03791046142578, 68.65652465820312, 70.275146484375, 71.89376831054688, 73.51238250732422, 75.1310043334961, 76.74962615966797, 78.36824798583984, 79.98686981201172, 81.6054916381836, 83.22411346435547, 84.84273529052734, 86.46134948730469, 88.07997131347656, 89.69859313964844, 91.31721496582031, 92.93583679199219, 94.55445098876953]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 11.0, 16.0, 19.0, 11.0, 21.0, 14.0, 23.0, 35.0, 30.0, 27.0, 38.0, 46.0, 48.0, 46.0, 55.0, 43.0, 53.0, 39.0, 50.0, 46.0, 31.0, 45.0, 24.0, 38.0, 28.0, 24.0, 17.0, 22.0, 19.0, 15.0, 15.0, 16.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4478988647461, -62.54887390136719, -60.649845123291016, -58.75082015991211, -56.85179138183594, -54.95276641845703, -53.053741455078125, -51.15471267700195, -49.25568389892578, -47.356658935546875, -45.4576301574707, -43.5586051940918, -41.659576416015625, -39.76055145263672, -37.86152648925781, -35.96249771118164, -34.063472747802734, -32.16444778442383, -30.265419006347656, -28.36639404296875, -26.467365264892578, -24.568340301513672, -22.669313430786133, -20.770286560058594, -18.871259689331055, -16.972232818603516, -15.073205947875977, -13.174180030822754, -11.275153160095215, -9.376126289367676, -7.477100372314453, -5.578073501586914, -3.6790504455566406, -1.7800238132476807, 0.1190028190612793, 2.01802921295166, 3.917056083679199, 5.816082954406738, 7.715108871459961, 9.6141357421875, 11.513162612915039, 13.412189483642578, 15.311216354370117, 17.210243225097656, 19.109268188476562, 21.008296966552734, 22.90732192993164, 24.80634880065918, 26.70537567138672, 28.604402542114258, 30.503429412841797, 32.4024543762207, 34.301483154296875, 36.20050811767578, 38.09953308105469, 39.99856185913086, 41.89759063720703, 43.79661560058594, 45.69564437866211, 47.594669342041016, 49.49369812011719, 51.392723083496094, 53.291748046875, 55.19077682495117, 57.08980178833008]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 11.0, 10.0, 12.0, 11.0, 12.0, 5.0, 9.0, 23.0, 28.0, 20.0, 30.0, 34.0, 33.0, 34.0, 34.0, 33.0, 35.0, 29.0, 35.0, 47.0, 38.0, 41.0, 43.0, 38.0, 38.0, 29.0, 39.0, 25.0, 22.0, 30.0, 22.0, 20.0, 17.0, 13.0, 18.0, 17.0, 20.0, 6.0, 2.0, 10.0, 8.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.76953125, -5.57916259765625, -5.3887939453125, -5.19842529296875, -5.008056640625, -4.81768798828125, -4.6273193359375, -4.43695068359375, -4.24658203125, -4.05621337890625, -3.8658447265625, -3.67547607421875, -3.485107421875, -3.29473876953125, -3.1043701171875, -2.91400146484375, -2.7236328125, -2.53326416015625, -2.3428955078125, -2.15252685546875, -1.962158203125, -1.77178955078125, -1.5814208984375, -1.39105224609375, -1.20068359375, -1.01031494140625, -0.8199462890625, -0.62957763671875, -0.439208984375, -0.24884033203125, -0.0584716796875, 0.13189697265625, 0.322265625, 0.51263427734375, 0.7030029296875, 0.89337158203125, 1.083740234375, 1.27410888671875, 1.4644775390625, 1.65484619140625, 1.84521484375, 2.03558349609375, 2.2259521484375, 2.41632080078125, 2.606689453125, 2.79705810546875, 2.9874267578125, 3.17779541015625, 3.3681640625, 3.55853271484375, 3.7489013671875, 3.93927001953125, 4.129638671875, 4.32000732421875, 4.5103759765625, 4.70074462890625, 4.89111328125, 5.08148193359375, 5.2718505859375, 5.46221923828125, 5.652587890625, 5.84295654296875, 6.0333251953125, 6.22369384765625, 6.4140625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 8.0, 12.0, 10.0, 10.0, 24.0, 19.0, 28.0, 47.0, 39.0, 68.0, 100.0, 151.0, 233.0, 434.0, 856.0, 2191.0, 7648.0, 43566.0, 290943.0, 1193392.0, 1765672.0, 737662.0, 125201.0, 18413.0, 4368.0, 1468.0, 670.0, 386.0, 221.0, 107.0, 86.0, 62.0, 37.0, 21.0, 25.0, 23.0, 22.0, 9.0, 9.0, 8.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9765625, -6.711181640625, -6.44580078125, -6.180419921875, -5.9150390625, -5.649658203125, -5.38427734375, -5.118896484375, -4.853515625, -4.588134765625, -4.32275390625, -4.057373046875, -3.7919921875, -3.526611328125, -3.26123046875, -2.995849609375, -2.73046875, -2.465087890625, -2.19970703125, -1.934326171875, -1.6689453125, -1.403564453125, -1.13818359375, -0.872802734375, -0.607421875, -0.342041015625, -0.07666015625, 0.188720703125, 0.4541015625, 0.719482421875, 0.98486328125, 1.250244140625, 1.515625, 1.781005859375, 2.04638671875, 2.311767578125, 2.5771484375, 2.842529296875, 3.10791015625, 3.373291015625, 3.638671875, 3.904052734375, 4.16943359375, 4.434814453125, 4.7001953125, 4.965576171875, 5.23095703125, 5.496337890625, 5.76171875, 6.027099609375, 6.29248046875, 6.557861328125, 6.8232421875, 7.088623046875, 7.35400390625, 7.619384765625, 7.884765625, 8.150146484375, 8.41552734375, 8.680908203125, 8.9462890625, 9.211669921875, 9.47705078125, 9.742431640625, 10.0078125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 4.0, 24.0, 24.0, 48.0, 44.0, 85.0, 117.0, 189.0, 326.0, 463.0, 646.0, 562.0, 499.0, 345.0, 248.0, 152.0, 76.0, 72.0, 49.0, 31.0, 23.0, 13.0, 12.0, 5.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.25, -20.769775390625, -20.28955078125, -19.809326171875, -19.3291015625, -18.848876953125, -18.36865234375, -17.888427734375, -17.408203125, -16.927978515625, -16.44775390625, -15.967529296875, -15.4873046875, -15.007080078125, -14.52685546875, -14.046630859375, -13.56640625, -13.086181640625, -12.60595703125, -12.125732421875, -11.6455078125, -11.165283203125, -10.68505859375, -10.204833984375, -9.724609375, -9.244384765625, -8.76416015625, -8.283935546875, -7.8037109375, -7.323486328125, -6.84326171875, -6.363037109375, -5.8828125, -5.402587890625, -4.92236328125, -4.442138671875, -3.9619140625, -3.481689453125, -3.00146484375, -2.521240234375, -2.041015625, -1.560791015625, -1.08056640625, -0.600341796875, -0.1201171875, 0.360107421875, 0.84033203125, 1.320556640625, 1.80078125, 2.281005859375, 2.76123046875, 3.241455078125, 3.7216796875, 4.201904296875, 4.68212890625, 5.162353515625, 5.642578125, 6.122802734375, 6.60302734375, 7.083251953125, 7.5634765625, 8.043701171875, 8.52392578125, 9.004150390625, 9.484375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 11.0, 16.0, 19.0, 35.0, 58.0, 82.0, 120.0, 202.0, 352.0, 656.0, 1519.0, 11633.0, 4079440.0, 96082.0, 2192.0, 789.0, 424.0, 250.0, 149.0, 91.0, 60.0, 43.0, 20.0, 21.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -35.38134765625, -33.6689453125, -31.95654296875, -30.244140625, -28.53173828125, -26.8193359375, -25.10693359375, -23.39453125, -21.68212890625, -19.9697265625, -18.25732421875, -16.544921875, -14.83251953125, -13.1201171875, -11.40771484375, -9.6953125, -7.98291015625, -6.2705078125, -4.55810546875, -2.845703125, -1.13330078125, 0.5791015625, 2.29150390625, 4.00390625, 5.71630859375, 7.4287109375, 9.14111328125, 10.853515625, 12.56591796875, 14.2783203125, 15.99072265625, 17.703125, 19.41552734375, 21.1279296875, 22.84033203125, 24.552734375, 26.26513671875, 27.9775390625, 29.68994140625, 31.40234375, 33.11474609375, 34.8271484375, 36.53955078125, 38.251953125, 39.96435546875, 41.6767578125, 43.38916015625, 45.1015625, 46.81396484375, 48.5263671875, 50.23876953125, 51.951171875, 53.66357421875, 55.3759765625, 57.08837890625, 58.80078125, 60.51318359375, 62.2255859375, 63.93798828125, 65.650390625, 67.36279296875, 69.0751953125, 70.78759765625, 72.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 149.0, 457.0, 336.0, 56.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.36093139648438, -139.35037231445312, -134.33981323242188, -129.3292694091797, -124.31871032714844, -119.30815124511719, -114.29759216308594, -109.28703308105469, -104.27648162841797, -99.26592254638672, -94.25537109375, -89.24481201171875, -84.2342529296875, -79.22370147705078, -74.21314239501953, -69.20259094238281, -64.19203186035156, -59.18147659301758, -54.170921325683594, -49.160362243652344, -44.14980697631836, -39.139251708984375, -34.128692626953125, -29.11813735961914, -24.107582092285156, -19.097026824951172, -14.086469650268555, -9.075913429260254, -4.065357208251953, 0.9451980590820312, 5.955755233764648, 10.966312408447266, 15.976882934570312, 20.987438201904297, 25.997995376586914, 31.00855255126953, 36.019107818603516, 41.0296630859375, 46.04022216796875, 51.050777435302734, 56.06133270263672, 61.0718879699707, 66.08244323730469, 71.09300231933594, 76.10356140136719, 81.1141128540039, 86.12467193603516, 91.13522338867188, 96.14578247070312, 101.15634155273438, 106.1668930053711, 111.17745208740234, 116.18800354003906, 121.19856262207031, 126.20912170410156, 131.2196807861328, 136.230224609375, 141.24078369140625, 146.2513427734375, 151.2618865966797, 156.27244567871094, 161.2830047607422, 166.29356384277344, 171.3041229248047, 176.31468200683594]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 3.0, 7.0, 13.0, 15.0, 10.0, 9.0, 19.0, 26.0, 30.0, 24.0, 23.0, 32.0, 33.0, 37.0, 40.0, 40.0, 53.0, 41.0, 45.0, 44.0, 44.0, 44.0, 42.0, 20.0, 36.0, 35.0, 46.0, 29.0, 30.0, 27.0, 13.0, 16.0, 19.0, 15.0, 9.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.76203155517578, -36.543174743652344, -35.324317932128906, -34.10546112060547, -32.88660430908203, -31.667747497558594, -30.44889259338379, -29.23003578186035, -28.011178970336914, -26.792322158813477, -25.57346534729004, -24.3546085357666, -23.135753631591797, -21.91689682006836, -20.698040008544922, -19.479183197021484, -18.260326385498047, -17.04146957397461, -15.822612762451172, -14.60375690460205, -13.384900093078613, -12.166043281555176, -10.947187423706055, -9.728330612182617, -8.50947380065918, -7.290616989135742, -6.071760654449463, -4.852904319763184, -3.634047508239746, -2.4151906967163086, -1.1963343620300293, 0.02252197265625, 1.2413749694824219, 2.4602315425872803, 3.6790881156921387, 4.897944450378418, 6.1168012619018555, 7.335658073425293, 8.554513931274414, 9.773370742797852, 10.992227554321289, 12.211084365844727, 13.429941177368164, 14.648797035217285, 15.867653846740723, 17.086509704589844, 18.30536651611328, 19.52422332763672, 20.743080139160156, 21.961936950683594, 23.18079376220703, 24.39965057373047, 25.618507385253906, 26.837364196777344, 28.05621910095215, 29.275075912475586, 30.493932723999023, 31.71278953552246, 32.931644439697266, 34.1505012512207, 35.36935806274414, 36.58821487426758, 37.807071685791016, 39.02592849731445, 40.24478530883789]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 8.0, 4.0, 15.0, 11.0, 15.0, 15.0, 16.0, 19.0, 26.0, 16.0, 18.0, 20.0, 29.0, 21.0, 35.0, 37.0, 43.0, 33.0, 34.0, 39.0, 53.0, 45.0, 40.0, 35.0, 35.0, 37.0, 29.0, 24.0, 27.0, 33.0, 32.0, 19.0, 12.0, 28.0, 17.0, 11.0, 9.0, 9.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.578125, -5.39715576171875, -5.2161865234375, -5.03521728515625, -4.854248046875, -4.67327880859375, -4.4923095703125, -4.31134033203125, -4.13037109375, -3.94940185546875, -3.7684326171875, -3.58746337890625, -3.406494140625, -3.22552490234375, -3.0445556640625, -2.86358642578125, -2.6826171875, -2.50164794921875, -2.3206787109375, -2.13970947265625, -1.958740234375, -1.77777099609375, -1.5968017578125, -1.41583251953125, -1.23486328125, -1.05389404296875, -0.8729248046875, -0.69195556640625, -0.510986328125, -0.33001708984375, -0.1490478515625, 0.03192138671875, 0.212890625, 0.39385986328125, 0.5748291015625, 0.75579833984375, 0.936767578125, 1.11773681640625, 1.2987060546875, 1.47967529296875, 1.66064453125, 1.84161376953125, 2.0225830078125, 2.20355224609375, 2.384521484375, 2.56549072265625, 2.7464599609375, 2.92742919921875, 3.1083984375, 3.28936767578125, 3.4703369140625, 3.65130615234375, 3.832275390625, 4.01324462890625, 4.1942138671875, 4.37518310546875, 4.55615234375, 4.73712158203125, 4.9180908203125, 5.09906005859375, 5.280029296875, 5.46099853515625, 5.6419677734375, 5.82293701171875, 6.00390625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 13.0, 29.0, 16.0, 37.0, 58.0, 74.0, 92.0, 161.0, 229.0, 300.0, 445.0, 673.0, 919.0, 1337.0, 1934.0, 2783.0, 4116.0, 5930.0, 8892.0, 13028.0, 19653.0, 29339.0, 46020.0, 74705.0, 135151.0, 323480.0, 152338.0, 81367.0, 49280.0, 31702.0, 20843.0, 13931.0, 9405.0, 6275.0, 4357.0, 2930.0, 2029.0, 1412.0, 1018.0, 684.0, 482.0, 339.0, 226.0, 175.0, 100.0, 81.0, 64.0, 32.0, 26.0, 19.0, 14.0, 5.0, 5.0, 3.0, 1.0, 3.0], "bins": [-1.3291015625, -1.289520263671875, -1.24993896484375, -1.210357666015625, -1.1707763671875, -1.131195068359375, -1.09161376953125, -1.052032470703125, -1.012451171875, -0.972869873046875, -0.93328857421875, -0.893707275390625, -0.8541259765625, -0.814544677734375, -0.77496337890625, -0.735382080078125, -0.69580078125, -0.656219482421875, -0.61663818359375, -0.577056884765625, -0.5374755859375, -0.497894287109375, -0.45831298828125, -0.418731689453125, -0.379150390625, -0.339569091796875, -0.29998779296875, -0.260406494140625, -0.2208251953125, -0.181243896484375, -0.14166259765625, -0.102081298828125, -0.0625, -0.022918701171875, 0.01666259765625, 0.056243896484375, 0.0958251953125, 0.135406494140625, 0.17498779296875, 0.214569091796875, 0.254150390625, 0.293731689453125, 0.33331298828125, 0.372894287109375, 0.4124755859375, 0.452056884765625, 0.49163818359375, 0.531219482421875, 0.57080078125, 0.610382080078125, 0.64996337890625, 0.689544677734375, 0.7291259765625, 0.768707275390625, 0.80828857421875, 0.847869873046875, 0.887451171875, 0.927032470703125, 0.96661376953125, 1.006195068359375, 1.0457763671875, 1.085357666015625, 1.12493896484375, 1.164520263671875, 1.2041015625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 10.0, 11.0, 6.0, 14.0, 14.0, 20.0, 17.0, 21.0, 26.0, 33.0, 26.0, 28.0, 43.0, 36.0, 30.0, 36.0, 57.0, 38.0, 1069.0, 37.0, 39.0, 44.0, 39.0, 35.0, 34.0, 34.0, 21.0, 29.0, 25.0, 25.0, 19.0, 8.0, 15.0, 7.0, 12.0, 5.0, 12.0, 9.0, 3.0, 3.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.75, -3.632598876953125, -3.51519775390625, -3.397796630859375, -3.2803955078125, -3.162994384765625, -3.04559326171875, -2.928192138671875, -2.810791015625, -2.693389892578125, -2.57598876953125, -2.458587646484375, -2.3411865234375, -2.223785400390625, -2.10638427734375, -1.988983154296875, -1.87158203125, -1.754180908203125, -1.63677978515625, -1.519378662109375, -1.4019775390625, -1.284576416015625, -1.16717529296875, -1.049774169921875, -0.932373046875, -0.814971923828125, -0.69757080078125, -0.580169677734375, -0.4627685546875, -0.345367431640625, -0.22796630859375, -0.110565185546875, 0.0068359375, 0.124237060546875, 0.24163818359375, 0.359039306640625, 0.4764404296875, 0.593841552734375, 0.71124267578125, 0.828643798828125, 0.946044921875, 1.063446044921875, 1.18084716796875, 1.298248291015625, 1.4156494140625, 1.533050537109375, 1.65045166015625, 1.767852783203125, 1.88525390625, 2.002655029296875, 2.12005615234375, 2.237457275390625, 2.3548583984375, 2.472259521484375, 2.58966064453125, 2.707061767578125, 2.824462890625, 2.941864013671875, 3.05926513671875, 3.176666259765625, 3.2940673828125, 3.411468505859375, 3.52886962890625, 3.646270751953125, 3.763671875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 12.0, 22.0, 20.0, 31.0, 52.0, 77.0, 90.0, 129.0, 214.0, 324.0, 417.0, 676.0, 1057.0, 1600.0, 2537.0, 4005.0, 6535.0, 10416.0, 17568.0, 29839.0, 52014.0, 96998.0, 240289.0, 1376395.0, 112916.0, 59324.0, 33109.0, 19245.0, 11361.0, 7068.0, 4468.0, 2887.0, 1883.0, 1238.0, 771.0, 517.0, 352.0, 237.0, 154.0, 77.0, 67.0, 47.0, 30.0, 11.0, 18.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.496795654296875, -1.44866943359375, -1.400543212890625, -1.3524169921875, -1.304290771484375, -1.25616455078125, -1.208038330078125, -1.159912109375, -1.111785888671875, -1.06365966796875, -1.015533447265625, -0.9674072265625, -0.919281005859375, -0.87115478515625, -0.823028564453125, -0.77490234375, -0.726776123046875, -0.67864990234375, -0.630523681640625, -0.5823974609375, -0.534271240234375, -0.48614501953125, -0.438018798828125, -0.389892578125, -0.341766357421875, -0.29364013671875, -0.245513916015625, -0.1973876953125, -0.149261474609375, -0.10113525390625, -0.053009033203125, -0.0048828125, 0.043243408203125, 0.09136962890625, 0.139495849609375, 0.1876220703125, 0.235748291015625, 0.28387451171875, 0.332000732421875, 0.380126953125, 0.428253173828125, 0.47637939453125, 0.524505615234375, 0.5726318359375, 0.620758056640625, 0.66888427734375, 0.717010498046875, 0.76513671875, 0.813262939453125, 0.86138916015625, 0.909515380859375, 0.9576416015625, 1.005767822265625, 1.05389404296875, 1.102020263671875, 1.150146484375, 1.198272705078125, 1.24639892578125, 1.294525146484375, 1.3426513671875, 1.390777587890625, 1.43890380859375, 1.487030029296875, 1.53515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 9.0, 6.0, 9.0, 11.0, 20.0, 29.0, 41.0, 82.0, 123.0, 175.0, 178.0, 108.0, 68.0, 38.0, 25.0, 19.0, 10.0, 9.0, 9.0, 0.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011463165283203125, -0.0011051595211029053, -0.001064002513885498, -0.0010228455066680908, -0.0009816884994506836, -0.0009405314922332764, -0.0008993744850158691, -0.0008582174777984619, -0.0008170604705810547, -0.0007759034633636475, -0.0007347464561462402, -0.000693589448928833, -0.0006524324417114258, -0.0006112754344940186, -0.0005701184272766113, -0.0005289614200592041, -0.0004878044128417969, -0.00044664740562438965, -0.0004054903984069824, -0.0003643333911895752, -0.00032317638397216797, -0.00028201937675476074, -0.00024086236953735352, -0.0001997053623199463, -0.00015854835510253906, -0.00011739134788513184, -7.623434066772461e-05, -3.507733345031738e-05, 6.079673767089844e-06, 4.723668098449707e-05, 8.83936882019043e-05, 0.00012955069541931152, 0.00017070770263671875, 0.00021186470985412598, 0.0002530217170715332, 0.00029417872428894043, 0.00033533573150634766, 0.0003764927387237549, 0.0004176497459411621, 0.00045880675315856934, 0.0004999637603759766, 0.0005411207675933838, 0.000582277774810791, 0.0006234347820281982, 0.0006645917892456055, 0.0007057487964630127, 0.0007469058036804199, 0.0007880628108978271, 0.0008292198181152344, 0.0008703768253326416, 0.0009115338325500488, 0.0009526908397674561, 0.0009938478469848633, 0.0010350048542022705, 0.0010761618614196777, 0.001117318868637085, 0.0011584758758544922, 0.0011996328830718994, 0.0012407898902893066, 0.0012819468975067139, 0.001323103904724121, 0.0013642609119415283, 0.0014054179191589355, 0.0014465749263763428, 0.00148773193359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 13.0, 11.0, 13.0, 23.0, 31.0, 60.0, 70.0, 132.0, 268.0, 715.0, 39494.0, 1005556.0, 1308.0, 353.0, 178.0, 103.0, 58.0, 31.0, 29.0, 13.0, 20.0, 10.0, 12.0, 5.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.027862548828125, -0.027092695236206055, -0.02632284164428711, -0.025552988052368164, -0.02478313446044922, -0.024013280868530273, -0.023243427276611328, -0.022473573684692383, -0.021703720092773438, -0.020933866500854492, -0.020164012908935547, -0.0193941593170166, -0.018624305725097656, -0.01785445213317871, -0.017084598541259766, -0.01631474494934082, -0.015544891357421875, -0.01477503776550293, -0.014005184173583984, -0.013235330581665039, -0.012465476989746094, -0.011695623397827148, -0.010925769805908203, -0.010155916213989258, -0.009386062622070312, -0.008616209030151367, -0.007846355438232422, -0.0070765018463134766, -0.006306648254394531, -0.005536794662475586, -0.004766941070556641, -0.003997087478637695, -0.00322723388671875, -0.0024573802947998047, -0.0016875267028808594, -0.0009176731109619141, -0.00014781951904296875, 0.0006220340728759766, 0.0013918876647949219, 0.002161741256713867, 0.0029315948486328125, 0.003701448440551758, 0.004471302032470703, 0.0052411556243896484, 0.006011009216308594, 0.006780862808227539, 0.007550716400146484, 0.00832056999206543, 0.009090423583984375, 0.00986027717590332, 0.010630130767822266, 0.011399984359741211, 0.012169837951660156, 0.012939691543579102, 0.013709545135498047, 0.014479398727416992, 0.015249252319335938, 0.016019105911254883, 0.016788959503173828, 0.017558813095092773, 0.01832866668701172, 0.019098520278930664, 0.01986837387084961, 0.020638227462768555, 0.0214080810546875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 499.0, 498.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006397530902177095, -0.0062641846016049385, -0.006130837835371494, -0.005997491534799337, -0.0058641452342271805, -0.005730798467993736, -0.005597452167421579, -0.005464105401188135, -0.005330759100615978, -0.005197412800043821, -0.005064066033810377, -0.00493071973323822, -0.004797372967004776, -0.004664026666432619, -0.004530680365860462, -0.004397333599627018, -0.004263987299054861, -0.004130640998482704, -0.00399729423224926, -0.003863947931677103, -0.0037306013982743025, -0.003597254864871502, -0.003463908564299345, -0.0033305620308965445, -0.003197215497493744, -0.0030638689640909433, -0.0029305224306881428, -0.002797176130115986, -0.0026638295967131853, -0.0025304830633103848, -0.002397136762738228, -0.0022637902293354273, -0.002130444161593914, -0.0019970976281911135, -0.0018637512112036347, -0.001730404794216156, -0.0015970582608133554, -0.0014637117274105549, -0.0013303653104230762, -0.0011970188934355974, -0.0010636723600327969, -0.0009303258848376572, -0.0007969794096425176, -0.0006636329344473779, -0.0005302864592522383, -0.0003969399840570986, -0.000263593508861959, -0.00013024703366681933, 3.0994415283203125e-06, 0.00013644591672345996, 0.0002697923919185996, 0.00040313886711373925, 0.0005364853423088789, 0.0006698318175040185, 0.0008031782926991582, 0.0009365247678942978, 0.0010698712430894375, 0.001203217776492238, 0.0013365641934797168, 0.0014699106104671955, 0.001603257143869996, 0.0017366036772727966, 0.0018699500942602754, 0.002003296511247754, 0.0021366430446505547]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 14.0, 13.0, 15.0, 10.0, 23.0, 18.0, 26.0, 27.0, 25.0, 34.0, 36.0, 48.0, 38.0, 45.0, 42.0, 50.0, 56.0, 44.0, 55.0, 43.0, 38.0, 44.0, 36.0, 37.0, 30.0, 23.0, 24.0, 19.0, 16.0, 11.0, 7.0, 11.0, 4.0, 5.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004138350486755371, -0.0003994675353169441, -0.00038510002195835114, -0.00037073250859975815, -0.00035636499524116516, -0.0003419974818825722, -0.0003276299685239792, -0.0003132624551653862, -0.0002988949418067932, -0.0002845274284482002, -0.00027015991508960724, -0.00025579240173101425, -0.00024142488837242126, -0.00022705737501382828, -0.0002126898616552353, -0.0001983223482966423, -0.00018395483493804932, -0.00016958732157945633, -0.00015521980822086334, -0.00014085229486227036, -0.00012648478150367737, -0.00011211726814508438, -9.77497547864914e-05, -8.338224142789841e-05, -6.901472806930542e-05, -5.464721471071243e-05, -4.0279701352119446e-05, -2.591218799352646e-05, -1.1544674634933472e-05, 2.8228387236595154e-06, 1.7190352082252502e-05, 3.155786544084549e-05, 4.5925378799438477e-05, 6.0292892158031464e-05, 7.466040551662445e-05, 8.902791887521744e-05, 0.00010339543223381042, 0.00011776294559240341, 0.0001321304589509964, 0.00014649797230958939, 0.00016086548566818237, 0.00017523299902677536, 0.00018960051238536835, 0.00020396802574396133, 0.00021833553910255432, 0.0002327030524611473, 0.0002470705658197403, 0.0002614380791783333, 0.00027580559253692627, 0.00029017310589551926, 0.00030454061925411224, 0.00031890813261270523, 0.0003332756459712982, 0.0003476431593298912, 0.0003620106726884842, 0.0003763781860470772, 0.00039074569940567017, 0.00040511321276426315, 0.00041948072612285614, 0.00043384823948144913, 0.0004482157528400421, 0.0004625832661986351, 0.0004769507795572281, 0.0004913182929158211, 0.0005056858062744141]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 8.0, 4.0, 15.0, 11.0, 15.0, 15.0, 16.0, 19.0, 26.0, 16.0, 18.0, 20.0, 29.0, 21.0, 35.0, 37.0, 43.0, 33.0, 34.0, 40.0, 52.0, 45.0, 40.0, 35.0, 35.0, 37.0, 29.0, 24.0, 27.0, 33.0, 32.0, 19.0, 12.0, 28.0, 17.0, 11.0, 9.0, 9.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.578125, -5.39715576171875, -5.2161865234375, -5.03521728515625, -4.854248046875, -4.67327880859375, -4.4923095703125, -4.31134033203125, -4.13037109375, -3.94940185546875, -3.7684326171875, -3.58746337890625, -3.406494140625, -3.22552490234375, -3.0445556640625, -2.86358642578125, -2.6826171875, -2.50164794921875, -2.3206787109375, -2.13970947265625, -1.958740234375, -1.77777099609375, -1.5968017578125, -1.41583251953125, -1.23486328125, -1.05389404296875, -0.8729248046875, -0.69195556640625, -0.510986328125, -0.33001708984375, -0.1490478515625, 0.03192138671875, 0.212890625, 0.39385986328125, 0.5748291015625, 0.75579833984375, 0.936767578125, 1.11773681640625, 1.2987060546875, 1.47967529296875, 1.66064453125, 1.84161376953125, 2.0225830078125, 2.20355224609375, 2.384521484375, 2.56549072265625, 2.7464599609375, 2.92742919921875, 3.1083984375, 3.28936767578125, 3.4703369140625, 3.65130615234375, 3.832275390625, 4.01324462890625, 4.1942138671875, 4.37518310546875, 4.55615234375, 4.73712158203125, 4.9180908203125, 5.09906005859375, 5.280029296875, 5.46099853515625, 5.6419677734375, 5.82293701171875, 6.00390625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 13.0, 5.0, 9.0, 13.0, 17.0, 23.0, 29.0, 38.0, 48.0, 76.0, 141.0, 236.0, 516.0, 1048.0, 2379.0, 5749.0, 13634.0, 33254.0, 87751.0, 252025.0, 379933.0, 170369.0, 60243.0, 23612.0, 9850.0, 4155.0, 1701.0, 765.0, 372.0, 192.0, 98.0, 68.0, 52.0, 27.0, 19.0, 14.0, 15.0, 17.0, 10.0, 5.0, 3.0, 9.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-6.03515625, -5.8424072265625, -5.649658203125, -5.4569091796875, -5.26416015625, -5.0714111328125, -4.878662109375, -4.6859130859375, -4.4931640625, -4.3004150390625, -4.107666015625, -3.9149169921875, -3.72216796875, -3.5294189453125, -3.336669921875, -3.1439208984375, -2.951171875, -2.7584228515625, -2.565673828125, -2.3729248046875, -2.18017578125, -1.9874267578125, -1.794677734375, -1.6019287109375, -1.4091796875, -1.2164306640625, -1.023681640625, -0.8309326171875, -0.63818359375, -0.4454345703125, -0.252685546875, -0.0599365234375, 0.1328125, 0.3255615234375, 0.518310546875, 0.7110595703125, 0.90380859375, 1.0965576171875, 1.289306640625, 1.4820556640625, 1.6748046875, 1.8675537109375, 2.060302734375, 2.2530517578125, 2.44580078125, 2.6385498046875, 2.831298828125, 3.0240478515625, 3.216796875, 3.4095458984375, 3.602294921875, 3.7950439453125, 3.98779296875, 4.1805419921875, 4.373291015625, 4.5660400390625, 4.7587890625, 4.9515380859375, 5.144287109375, 5.3370361328125, 5.52978515625, 5.7225341796875, 5.915283203125, 6.1080322265625, 6.30078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 10.0, 6.0, 9.0, 12.0, 13.0, 19.0, 26.0, 22.0, 32.0, 26.0, 36.0, 30.0, 43.0, 33.0, 58.0, 85.0, 199.0, 1449.0, 347.0, 108.0, 79.0, 42.0, 37.0, 42.0, 44.0, 28.0, 31.0, 34.0, 21.0, 13.0, 18.0, 13.0, 11.0, 10.0, 10.0, 13.0, 6.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0], "bins": [-22.875, -22.217041015625, -21.55908203125, -20.901123046875, -20.2431640625, -19.585205078125, -18.92724609375, -18.269287109375, -17.611328125, -16.953369140625, -16.29541015625, -15.637451171875, -14.9794921875, -14.321533203125, -13.66357421875, -13.005615234375, -12.34765625, -11.689697265625, -11.03173828125, -10.373779296875, -9.7158203125, -9.057861328125, -8.39990234375, -7.741943359375, -7.083984375, -6.426025390625, -5.76806640625, -5.110107421875, -4.4521484375, -3.794189453125, -3.13623046875, -2.478271484375, -1.8203125, -1.162353515625, -0.50439453125, 0.153564453125, 0.8115234375, 1.469482421875, 2.12744140625, 2.785400390625, 3.443359375, 4.101318359375, 4.75927734375, 5.417236328125, 6.0751953125, 6.733154296875, 7.39111328125, 8.049072265625, 8.70703125, 9.364990234375, 10.02294921875, 10.680908203125, 11.3388671875, 11.996826171875, 12.65478515625, 13.312744140625, 13.970703125, 14.628662109375, 15.28662109375, 15.944580078125, 16.6025390625, 17.260498046875, 17.91845703125, 18.576416015625, 19.234375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 5.0, 20.0, 14.0, 14.0, 14.0, 26.0, 36.0, 55.0, 55.0, 77.0, 149.0, 244.0, 376.0, 811.0, 4082.0, 2929729.0, 206590.0, 1877.0, 629.0, 334.0, 185.0, 97.0, 74.0, 50.0, 50.0, 24.0, 16.0, 14.0, 13.0, 6.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-58.125, -56.35498046875, -54.5849609375, -52.81494140625, -51.044921875, -49.27490234375, -47.5048828125, -45.73486328125, -43.96484375, -42.19482421875, -40.4248046875, -38.65478515625, -36.884765625, -35.11474609375, -33.3447265625, -31.57470703125, -29.8046875, -28.03466796875, -26.2646484375, -24.49462890625, -22.724609375, -20.95458984375, -19.1845703125, -17.41455078125, -15.64453125, -13.87451171875, -12.1044921875, -10.33447265625, -8.564453125, -6.79443359375, -5.0244140625, -3.25439453125, -1.484375, 0.28564453125, 2.0556640625, 3.82568359375, 5.595703125, 7.36572265625, 9.1357421875, 10.90576171875, 12.67578125, 14.44580078125, 16.2158203125, 17.98583984375, 19.755859375, 21.52587890625, 23.2958984375, 25.06591796875, 26.8359375, 28.60595703125, 30.3759765625, 32.14599609375, 33.916015625, 35.68603515625, 37.4560546875, 39.22607421875, 40.99609375, 42.76611328125, 44.5361328125, 46.30615234375, 48.076171875, 49.84619140625, 51.6162109375, 53.38623046875, 55.15625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 117.0, 766.0, 129.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.33853149414062, -105.20160675048828, -100.0646743774414, -94.92774963378906, -89.79081726074219, -84.65389251708984, -79.5169677734375, -74.38003540039062, -69.24311065673828, -64.10618591308594, -58.96925354003906, -53.83232879638672, -48.69540023803711, -43.5584716796875, -38.421546936035156, -33.28461837768555, -28.147689819335938, -23.010761260986328, -17.87383460998535, -12.736907005310059, -7.599979400634766, -2.4630508422851562, 2.6738758087158203, 7.810802459716797, 12.947731018066406, 18.084659576416016, 23.221586227416992, 28.35851287841797, 33.49544143676758, 38.63236999511719, 43.76929473876953, 48.90622329711914, 54.04316711425781, 59.18009567260742, 64.31702423095703, 69.45394897460938, 74.59088134765625, 79.7278060913086, 84.86473083496094, 90.00166320800781, 95.13858795166016, 100.2755126953125, 105.41244506835938, 110.54936981201172, 115.68629455566406, 120.82322692871094, 125.96015167236328, 131.09707641601562, 136.2340087890625, 141.37094116210938, 146.5078582763672, 151.64479064941406, 156.78172302246094, 161.91864013671875, 167.05557250976562, 172.1925048828125, 177.32943725585938, 182.46636962890625, 187.60328674316406, 192.74021911621094, 197.8771514892578, 203.01406860351562, 208.1510009765625, 213.28793334960938, 218.4248504638672]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 3.0, 7.0, 10.0, 13.0, 15.0, 15.0, 23.0, 27.0, 24.0, 18.0, 35.0, 21.0, 37.0, 35.0, 37.0, 37.0, 39.0, 49.0, 46.0, 41.0, 37.0, 24.0, 40.0, 38.0, 38.0, 37.0, 22.0, 29.0, 32.0, 32.0, 23.0, 17.0, 15.0, 17.0, 9.0, 11.0, 7.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.971168518066406, -55.327877044677734, -53.68458938598633, -52.041297912597656, -50.398006439208984, -48.75471878051758, -47.111427307128906, -45.4681396484375, -43.82484817504883, -42.181556701660156, -40.53826904296875, -38.89497756958008, -37.251686096191406, -35.6083984375, -33.96510696411133, -32.321815490722656, -30.678525924682617, -29.035236358642578, -27.391944885253906, -25.748655319213867, -24.105365753173828, -22.462074279785156, -20.818784713745117, -19.175495147705078, -17.532203674316406, -15.88891315460205, -14.245623588562012, -12.602333068847656, -10.959043502807617, -9.315752983093262, -7.672462463378906, -6.029172897338867, -4.385883331298828, -2.742593288421631, -1.0993030071258545, 0.5439872741699219, 2.187277317047119, 3.8305673599243164, 5.473857879638672, 7.117147445678711, 8.760437965393066, 10.403728485107422, 12.047018051147461, 13.690308570861816, 15.333599090576172, 16.97688865661621, 18.62017822265625, 20.263469696044922, 21.90675926208496, 23.550048828125, 25.193340301513672, 26.83662986755371, 28.47991943359375, 30.123210906982422, 31.76650047302246, 33.4097900390625, 35.05308151245117, 36.696372985839844, 38.33966064453125, 39.98295211791992, 41.626243591308594, 43.26953125, 44.91282272338867, 46.556114196777344, 48.19940185546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 7.0, 6.0, 3.0, 8.0, 15.0, 13.0, 19.0, 19.0, 13.0, 13.0, 26.0, 20.0, 40.0, 30.0, 26.0, 36.0, 34.0, 39.0, 38.0, 48.0, 45.0, 43.0, 36.0, 34.0, 51.0, 27.0, 22.0, 33.0, 24.0, 32.0, 27.0, 18.0, 16.0, 19.0, 21.0, 13.0, 16.0, 11.0, 12.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.80078125, -5.60845947265625, -5.4161376953125, -5.22381591796875, -5.031494140625, -4.83917236328125, -4.6468505859375, -4.45452880859375, -4.26220703125, -4.06988525390625, -3.8775634765625, -3.68524169921875, -3.492919921875, -3.30059814453125, -3.1082763671875, -2.91595458984375, -2.7236328125, -2.53131103515625, -2.3389892578125, -2.14666748046875, -1.954345703125, -1.76202392578125, -1.5697021484375, -1.37738037109375, -1.18505859375, -0.99273681640625, -0.8004150390625, -0.60809326171875, -0.415771484375, -0.22344970703125, -0.0311279296875, 0.16119384765625, 0.353515625, 0.54583740234375, 0.7381591796875, 0.93048095703125, 1.122802734375, 1.31512451171875, 1.5074462890625, 1.69976806640625, 1.89208984375, 2.08441162109375, 2.2767333984375, 2.46905517578125, 2.661376953125, 2.85369873046875, 3.0460205078125, 3.23834228515625, 3.4306640625, 3.62298583984375, 3.8153076171875, 4.00762939453125, 4.199951171875, 4.39227294921875, 4.5845947265625, 4.77691650390625, 4.96923828125, 5.16156005859375, 5.3538818359375, 5.54620361328125, 5.738525390625, 5.93084716796875, 6.1231689453125, 6.31549072265625, 6.5078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 14.0, 13.0, 8.0, 15.0, 22.0, 23.0, 32.0, 41.0, 50.0, 54.0, 71.0, 101.0, 155.0, 281.0, 914.0, 9774.0, 843542.0, 3222740.0, 112466.0, 2638.0, 531.0, 191.0, 114.0, 89.0, 68.0, 49.0, 46.0, 29.0, 28.0, 24.0, 16.0, 24.0, 16.0, 15.0, 9.0, 10.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.65625, -18.01904296875, -17.3818359375, -16.74462890625, -16.107421875, -15.47021484375, -14.8330078125, -14.19580078125, -13.55859375, -12.92138671875, -12.2841796875, -11.64697265625, -11.009765625, -10.37255859375, -9.7353515625, -9.09814453125, -8.4609375, -7.82373046875, -7.1865234375, -6.54931640625, -5.912109375, -5.27490234375, -4.6376953125, -4.00048828125, -3.36328125, -2.72607421875, -2.0888671875, -1.45166015625, -0.814453125, -0.17724609375, 0.4599609375, 1.09716796875, 1.734375, 2.37158203125, 3.0087890625, 3.64599609375, 4.283203125, 4.92041015625, 5.5576171875, 6.19482421875, 6.83203125, 7.46923828125, 8.1064453125, 8.74365234375, 9.380859375, 10.01806640625, 10.6552734375, 11.29248046875, 11.9296875, 12.56689453125, 13.2041015625, 13.84130859375, 14.478515625, 15.11572265625, 15.7529296875, 16.39013671875, 17.02734375, 17.66455078125, 18.3017578125, 18.93896484375, 19.576171875, 20.21337890625, 20.8505859375, 21.48779296875, 22.125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 11.0, 9.0, 16.0, 25.0, 26.0, 36.0, 51.0, 47.0, 69.0, 127.0, 131.0, 236.0, 314.0, 411.0, 429.0, 496.0, 403.0, 287.0, 253.0, 181.0, 121.0, 92.0, 72.0, 45.0, 49.0, 29.0, 20.0, 13.0, 12.0, 11.0, 5.0, 5.0, 5.0, 6.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.0489501953125, -8.738525390625, -8.4281005859375, -8.11767578125, -7.8072509765625, -7.496826171875, -7.1864013671875, -6.8759765625, -6.5655517578125, -6.255126953125, -5.9447021484375, -5.63427734375, -5.3238525390625, -5.013427734375, -4.7030029296875, -4.392578125, -4.0821533203125, -3.771728515625, -3.4613037109375, -3.15087890625, -2.8404541015625, -2.530029296875, -2.2196044921875, -1.9091796875, -1.5987548828125, -1.288330078125, -0.9779052734375, -0.66748046875, -0.3570556640625, -0.046630859375, 0.2637939453125, 0.57421875, 0.8846435546875, 1.195068359375, 1.5054931640625, 1.81591796875, 2.1263427734375, 2.436767578125, 2.7471923828125, 3.0576171875, 3.3680419921875, 3.678466796875, 3.9888916015625, 4.29931640625, 4.6097412109375, 4.920166015625, 5.2305908203125, 5.541015625, 5.8514404296875, 6.161865234375, 6.4722900390625, 6.78271484375, 7.0931396484375, 7.403564453125, 7.7139892578125, 8.0244140625, 8.3348388671875, 8.645263671875, 8.9556884765625, 9.26611328125, 9.5765380859375, 9.886962890625, 10.1973876953125, 10.5078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 2.0, 11.0, 13.0, 10.0, 11.0, 17.0, 24.0, 29.0, 44.0, 58.0, 67.0, 71.0, 108.0, 170.0, 196.0, 287.0, 428.0, 807.0, 5192.0, 457244.0, 3694055.0, 31836.0, 1741.0, 589.0, 376.0, 231.0, 159.0, 122.0, 101.0, 64.0, 63.0, 45.0, 24.0, 25.0, 13.0, 11.0, 10.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.2587890625, -30.111328125, -28.9638671875, -27.81640625, -26.6689453125, -25.521484375, -24.3740234375, -23.2265625, -22.0791015625, -20.931640625, -19.7841796875, -18.63671875, -17.4892578125, -16.341796875, -15.1943359375, -14.046875, -12.8994140625, -11.751953125, -10.6044921875, -9.45703125, -8.3095703125, -7.162109375, -6.0146484375, -4.8671875, -3.7197265625, -2.572265625, -1.4248046875, -0.27734375, 0.8701171875, 2.017578125, 3.1650390625, 4.3125, 5.4599609375, 6.607421875, 7.7548828125, 8.90234375, 10.0498046875, 11.197265625, 12.3447265625, 13.4921875, 14.6396484375, 15.787109375, 16.9345703125, 18.08203125, 19.2294921875, 20.376953125, 21.5244140625, 22.671875, 23.8193359375, 24.966796875, 26.1142578125, 27.26171875, 28.4091796875, 29.556640625, 30.7041015625, 31.8515625, 32.9990234375, 34.146484375, 35.2939453125, 36.44140625, 37.5888671875, 38.736328125, 39.8837890625, 41.03125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 31.0, 369.0, 529.0, 78.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.16609954833984, -107.54523468017578, -101.92436981201172, -96.30350494384766, -90.6826400756836, -85.06177520751953, -79.44091033935547, -73.8200454711914, -68.19918060302734, -62.57831573486328, -56.95745086669922, -51.336585998535156, -45.715721130371094, -40.09485626220703, -34.47399139404297, -28.853126525878906, -23.232261657714844, -17.61139678955078, -11.990531921386719, -6.369667053222656, -0.7488021850585938, 4.872062683105469, 10.492927551269531, 16.113792419433594, 21.734657287597656, 27.35552215576172, 32.97638702392578, 38.597251892089844, 44.218116760253906, 49.83898162841797, 55.45984649658203, 61.080711364746094, 66.70156860351562, 72.32243347167969, 77.94329833984375, 83.56416320800781, 89.18502807617188, 94.80589294433594, 100.4267578125, 106.04762268066406, 111.66848754882812, 117.28935241699219, 122.91021728515625, 128.5310821533203, 134.15194702148438, 139.77281188964844, 145.3936767578125, 151.01454162597656, 156.63540649414062, 162.2562713623047, 167.87713623046875, 173.4980010986328, 179.11886596679688, 184.73973083496094, 190.360595703125, 195.98146057128906, 201.60232543945312, 207.2231903076172, 212.84405517578125, 218.4649200439453, 224.08578491210938, 229.70664978027344, 235.3275146484375, 240.94837951660156, 246.56924438476562]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 10.0, 9.0, 12.0, 19.0, 14.0, 20.0, 16.0, 23.0, 31.0, 37.0, 36.0, 29.0, 34.0, 39.0, 49.0, 46.0, 38.0, 38.0, 40.0, 35.0, 36.0, 43.0, 38.0, 28.0, 40.0, 31.0, 26.0, 25.0, 15.0, 22.0, 17.0, 8.0, 19.0, 11.0, 13.0, 6.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.00153732299805, -33.92715072631836, -32.85276412963867, -31.778379440307617, -30.703994750976562, -29.629608154296875, -28.555221557617188, -27.480836868286133, -26.406452178955078, -25.33206558227539, -24.257680892944336, -23.18329429626465, -22.108909606933594, -21.034523010253906, -19.96013641357422, -18.885751724243164, -17.811365127563477, -16.73697853088379, -15.662593841552734, -14.588207244873047, -13.513822555541992, -12.439435958862305, -11.365050315856934, -10.290664672851562, -9.216279029846191, -8.14189338684082, -7.067507743835449, -5.99312162399292, -4.918735980987549, -3.8443503379821777, -2.7699642181396484, -1.6955785751342773, -0.6211929321289062, 0.4531928300857544, 1.527578592300415, 2.6019644737243652, 3.6763501167297363, 4.750735759735107, 5.825121879577637, 6.899507522583008, 7.973893165588379, 9.04827880859375, 10.122664451599121, 11.197050094604492, 12.27143669128418, 13.345821380615234, 14.420207977294922, 15.494593620300293, 16.568979263305664, 17.64336585998535, 18.717750549316406, 19.792137145996094, 20.86652183532715, 21.940908432006836, 23.01529312133789, 24.089679718017578, 25.164066314697266, 26.238452911376953, 27.312837600708008, 28.387224197387695, 29.46160888671875, 30.535995483398438, 31.610382080078125, 32.68476867675781, 33.759151458740234]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 2.0, 10.0, 14.0, 12.0, 17.0, 22.0, 20.0, 33.0, 34.0, 28.0, 40.0, 38.0, 39.0, 51.0, 44.0, 40.0, 37.0, 60.0, 50.0, 37.0, 45.0, 37.0, 29.0, 23.0, 26.0, 19.0, 31.0, 34.0, 21.0, 18.0, 16.0, 14.0, 9.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.17108154296875, -5.9593505859375, -5.74761962890625, -5.535888671875, -5.32415771484375, -5.1124267578125, -4.90069580078125, -4.68896484375, -4.47723388671875, -4.2655029296875, -4.05377197265625, -3.842041015625, -3.63031005859375, -3.4185791015625, -3.20684814453125, -2.9951171875, -2.78338623046875, -2.5716552734375, -2.35992431640625, -2.148193359375, -1.93646240234375, -1.7247314453125, -1.51300048828125, -1.30126953125, -1.08953857421875, -0.8778076171875, -0.66607666015625, -0.454345703125, -0.24261474609375, -0.0308837890625, 0.18084716796875, 0.392578125, 0.60430908203125, 0.8160400390625, 1.02777099609375, 1.239501953125, 1.45123291015625, 1.6629638671875, 1.87469482421875, 2.08642578125, 2.29815673828125, 2.5098876953125, 2.72161865234375, 2.933349609375, 3.14508056640625, 3.3568115234375, 3.56854248046875, 3.7802734375, 3.99200439453125, 4.2037353515625, 4.41546630859375, 4.627197265625, 4.83892822265625, 5.0506591796875, 5.26239013671875, 5.47412109375, 5.68585205078125, 5.8975830078125, 6.10931396484375, 6.321044921875, 6.53277587890625, 6.7445068359375, 6.95623779296875, 7.16796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 9.0, 13.0, 19.0, 26.0, 51.0, 60.0, 104.0, 129.0, 218.0, 303.0, 462.0, 718.0, 1083.0, 1666.0, 2720.0, 4324.0, 7208.0, 11811.0, 19812.0, 34442.0, 62058.0, 124254.0, 358041.0, 210063.0, 91710.0, 48806.0, 27459.0, 15899.0, 9690.0, 5877.0, 3459.0, 2161.0, 1370.0, 859.0, 570.0, 349.0, 253.0, 174.0, 111.0, 79.0, 47.0, 31.0, 24.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.770233154296875, -1.71624755859375, -1.662261962890625, -1.6082763671875, -1.554290771484375, -1.50030517578125, -1.446319580078125, -1.392333984375, -1.338348388671875, -1.28436279296875, -1.230377197265625, -1.1763916015625, -1.122406005859375, -1.06842041015625, -1.014434814453125, -0.96044921875, -0.906463623046875, -0.85247802734375, -0.798492431640625, -0.7445068359375, -0.690521240234375, -0.63653564453125, -0.582550048828125, -0.528564453125, -0.474578857421875, -0.42059326171875, -0.366607666015625, -0.3126220703125, -0.258636474609375, -0.20465087890625, -0.150665283203125, -0.0966796875, -0.042694091796875, 0.01129150390625, 0.065277099609375, 0.1192626953125, 0.173248291015625, 0.22723388671875, 0.281219482421875, 0.335205078125, 0.389190673828125, 0.44317626953125, 0.497161865234375, 0.5511474609375, 0.605133056640625, 0.65911865234375, 0.713104248046875, 0.76708984375, 0.821075439453125, 0.87506103515625, 0.929046630859375, 0.9830322265625, 1.037017822265625, 1.09100341796875, 1.144989013671875, 1.198974609375, 1.252960205078125, 1.30694580078125, 1.360931396484375, 1.4149169921875, 1.468902587890625, 1.52288818359375, 1.576873779296875, 1.630859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 12.0, 14.0, 11.0, 7.0, 10.0, 13.0, 19.0, 13.0, 27.0, 27.0, 25.0, 19.0, 27.0, 28.0, 38.0, 31.0, 44.0, 26.0, 35.0, 32.0, 1054.0, 46.0, 28.0, 36.0, 33.0, 39.0, 33.0, 39.0, 25.0, 32.0, 30.0, 24.0, 20.0, 21.0, 16.0, 10.0, 10.0, 17.0, 9.0, 9.0, 6.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.37890625, -3.26141357421875, -3.1439208984375, -3.02642822265625, -2.908935546875, -2.79144287109375, -2.6739501953125, -2.55645751953125, -2.43896484375, -2.32147216796875, -2.2039794921875, -2.08648681640625, -1.968994140625, -1.85150146484375, -1.7340087890625, -1.61651611328125, -1.4990234375, -1.38153076171875, -1.2640380859375, -1.14654541015625, -1.029052734375, -0.91156005859375, -0.7940673828125, -0.67657470703125, -0.55908203125, -0.44158935546875, -0.3240966796875, -0.20660400390625, -0.089111328125, 0.02838134765625, 0.1458740234375, 0.26336669921875, 0.380859375, 0.49835205078125, 0.6158447265625, 0.73333740234375, 0.850830078125, 0.96832275390625, 1.0858154296875, 1.20330810546875, 1.32080078125, 1.43829345703125, 1.5557861328125, 1.67327880859375, 1.790771484375, 1.90826416015625, 2.0257568359375, 2.14324951171875, 2.2607421875, 2.37823486328125, 2.4957275390625, 2.61322021484375, 2.730712890625, 2.84820556640625, 2.9656982421875, 3.08319091796875, 3.20068359375, 3.31817626953125, 3.4356689453125, 3.55316162109375, 3.670654296875, 3.78814697265625, 3.9056396484375, 4.02313232421875, 4.140625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 1.0, 2.0, 9.0, 20.0, 17.0, 35.0, 23.0, 51.0, 86.0, 118.0, 165.0, 211.0, 378.0, 550.0, 807.0, 1251.0, 1996.0, 3203.0, 4611.0, 7874.0, 12194.0, 19773.0, 32625.0, 55758.0, 97788.0, 203540.0, 1363515.0, 121136.0, 67252.0, 39491.0, 23420.0, 14257.0, 8992.0, 5616.0, 3602.0, 2371.0, 1503.0, 973.0, 633.0, 479.0, 263.0, 172.0, 130.0, 86.0, 41.0, 42.0, 27.0, 22.0, 10.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0], "bins": [-1.6669921875, -1.619598388671875, -1.57220458984375, -1.524810791015625, -1.4774169921875, -1.430023193359375, -1.38262939453125, -1.335235595703125, -1.287841796875, -1.240447998046875, -1.19305419921875, -1.145660400390625, -1.0982666015625, -1.050872802734375, -1.00347900390625, -0.956085205078125, -0.90869140625, -0.861297607421875, -0.81390380859375, -0.766510009765625, -0.7191162109375, -0.671722412109375, -0.62432861328125, -0.576934814453125, -0.529541015625, -0.482147216796875, -0.43475341796875, -0.387359619140625, -0.3399658203125, -0.292572021484375, -0.24517822265625, -0.197784423828125, -0.150390625, -0.102996826171875, -0.05560302734375, -0.008209228515625, 0.0391845703125, 0.086578369140625, 0.13397216796875, 0.181365966796875, 0.228759765625, 0.276153564453125, 0.32354736328125, 0.370941162109375, 0.4183349609375, 0.465728759765625, 0.51312255859375, 0.560516357421875, 0.60791015625, 0.655303955078125, 0.70269775390625, 0.750091552734375, 0.7974853515625, 0.844879150390625, 0.89227294921875, 0.939666748046875, 0.987060546875, 1.034454345703125, 1.08184814453125, 1.129241943359375, 1.1766357421875, 1.224029541015625, 1.27142333984375, 1.318817138671875, 1.3662109375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 3.0, 8.0, 6.0, 5.0, 8.0, 12.0, 15.0, 16.0, 16.0, 11.0, 22.0, 21.0, 26.0, 28.0, 29.0, 39.0, 33.0, 55.0, 68.0, 74.0, 72.0, 55.0, 51.0, 50.0, 39.0, 36.0, 31.0, 31.0, 19.0, 17.0, 16.0, 14.0, 12.0, 8.0, 8.0, 9.0, 7.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0008640289306640625, -0.0008352398872375488, -0.0008064508438110352, -0.0007776618003845215, -0.0007488727569580078, -0.0007200837135314941, -0.0006912946701049805, -0.0006625056266784668, -0.0006337165832519531, -0.0006049275398254395, -0.0005761384963989258, -0.0005473494529724121, -0.0005185604095458984, -0.0004897713661193848, -0.0004609823226928711, -0.0004321932792663574, -0.00040340423583984375, -0.0003746151924133301, -0.0003458261489868164, -0.00031703710556030273, -0.00028824806213378906, -0.0002594590187072754, -0.00023066997528076172, -0.00020188093185424805, -0.00017309188842773438, -0.0001443028450012207, -0.00011551380157470703, -8.672475814819336e-05, -5.793571472167969e-05, -2.9146671295166016e-05, -3.5762786865234375e-07, 2.8431415557861328e-05, 5.7220458984375e-05, 8.600950241088867e-05, 0.00011479854583740234, 0.00014358758926391602, 0.0001723766326904297, 0.00020116567611694336, 0.00022995471954345703, 0.0002587437629699707, 0.0002875328063964844, 0.00031632184982299805, 0.0003451108932495117, 0.0003738999366760254, 0.00040268898010253906, 0.00043147802352905273, 0.0004602670669555664, 0.0004890561103820801, 0.0005178451538085938, 0.0005466341972351074, 0.0005754232406616211, 0.0006042122840881348, 0.0006330013275146484, 0.0006617903709411621, 0.0006905794143676758, 0.0007193684577941895, 0.0007481575012207031, 0.0007769465446472168, 0.0008057355880737305, 0.0008345246315002441, 0.0008633136749267578, 0.0008921027183532715, 0.0009208917617797852, 0.0009496808052062988, 0.0009784698486328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 9.0, 5.0, 6.0, 14.0, 11.0, 19.0, 18.0, 29.0, 34.0, 35.0, 49.0, 68.0, 97.0, 125.0, 213.0, 380.0, 723.0, 7014.0, 1028818.0, 8966.0, 734.0, 373.0, 229.0, 130.0, 88.0, 66.0, 41.0, 42.0, 40.0, 27.0, 27.0, 24.0, 18.0, 16.0, 8.0, 7.0, 15.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0214080810546875, -0.020787954330444336, -0.020167827606201172, -0.019547700881958008, -0.018927574157714844, -0.01830744743347168, -0.017687320709228516, -0.01706719398498535, -0.016447067260742188, -0.015826940536499023, -0.01520681381225586, -0.014586687088012695, -0.013966560363769531, -0.013346433639526367, -0.012726306915283203, -0.012106180191040039, -0.011486053466796875, -0.010865926742553711, -0.010245800018310547, -0.009625673294067383, -0.009005546569824219, -0.008385419845581055, -0.007765293121337891, -0.0071451663970947266, -0.0065250396728515625, -0.0059049129486083984, -0.005284786224365234, -0.00466465950012207, -0.004044532775878906, -0.003424406051635742, -0.002804279327392578, -0.002184152603149414, -0.00156402587890625, -0.0009438991546630859, -0.0003237724304199219, 0.0002963542938232422, 0.0009164810180664062, 0.0015366077423095703, 0.0021567344665527344, 0.0027768611907958984, 0.0033969879150390625, 0.0040171146392822266, 0.004637241363525391, 0.005257368087768555, 0.005877494812011719, 0.006497621536254883, 0.007117748260498047, 0.007737874984741211, 0.008358001708984375, 0.008978128433227539, 0.009598255157470703, 0.010218381881713867, 0.010838508605957031, 0.011458635330200195, 0.01207876205444336, 0.012698888778686523, 0.013319015502929688, 0.013939142227172852, 0.014559268951416016, 0.01517939567565918, 0.015799522399902344, 0.016419649124145508, 0.017039775848388672, 0.017659902572631836, 0.018280029296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 24.0, 444.0, 523.0, 23.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001531265559606254, -0.0014137448742985725, -0.0012962243054062128, -0.0011787036200985312, -0.0010611829347908497, -0.0009436622494831681, -0.0008261416223831475, -0.0007086209952831268, -0.0005911003099754453, -0.00047357965377159417, -0.00035605899756774306, -0.00023853834136389196, -0.00012101768516004086, -3.496999852359295e-06, 0.00011402362724766135, 0.000231544254347682, 0.00034906493965536356, 0.00046658559585921466, 0.0005841062520630658, 0.0007016268791630864, 0.000819147564470768, 0.0009366682497784495, 0.001054188935086131, 0.0011717095039784908, 0.0012892301892861724, 0.001406750874593854, 0.0015242714434862137, 0.0016417921287938952, 0.0017593128141015768, 0.0018768334994092584, 0.00199435418471694, 0.0021118747536092997, 0.0022293953225016594, 0.002346915891394019, 0.0024644366931170225, 0.0025819572620093822, 0.0026994780637323856, 0.0028169986326247454, 0.002934519201517105, 0.0030520400032401085, 0.0031695605721324682, 0.003287081141024828, 0.0034046019427478313, 0.003522122511640191, 0.003639643080532551, 0.003757163882255554, 0.003874684451147914, 0.003992205020040274, 0.004109725821763277, 0.0042272466234862804, 0.0043447669595479965, 0.004462287761271, 0.004579808562994003, 0.004697329364717007, 0.004814849700778723, 0.004932370502501726, 0.005049890838563442, 0.005167411640286446, 0.005284931976348162, 0.005402452778071165, 0.0055199735797941685, 0.0056374939158558846, 0.005755014717578888, 0.005872535519301891, 0.005990056321024895]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 5.0, 10.0, 5.0, 8.0, 6.0, 11.0, 10.0, 10.0, 14.0, 17.0, 22.0, 26.0, 22.0, 21.0, 35.0, 27.0, 34.0, 36.0, 29.0, 42.0, 44.0, 43.0, 41.0, 45.0, 49.0, 26.0, 48.0, 37.0, 38.0, 29.0, 25.0, 30.0, 19.0, 21.0, 20.0, 22.0, 12.0, 12.0, 9.0, 10.0, 7.0, 8.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 5.0, 3.0], "bins": [-0.0005950927734375, -0.000578789971768856, -0.0005624871701002121, -0.0005461843684315681, -0.0005298815667629242, -0.0005135787650942802, -0.0004972759634256363, -0.00048097316175699234, -0.0004646703600883484, -0.00044836755841970444, -0.0004320647567510605, -0.00041576195508241653, -0.0003994591534137726, -0.00038315635174512863, -0.0003668535500764847, -0.00035055074840784073, -0.0003342479467391968, -0.0003179451450705528, -0.0003016423434019089, -0.0002853395417332649, -0.00026903674006462097, -0.000252733938395977, -0.00023643113672733307, -0.00022012833505868912, -0.00020382553339004517, -0.00018752273172140121, -0.00017121993005275726, -0.0001549171283841133, -0.00013861432671546936, -0.0001223115250468254, -0.00010600872337818146, -8.97059217095375e-05, -7.340312004089355e-05, -5.71003183722496e-05, -4.079751670360565e-05, -2.44947150349617e-05, -8.191913366317749e-06, 8.110888302326202e-06, 2.4413689970970154e-05, 4.0716491639614105e-05, 5.701929330825806e-05, 7.332209497690201e-05, 8.962489664554596e-05, 0.00010592769831418991, 0.00012223049998283386, 0.00013853330165147781, 0.00015483610332012177, 0.00017113890498876572, 0.00018744170665740967, 0.00020374450832605362, 0.00022004730999469757, 0.00023635011166334152, 0.0002526529133319855, 0.0002689557150006294, 0.0002852585166692734, 0.00030156131833791733, 0.0003178641200065613, 0.00033416692167520523, 0.0003504697233438492, 0.00036677252501249313, 0.0003830753266811371, 0.00039937812834978104, 0.000415680930018425, 0.00043198373168706894, 0.0004482865333557129]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 2.0, 10.0, 14.0, 12.0, 17.0, 22.0, 20.0, 33.0, 34.0, 28.0, 40.0, 38.0, 39.0, 51.0, 44.0, 40.0, 37.0, 60.0, 50.0, 37.0, 45.0, 37.0, 29.0, 23.0, 26.0, 19.0, 31.0, 34.0, 21.0, 18.0, 16.0, 14.0, 9.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.17108154296875, -5.9593505859375, -5.74761962890625, -5.535888671875, -5.32415771484375, -5.1124267578125, -4.90069580078125, -4.68896484375, -4.47723388671875, -4.2655029296875, -4.05377197265625, -3.842041015625, -3.63031005859375, -3.4185791015625, -3.20684814453125, -2.9951171875, -2.78338623046875, -2.5716552734375, -2.35992431640625, -2.148193359375, -1.93646240234375, -1.7247314453125, -1.51300048828125, -1.30126953125, -1.08953857421875, -0.8778076171875, -0.66607666015625, -0.454345703125, -0.24261474609375, -0.0308837890625, 0.18084716796875, 0.392578125, 0.60430908203125, 0.8160400390625, 1.02777099609375, 1.239501953125, 1.45123291015625, 1.6629638671875, 1.87469482421875, 2.08642578125, 2.29815673828125, 2.5098876953125, 2.72161865234375, 2.933349609375, 3.14508056640625, 3.3568115234375, 3.56854248046875, 3.7802734375, 3.99200439453125, 4.2037353515625, 4.41546630859375, 4.627197265625, 4.83892822265625, 5.0506591796875, 5.26239013671875, 5.47412109375, 5.68585205078125, 5.8975830078125, 6.10931396484375, 6.321044921875, 6.53277587890625, 6.7445068359375, 6.95623779296875, 7.16796875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 12.0, 14.0, 17.0, 25.0, 27.0, 42.0, 67.0, 98.0, 111.0, 175.0, 234.0, 410.0, 800.0, 2271.0, 10916.0, 69620.0, 528707.0, 376957.0, 46629.0, 7834.0, 1683.0, 696.0, 381.0, 209.0, 165.0, 114.0, 78.0, 62.0, 44.0, 32.0, 29.0, 20.0, 18.0, 15.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.4609375, -11.07763671875, -10.6943359375, -10.31103515625, -9.927734375, -9.54443359375, -9.1611328125, -8.77783203125, -8.39453125, -8.01123046875, -7.6279296875, -7.24462890625, -6.861328125, -6.47802734375, -6.0947265625, -5.71142578125, -5.328125, -4.94482421875, -4.5615234375, -4.17822265625, -3.794921875, -3.41162109375, -3.0283203125, -2.64501953125, -2.26171875, -1.87841796875, -1.4951171875, -1.11181640625, -0.728515625, -0.34521484375, 0.0380859375, 0.42138671875, 0.8046875, 1.18798828125, 1.5712890625, 1.95458984375, 2.337890625, 2.72119140625, 3.1044921875, 3.48779296875, 3.87109375, 4.25439453125, 4.6376953125, 5.02099609375, 5.404296875, 5.78759765625, 6.1708984375, 6.55419921875, 6.9375, 7.32080078125, 7.7041015625, 8.08740234375, 8.470703125, 8.85400390625, 9.2373046875, 9.62060546875, 10.00390625, 10.38720703125, 10.7705078125, 11.15380859375, 11.537109375, 11.92041015625, 12.3037109375, 12.68701171875, 13.0703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 7.0, 8.0, 20.0, 12.0, 13.0, 24.0, 18.0, 29.0, 31.0, 33.0, 41.0, 41.0, 42.0, 56.0, 67.0, 117.0, 251.0, 1464.0, 209.0, 77.0, 72.0, 50.0, 47.0, 44.0, 34.0, 26.0, 32.0, 23.0, 29.0, 19.0, 13.0, 13.0, 12.0, 8.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.65625, -20.01953125, -19.3828125, -18.74609375, -18.109375, -17.47265625, -16.8359375, -16.19921875, -15.5625, -14.92578125, -14.2890625, -13.65234375, -13.015625, -12.37890625, -11.7421875, -11.10546875, -10.46875, -9.83203125, -9.1953125, -8.55859375, -7.921875, -7.28515625, -6.6484375, -6.01171875, -5.375, -4.73828125, -4.1015625, -3.46484375, -2.828125, -2.19140625, -1.5546875, -0.91796875, -0.28125, 0.35546875, 0.9921875, 1.62890625, 2.265625, 2.90234375, 3.5390625, 4.17578125, 4.8125, 5.44921875, 6.0859375, 6.72265625, 7.359375, 7.99609375, 8.6328125, 9.26953125, 9.90625, 10.54296875, 11.1796875, 11.81640625, 12.453125, 13.08984375, 13.7265625, 14.36328125, 15.0, 15.63671875, 16.2734375, 16.91015625, 17.546875, 18.18359375, 18.8203125, 19.45703125, 20.09375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 13.0, 10.0, 25.0, 28.0, 53.0, 70.0, 92.0, 189.0, 329.0, 1022.0, 24863.0, 3114130.0, 3589.0, 592.0, 268.0, 137.0, 105.0, 66.0, 40.0, 22.0, 20.0, 9.0, 12.0, 6.0, 9.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.2802734375, -63.435546875, -60.5908203125, -57.74609375, -54.9013671875, -52.056640625, -49.2119140625, -46.3671875, -43.5224609375, -40.677734375, -37.8330078125, -34.98828125, -32.1435546875, -29.298828125, -26.4541015625, -23.609375, -20.7646484375, -17.919921875, -15.0751953125, -12.23046875, -9.3857421875, -6.541015625, -3.6962890625, -0.8515625, 1.9931640625, 4.837890625, 7.6826171875, 10.52734375, 13.3720703125, 16.216796875, 19.0615234375, 21.90625, 24.7509765625, 27.595703125, 30.4404296875, 33.28515625, 36.1298828125, 38.974609375, 41.8193359375, 44.6640625, 47.5087890625, 50.353515625, 53.1982421875, 56.04296875, 58.8876953125, 61.732421875, 64.5771484375, 67.421875, 70.2666015625, 73.111328125, 75.9560546875, 78.80078125, 81.6455078125, 84.490234375, 87.3349609375, 90.1796875, 93.0244140625, 95.869140625, 98.7138671875, 101.55859375, 104.4033203125, 107.248046875, 110.0927734375, 112.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 832.0, 183.0], "bins": [-853.7847290039062, -840.1876831054688, -826.590576171875, -812.9935302734375, -799.3964233398438, -785.7993774414062, -772.2022705078125, -758.605224609375, -745.0081176757812, -731.4110717773438, -717.81396484375, -704.2169189453125, -690.6198120117188, -677.0227661132812, -663.4256591796875, -649.82861328125, -636.2315063476562, -622.6344604492188, -609.037353515625, -595.4403076171875, -581.8432006835938, -568.2461547851562, -554.6490478515625, -541.052001953125, -527.4548950195312, -513.8578491210938, -500.2607421875, -486.6636657714844, -473.06658935546875, -459.4695129394531, -445.8724365234375, -432.2753601074219, -418.6783142089844, -405.08123779296875, -391.4841613769531, -377.8870849609375, -364.2900085449219, -350.69293212890625, -337.0958557128906, -323.498779296875, -309.9017028808594, -296.30462646484375, -282.7075500488281, -269.1104736328125, -255.51339721679688, -241.91632080078125, -228.31924438476562, -214.72216796875, -201.12510681152344, -187.5280303955078, -173.9309539794922, -160.33387756347656, -146.73680114746094, -133.13973999023438, -119.54265594482422, -105.9455795288086, -92.34849548339844, -78.75141906738281, -65.15434265136719, -51.55727005004883, -37.9601936340332, -24.363121032714844, -10.766044616699219, 2.8310317993164062, 16.4281063079834]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 7.0, 12.0, 10.0, 17.0, 19.0, 21.0, 16.0, 25.0, 16.0, 40.0, 31.0, 22.0, 26.0, 36.0, 40.0, 31.0, 30.0, 44.0, 37.0, 32.0, 32.0, 31.0, 37.0, 38.0, 38.0, 24.0, 38.0, 27.0, 23.0, 24.0, 22.0, 22.0, 17.0, 20.0, 16.0, 11.0, 12.0, 9.0, 7.0, 12.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-53.73471450805664, -52.15325164794922, -50.57178497314453, -48.99032211303711, -47.40885925292969, -45.827396392822266, -44.245933532714844, -42.664466857910156, -41.083003997802734, -39.50154113769531, -37.920074462890625, -36.3386116027832, -34.75714874267578, -33.17568588256836, -31.594221115112305, -30.01275634765625, -28.431293487548828, -26.849830627441406, -25.26836585998535, -23.686901092529297, -22.105438232421875, -20.523975372314453, -18.9425106048584, -17.361045837402344, -15.779582977294922, -14.198119163513184, -12.616655349731445, -11.035191535949707, -9.453727722167969, -7.8722639083862305, -6.290800094604492, -4.709336280822754, -3.1278762817382812, -1.546412467956543, 0.03505134582519531, 1.6165151596069336, 3.197978973388672, 4.77944278717041, 6.360906600952148, 7.942370414733887, 9.523834228515625, 11.105298042297363, 12.686761856079102, 14.26822566986084, 15.849689483642578, 17.43115234375, 19.012617111206055, 20.59408187866211, 22.17554473876953, 23.757007598876953, 25.338472366333008, 26.919937133789062, 28.501399993896484, 30.082862854003906, 31.66432762145996, 33.245792388916016, 34.82725524902344, 36.40871810913086, 37.99018096923828, 39.57164764404297, 41.15311050415039, 42.73457336425781, 44.3160400390625, 45.89750289916992, 47.478965759277344]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 9.0, 8.0, 9.0, 13.0, 12.0, 12.0, 13.0, 19.0, 20.0, 34.0, 33.0, 33.0, 29.0, 42.0, 35.0, 61.0, 42.0, 43.0, 47.0, 41.0, 38.0, 34.0, 36.0, 33.0, 38.0, 35.0, 25.0, 27.0, 37.0, 18.0, 18.0, 22.0, 15.0, 13.0, 11.0, 11.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.7279052734375, -6.487060546875, -6.2462158203125, -6.00537109375, -5.7645263671875, -5.523681640625, -5.2828369140625, -5.0419921875, -4.8011474609375, -4.560302734375, -4.3194580078125, -4.07861328125, -3.8377685546875, -3.596923828125, -3.3560791015625, -3.115234375, -2.8743896484375, -2.633544921875, -2.3927001953125, -2.15185546875, -1.9110107421875, -1.670166015625, -1.4293212890625, -1.1884765625, -0.9476318359375, -0.706787109375, -0.4659423828125, -0.22509765625, 0.0157470703125, 0.256591796875, 0.4974365234375, 0.73828125, 0.9791259765625, 1.219970703125, 1.4608154296875, 1.70166015625, 1.9425048828125, 2.183349609375, 2.4241943359375, 2.6650390625, 2.9058837890625, 3.146728515625, 3.3875732421875, 3.62841796875, 3.8692626953125, 4.110107421875, 4.3509521484375, 4.591796875, 4.8326416015625, 5.073486328125, 5.3143310546875, 5.55517578125, 5.7960205078125, 6.036865234375, 6.2777099609375, 6.5185546875, 6.7593994140625, 7.000244140625, 7.2410888671875, 7.48193359375, 7.7227783203125, 7.963623046875, 8.2044677734375, 8.4453125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 8.0, 9.0, 3.0, 12.0, 8.0, 8.0, 14.0, 15.0, 27.0, 23.0, 37.0, 53.0, 47.0, 67.0, 86.0, 166.0, 336.0, 784.0, 5017.0, 211689.0, 3032186.0, 924522.0, 16591.0, 1428.0, 436.0, 209.0, 108.0, 82.0, 55.0, 52.0, 42.0, 37.0, 25.0, 9.0, 21.0, 10.0, 18.0, 11.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.328125, -16.724365234375, -16.12060546875, -15.516845703125, -14.9130859375, -14.309326171875, -13.70556640625, -13.101806640625, -12.498046875, -11.894287109375, -11.29052734375, -10.686767578125, -10.0830078125, -9.479248046875, -8.87548828125, -8.271728515625, -7.66796875, -7.064208984375, -6.46044921875, -5.856689453125, -5.2529296875, -4.649169921875, -4.04541015625, -3.441650390625, -2.837890625, -2.234130859375, -1.63037109375, -1.026611328125, -0.4228515625, 0.180908203125, 0.78466796875, 1.388427734375, 1.9921875, 2.595947265625, 3.19970703125, 3.803466796875, 4.4072265625, 5.010986328125, 5.61474609375, 6.218505859375, 6.822265625, 7.426025390625, 8.02978515625, 8.633544921875, 9.2373046875, 9.841064453125, 10.44482421875, 11.048583984375, 11.65234375, 12.256103515625, 12.85986328125, 13.463623046875, 14.0673828125, 14.671142578125, 15.27490234375, 15.878662109375, 16.482421875, 17.086181640625, 17.68994140625, 18.293701171875, 18.8974609375, 19.501220703125, 20.10498046875, 20.708740234375, 21.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 5.0, 13.0, 5.0, 13.0, 20.0, 22.0, 34.0, 49.0, 100.0, 155.0, 282.0, 427.0, 652.0, 781.0, 614.0, 378.0, 198.0, 127.0, 70.0, 51.0, 28.0, 20.0, 8.0, 2.0, 2.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.42578125, -12.8984375, -12.37109375, -11.84375, -11.31640625, -10.7890625, -10.26171875, -9.734375, -9.20703125, -8.6796875, -8.15234375, -7.625, -7.09765625, -6.5703125, -6.04296875, -5.515625, -4.98828125, -4.4609375, -3.93359375, -3.40625, -2.87890625, -2.3515625, -1.82421875, -1.296875, -0.76953125, -0.2421875, 0.28515625, 0.8125, 1.33984375, 1.8671875, 2.39453125, 2.921875, 3.44921875, 3.9765625, 4.50390625, 5.03125, 5.55859375, 6.0859375, 6.61328125, 7.140625, 7.66796875, 8.1953125, 8.72265625, 9.25, 9.77734375, 10.3046875, 10.83203125, 11.359375, 11.88671875, 12.4140625, 12.94140625, 13.46875, 13.99609375, 14.5234375, 15.05078125, 15.578125, 16.10546875, 16.6328125, 17.16015625, 17.6875, 18.21484375, 18.7421875, 19.26953125, 19.796875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 10.0, 11.0, 11.0, 19.0, 35.0, 54.0, 64.0, 105.0, 164.0, 252.0, 404.0, 907.0, 3942.0, 162808.0, 3978742.0, 42402.0, 2465.0, 812.0, 397.0, 231.0, 145.0, 86.0, 68.0, 35.0, 31.0, 27.0, 16.0, 17.0, 6.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-49.46875, -48.1796875, -46.890625, -45.6015625, -44.3125, -43.0234375, -41.734375, -40.4453125, -39.15625, -37.8671875, -36.578125, -35.2890625, -34.0, -32.7109375, -31.421875, -30.1328125, -28.84375, -27.5546875, -26.265625, -24.9765625, -23.6875, -22.3984375, -21.109375, -19.8203125, -18.53125, -17.2421875, -15.953125, -14.6640625, -13.375, -12.0859375, -10.796875, -9.5078125, -8.21875, -6.9296875, -5.640625, -4.3515625, -3.0625, -1.7734375, -0.484375, 0.8046875, 2.09375, 3.3828125, 4.671875, 5.9609375, 7.25, 8.5390625, 9.828125, 11.1171875, 12.40625, 13.6953125, 14.984375, 16.2734375, 17.5625, 18.8515625, 20.140625, 21.4296875, 22.71875, 24.0078125, 25.296875, 26.5859375, 27.875, 29.1640625, 30.453125, 31.7421875, 33.03125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 15.0, 64.0, 180.0, 316.0, 280.0, 116.0, 28.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.09215545654297, -77.01634216308594, -73.9405288696289, -70.86471557617188, -67.78890228271484, -64.71308898925781, -61.63727569580078, -58.56146240234375, -55.48564910888672, -52.40983581542969, -49.334022521972656, -46.258209228515625, -43.182395935058594, -40.10658264160156, -37.03076934814453, -33.9549560546875, -30.879138946533203, -27.803325653076172, -24.72751235961914, -21.65169906616211, -18.575885772705078, -15.50007152557373, -12.424257278442383, -9.348443984985352, -6.27263069152832, -3.19681715965271, -0.12100362777709961, 2.95481014251709, 6.030623435974121, 9.106436729431152, 12.1822509765625, 15.258064270019531, 18.333877563476562, 21.409690856933594, 24.485504150390625, 27.561317443847656, 30.637130737304688, 33.71294403076172, 36.78875732421875, 39.86457061767578, 42.94038391113281, 46.016197204589844, 49.092010498046875, 52.167823791503906, 55.24363708496094, 58.31945037841797, 61.395263671875, 64.47107696533203, 67.54689025878906, 70.6227035522461, 73.69851684570312, 76.77433013916016, 79.85014343261719, 82.92595672607422, 86.00177001953125, 89.07758331298828, 92.15340423583984, 95.22921752929688, 98.3050308227539, 101.38084411621094, 104.45665740966797, 107.532470703125, 110.60828399658203, 113.68409729003906, 116.7599105834961]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 6.0, 16.0, 11.0, 12.0, 13.0, 20.0, 15.0, 18.0, 23.0, 29.0, 23.0, 27.0, 26.0, 29.0, 29.0, 36.0, 32.0, 30.0, 36.0, 31.0, 41.0, 44.0, 37.0, 47.0, 29.0, 27.0, 32.0, 23.0, 30.0, 33.0, 25.0, 11.0, 16.0, 18.0, 13.0, 14.0, 14.0, 12.0, 18.0, 5.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-33.84520721435547, -32.7781982421875, -31.711193084716797, -30.64418601989746, -29.577178955078125, -28.510169982910156, -27.44316291809082, -26.376155853271484, -25.30914878845215, -24.242141723632812, -23.175134658813477, -22.10812759399414, -21.041118621826172, -19.97411346435547, -18.9071044921875, -17.840097427368164, -16.773090362548828, -15.706083297729492, -14.639076232910156, -13.572068214416504, -12.505061149597168, -11.438054084777832, -10.37104606628418, -9.304039001464844, -8.237031936645508, -7.170024871826172, -6.103017330169678, -5.036009788513184, -3.9690027236938477, -2.9019956588745117, -1.8349881172180176, -0.7679805755615234, 0.2990264892578125, 1.3660337924957275, 2.4330410957336426, 3.5000483989715576, 4.567055702209473, 5.634062767028809, 6.701070308685303, 7.768077850341797, 8.835084915161133, 9.902091979980469, 10.969099044799805, 12.036107063293457, 13.103114128112793, 14.170121192932129, 15.237129211425781, 16.304136276245117, 17.371143341064453, 18.43815040588379, 19.505157470703125, 20.57216453552246, 21.639171600341797, 22.706180572509766, 23.7731876373291, 24.840194702148438, 25.907201766967773, 26.97420883178711, 28.041215896606445, 29.10822296142578, 30.17523193359375, 31.242237091064453, 32.30924606323242, 33.376251220703125, 34.443260192871094]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 5.0, 3.0, 10.0, 9.0, 11.0, 10.0, 14.0, 25.0, 19.0, 21.0, 34.0, 26.0, 29.0, 40.0, 40.0, 37.0, 46.0, 39.0, 49.0, 45.0, 47.0, 39.0, 32.0, 39.0, 40.0, 44.0, 31.0, 30.0, 21.0, 31.0, 19.0, 14.0, 12.0, 16.0, 12.0, 10.0, 8.0, 7.0, 4.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.65362548828125, -6.4283447265625, -6.20306396484375, -5.977783203125, -5.75250244140625, -5.5272216796875, -5.30194091796875, -5.07666015625, -4.85137939453125, -4.6260986328125, -4.40081787109375, -4.175537109375, -3.95025634765625, -3.7249755859375, -3.49969482421875, -3.2744140625, -3.04913330078125, -2.8238525390625, -2.59857177734375, -2.373291015625, -2.14801025390625, -1.9227294921875, -1.69744873046875, -1.47216796875, -1.24688720703125, -1.0216064453125, -0.79632568359375, -0.571044921875, -0.34576416015625, -0.1204833984375, 0.10479736328125, 0.330078125, 0.55535888671875, 0.7806396484375, 1.00592041015625, 1.231201171875, 1.45648193359375, 1.6817626953125, 1.90704345703125, 2.13232421875, 2.35760498046875, 2.5828857421875, 2.80816650390625, 3.033447265625, 3.25872802734375, 3.4840087890625, 3.70928955078125, 3.9345703125, 4.15985107421875, 4.3851318359375, 4.61041259765625, 4.835693359375, 5.06097412109375, 5.2862548828125, 5.51153564453125, 5.73681640625, 5.96209716796875, 6.1873779296875, 6.41265869140625, 6.637939453125, 6.86322021484375, 7.0885009765625, 7.31378173828125, 7.5390625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 6.0, 19.0, 22.0, 40.0, 48.0, 53.0, 100.0, 149.0, 222.0, 289.0, 460.0, 577.0, 830.0, 1290.0, 1873.0, 2711.0, 4038.0, 6106.0, 9394.0, 14479.0, 22790.0, 37032.0, 62544.0, 110818.0, 286686.0, 232479.0, 100364.0, 57500.0, 34466.0, 21193.0, 13511.0, 8692.0, 5794.0, 3610.0, 2679.0, 1766.0, 1182.0, 811.0, 593.0, 405.0, 285.0, 203.0, 142.0, 96.0, 75.0, 41.0, 31.0, 18.0, 15.0, 14.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.6396484375, -1.58984375, -1.5400390625, -1.490234375, -1.4404296875, -1.390625, -1.3408203125, -1.291015625, -1.2412109375, -1.19140625, -1.1416015625, -1.091796875, -1.0419921875, -0.9921875, -0.9423828125, -0.892578125, -0.8427734375, -0.79296875, -0.7431640625, -0.693359375, -0.6435546875, -0.59375, -0.5439453125, -0.494140625, -0.4443359375, -0.39453125, -0.3447265625, -0.294921875, -0.2451171875, -0.1953125, -0.1455078125, -0.095703125, -0.0458984375, 0.00390625, 0.0537109375, 0.103515625, 0.1533203125, 0.203125, 0.2529296875, 0.302734375, 0.3525390625, 0.40234375, 0.4521484375, 0.501953125, 0.5517578125, 0.6015625, 0.6513671875, 0.701171875, 0.7509765625, 0.80078125, 0.8505859375, 0.900390625, 0.9501953125, 1.0, 1.0498046875, 1.099609375, 1.1494140625, 1.19921875, 1.2490234375, 1.298828125, 1.3486328125, 1.3984375, 1.4482421875, 1.498046875, 1.5478515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 0.0, 7.0, 9.0, 9.0, 18.0, 14.0, 16.0, 23.0, 14.0, 25.0, 24.0, 40.0, 36.0, 25.0, 29.0, 46.0, 40.0, 36.0, 35.0, 465.0, 642.0, 34.0, 40.0, 39.0, 46.0, 37.0, 23.0, 31.0, 32.0, 30.0, 29.0, 16.0, 16.0, 14.0, 21.0, 14.0, 6.0, 5.0, 6.0, 5.0, 5.0, 7.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-4.921875, -4.78125, -4.640625, -4.5, -4.359375, -4.21875, -4.078125, -3.9375, -3.796875, -3.65625, -3.515625, -3.375, -3.234375, -3.09375, -2.953125, -2.8125, -2.671875, -2.53125, -2.390625, -2.25, -2.109375, -1.96875, -1.828125, -1.6875, -1.546875, -1.40625, -1.265625, -1.125, -0.984375, -0.84375, -0.703125, -0.5625, -0.421875, -0.28125, -0.140625, 0.0, 0.140625, 0.28125, 0.421875, 0.5625, 0.703125, 0.84375, 0.984375, 1.125, 1.265625, 1.40625, 1.546875, 1.6875, 1.828125, 1.96875, 2.109375, 2.25, 2.390625, 2.53125, 2.671875, 2.8125, 2.953125, 3.09375, 3.234375, 3.375, 3.515625, 3.65625, 3.796875, 3.9375, 4.078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 2.0, 6.0, 2.0, 8.0, 17.0, 20.0, 38.0, 28.0, 76.0, 121.0, 125.0, 229.0, 293.0, 467.0, 664.0, 1007.0, 1517.0, 2360.0, 3930.0, 6286.0, 10223.0, 17186.0, 29913.0, 52129.0, 95758.0, 210445.0, 1389428.0, 121070.0, 64517.0, 35947.0, 20697.0, 12346.0, 7352.0, 4636.0, 2893.0, 1878.0, 1211.0, 789.0, 554.0, 324.0, 194.0, 128.0, 90.0, 83.0, 40.0, 31.0, 24.0, 17.0, 12.0, 12.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.66015625, -1.6032562255859375, -1.546356201171875, -1.4894561767578125, -1.43255615234375, -1.3756561279296875, -1.318756103515625, -1.2618560791015625, -1.2049560546875, -1.1480560302734375, -1.091156005859375, -1.0342559814453125, -0.97735595703125, -0.9204559326171875, -0.863555908203125, -0.8066558837890625, -0.749755859375, -0.6928558349609375, -0.635955810546875, -0.5790557861328125, -0.52215576171875, -0.4652557373046875, -0.408355712890625, -0.3514556884765625, -0.2945556640625, -0.2376556396484375, -0.180755615234375, -0.1238555908203125, -0.06695556640625, -0.0100555419921875, 0.046844482421875, 0.1037445068359375, 0.16064453125, 0.2175445556640625, 0.274444580078125, 0.3313446044921875, 0.38824462890625, 0.4451446533203125, 0.502044677734375, 0.5589447021484375, 0.6158447265625, 0.6727447509765625, 0.729644775390625, 0.7865447998046875, 0.84344482421875, 0.9003448486328125, 0.957244873046875, 1.0141448974609375, 1.071044921875, 1.1279449462890625, 1.184844970703125, 1.2417449951171875, 1.29864501953125, 1.3555450439453125, 1.412445068359375, 1.4693450927734375, 1.5262451171875, 1.5831451416015625, 1.640045166015625, 1.6969451904296875, 1.75384521484375, 1.8107452392578125, 1.867645263671875, 1.9245452880859375, 1.9814453125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 12.0, 12.0, 15.0, 21.0, 14.0, 15.0, 32.0, 43.0, 50.0, 96.0, 125.0, 131.0, 108.0, 96.0, 50.0, 48.0, 29.0, 24.0, 19.0, 9.0, 12.0, 11.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016145706176757812, -0.0015532523393630981, -0.001491934061050415, -0.001430615782737732, -0.0013692975044250488, -0.0013079792261123657, -0.0012466609477996826, -0.0011853426694869995, -0.0011240243911743164, -0.0010627061128616333, -0.0010013878345489502, -0.0009400695562362671, -0.000878751277923584, -0.0008174329996109009, -0.0007561147212982178, -0.0006947964429855347, -0.0006334781646728516, -0.0005721598863601685, -0.0005108416080474854, -0.00044952332973480225, -0.00038820505142211914, -0.00032688677310943604, -0.00026556849479675293, -0.00020425021648406982, -0.00014293193817138672, -8.161365985870361e-05, -2.0295381546020508e-05, 4.10228967666626e-05, 0.0001023411750793457, 0.0001636594533920288, 0.00022497773170471191, 0.000286296010017395, 0.0003476142883300781, 0.00040893256664276123, 0.00047025084495544434, 0.0005315691232681274, 0.0005928874015808105, 0.0006542056798934937, 0.0007155239582061768, 0.0007768422365188599, 0.000838160514831543, 0.0008994787931442261, 0.0009607970714569092, 0.0010221153497695923, 0.0010834336280822754, 0.0011447519063949585, 0.0012060701847076416, 0.0012673884630203247, 0.0013287067413330078, 0.001390025019645691, 0.001451343297958374, 0.0015126615762710571, 0.0015739798545837402, 0.0016352981328964233, 0.0016966164112091064, 0.0017579346895217896, 0.0018192529678344727, 0.0018805712461471558, 0.0019418895244598389, 0.002003207802772522, 0.002064526081085205, 0.002125844359397888, 0.0021871626377105713, 0.0022484809160232544, 0.0023097991943359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 1.0, 3.0, 11.0, 10.0, 15.0, 19.0, 32.0, 43.0, 54.0, 94.0, 170.0, 306.0, 672.0, 8698.0, 1035797.0, 1539.0, 470.0, 238.0, 109.0, 62.0, 42.0, 39.0, 38.0, 25.0, 22.0, 11.0, 13.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.046722412109375, -0.045502662658691406, -0.04428291320800781, -0.04306316375732422, -0.041843414306640625, -0.04062366485595703, -0.03940391540527344, -0.038184165954589844, -0.03696441650390625, -0.035744667053222656, -0.03452491760253906, -0.03330516815185547, -0.032085418701171875, -0.03086566925048828, -0.029645919799804688, -0.028426170349121094, -0.0272064208984375, -0.025986671447753906, -0.024766921997070312, -0.02354717254638672, -0.022327423095703125, -0.02110767364501953, -0.019887924194335938, -0.018668174743652344, -0.01744842529296875, -0.016228675842285156, -0.015008926391601562, -0.013789176940917969, -0.012569427490234375, -0.011349678039550781, -0.010129928588867188, -0.008910179138183594, -0.0076904296875, -0.006470680236816406, -0.0052509307861328125, -0.004031181335449219, -0.002811431884765625, -0.0015916824340820312, -0.0003719329833984375, 0.0008478164672851562, 0.00206756591796875, 0.0032873153686523438, 0.0045070648193359375, 0.005726814270019531, 0.006946563720703125, 0.008166313171386719, 0.009386062622070312, 0.010605812072753906, 0.0118255615234375, 0.013045310974121094, 0.014265060424804688, 0.015484809875488281, 0.016704559326171875, 0.01792430877685547, 0.019144058227539062, 0.020363807678222656, 0.02158355712890625, 0.022803306579589844, 0.024023056030273438, 0.02524280548095703, 0.026462554931640625, 0.02768230438232422, 0.028902053833007812, 0.030121803283691406, 0.031341552734375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 96.0, 387.0, 414.0, 95.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0034516933374106884, -0.003369476180523634, -0.003287258790805936, -0.0032050416339188814, -0.003122824477031827, -0.003040607087314129, -0.0029583899304270744, -0.00287617277354002, -0.0027939556166529655, -0.002711738459765911, -0.002629521070048213, -0.0025473039131611586, -0.002465086756274104, -0.002382869366556406, -0.0023006522096693516, -0.002218435052782297, -0.002136217663064599, -0.0020540005061775446, -0.0019717831164598465, -0.001889565959572792, -0.0018073488026857376, -0.0017251315293833613, -0.001642914256080985, -0.0015606970991939306, -0.0014784798258915544, -0.001396262552589178, -0.0013140453957021236, -0.0012318281223997474, -0.001149610849097371, -0.0010673936922103167, -0.0009851764189079404, -0.000902959203813225, -0.000820741755887866, -0.0007385245407931507, -0.0006563073256984353, -0.000574090052396059, -0.0004918728373013437, -0.0004096556222066283, -0.00032743834890425205, -0.0002452211338095367, -0.00016300391871482134, -8.078668906819075e-05, 1.4305405784398317e-06, 8.364778477698565e-05, 0.000165864999871701, 0.00024808221496641636, 0.00033029948826879263, 0.000412516703363508, 0.0004947339184582233, 0.0005769511335529387, 0.0006591683486476541, 0.0007413856219500303, 0.0008236028370447457, 0.000905820052139461, 0.0009880373254418373, 0.0010702544823288918, 0.001152471755631268, 0.0012346890289336443, 0.0013169061858206987, 0.001399123459123075, 0.0014813407324254513, 0.0015635578893125057, 0.001645775162614882, 0.0017279924359172583, 0.0018102095928043127]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 3.0, 4.0, 6.0, 14.0, 14.0, 12.0, 18.0, 19.0, 15.0, 32.0, 20.0, 22.0, 31.0, 31.0, 32.0, 48.0, 43.0, 42.0, 35.0, 41.0, 37.0, 45.0, 38.0, 43.0, 38.0, 42.0, 34.0, 28.0, 29.0, 28.0, 24.0, 20.0, 12.0, 26.0, 16.0, 16.0, 7.0, 5.0, 9.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005869865417480469, -0.0005651433020830154, -0.000543300062417984, -0.0005214568227529526, -0.0004996135830879211, -0.0004777703434228897, -0.0004559271037578583, -0.00043408386409282684, -0.0004122406244277954, -0.000390397384762764, -0.00036855414509773254, -0.0003467109054327011, -0.0003248676657676697, -0.00030302442610263824, -0.0002811811864376068, -0.0002593379467725754, -0.00023749470710754395, -0.0002156514674425125, -0.00019380822777748108, -0.00017196498811244965, -0.0001501217484474182, -0.00012827850878238678, -0.00010643526911735535, -8.459202945232391e-05, -6.274878978729248e-05, -4.090555012226105e-05, -1.9062310457229614e-05, 2.780929207801819e-06, 2.4624168872833252e-05, 4.6467408537864685e-05, 6.831064820289612e-05, 9.015388786792755e-05, 0.00011199712753295898, 0.00013384036719799042, 0.00015568360686302185, 0.00017752684652805328, 0.00019937008619308472, 0.00022121332585811615, 0.00024305656552314758, 0.000264899805188179, 0.00028674304485321045, 0.0003085862845182419, 0.0003304295241832733, 0.00035227276384830475, 0.0003741160035133362, 0.0003959592431783676, 0.00041780248284339905, 0.0004396457225084305, 0.0004614889621734619, 0.00048333220183849335, 0.0005051754415035248, 0.0005270186811685562, 0.0005488619208335876, 0.0005707051604986191, 0.0005925484001636505, 0.000614391639828682, 0.0006362348794937134, 0.0006580781191587448, 0.0006799213588237762, 0.0007017645984888077, 0.0007236078381538391, 0.0007454510778188705, 0.000767294317483902, 0.0007891375571489334, 0.0008109807968139648]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 5.0, 3.0, 10.0, 9.0, 11.0, 10.0, 14.0, 25.0, 19.0, 21.0, 34.0, 26.0, 29.0, 40.0, 40.0, 37.0, 46.0, 39.0, 49.0, 45.0, 47.0, 39.0, 32.0, 39.0, 40.0, 44.0, 31.0, 30.0, 21.0, 31.0, 19.0, 14.0, 12.0, 16.0, 12.0, 10.0, 8.0, 7.0, 4.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.65362548828125, -6.4283447265625, -6.20306396484375, -5.977783203125, -5.75250244140625, -5.5272216796875, -5.30194091796875, -5.07666015625, -4.85137939453125, -4.6260986328125, -4.40081787109375, -4.175537109375, -3.95025634765625, -3.7249755859375, -3.49969482421875, -3.2744140625, -3.04913330078125, -2.8238525390625, -2.59857177734375, -2.373291015625, -2.14801025390625, -1.9227294921875, -1.69744873046875, -1.47216796875, -1.24688720703125, -1.0216064453125, -0.79632568359375, -0.571044921875, -0.34576416015625, -0.1204833984375, 0.10479736328125, 0.330078125, 0.55535888671875, 0.7806396484375, 1.00592041015625, 1.231201171875, 1.45648193359375, 1.6817626953125, 1.90704345703125, 2.13232421875, 2.35760498046875, 2.5828857421875, 2.80816650390625, 3.033447265625, 3.25872802734375, 3.4840087890625, 3.70928955078125, 3.9345703125, 4.15985107421875, 4.3851318359375, 4.61041259765625, 4.835693359375, 5.06097412109375, 5.2862548828125, 5.51153564453125, 5.73681640625, 5.96209716796875, 6.1873779296875, 6.41265869140625, 6.637939453125, 6.86322021484375, 7.0885009765625, 7.31378173828125, 7.5390625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 11.0, 19.0, 25.0, 27.0, 33.0, 49.0, 94.0, 97.0, 127.0, 165.0, 234.0, 321.0, 419.0, 548.0, 899.0, 2399.0, 13112.0, 139340.0, 812823.0, 65569.0, 7716.0, 1712.0, 764.0, 516.0, 380.0, 272.0, 205.0, 140.0, 144.0, 102.0, 57.0, 55.0, 40.0, 29.0, 22.0, 17.0, 8.0, 10.0, 6.0, 5.0, 5.0, 6.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.953125, -16.394775390625, -15.83642578125, -15.278076171875, -14.7197265625, -14.161376953125, -13.60302734375, -13.044677734375, -12.486328125, -11.927978515625, -11.36962890625, -10.811279296875, -10.2529296875, -9.694580078125, -9.13623046875, -8.577880859375, -8.01953125, -7.461181640625, -6.90283203125, -6.344482421875, -5.7861328125, -5.227783203125, -4.66943359375, -4.111083984375, -3.552734375, -2.994384765625, -2.43603515625, -1.877685546875, -1.3193359375, -0.760986328125, -0.20263671875, 0.355712890625, 0.9140625, 1.472412109375, 2.03076171875, 2.589111328125, 3.1474609375, 3.705810546875, 4.26416015625, 4.822509765625, 5.380859375, 5.939208984375, 6.49755859375, 7.055908203125, 7.6142578125, 8.172607421875, 8.73095703125, 9.289306640625, 9.84765625, 10.406005859375, 10.96435546875, 11.522705078125, 12.0810546875, 12.639404296875, 13.19775390625, 13.756103515625, 14.314453125, 14.872802734375, 15.43115234375, 15.989501953125, 16.5478515625, 17.106201171875, 17.66455078125, 18.222900390625, 18.78125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 4.0, 9.0, 12.0, 16.0, 18.0, 22.0, 19.0, 18.0, 32.0, 40.0, 40.0, 37.0, 47.0, 73.0, 81.0, 331.0, 1643.0, 118.0, 75.0, 59.0, 42.0, 42.0, 28.0, 29.0, 33.0, 31.0, 22.0, 20.0, 19.0, 11.0, 9.0, 10.0, 10.0, 7.0, 1.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0], "bins": [-27.75, -27.024169921875, -26.29833984375, -25.572509765625, -24.8466796875, -24.120849609375, -23.39501953125, -22.669189453125, -21.943359375, -21.217529296875, -20.49169921875, -19.765869140625, -19.0400390625, -18.314208984375, -17.58837890625, -16.862548828125, -16.13671875, -15.410888671875, -14.68505859375, -13.959228515625, -13.2333984375, -12.507568359375, -11.78173828125, -11.055908203125, -10.330078125, -9.604248046875, -8.87841796875, -8.152587890625, -7.4267578125, -6.700927734375, -5.97509765625, -5.249267578125, -4.5234375, -3.797607421875, -3.07177734375, -2.345947265625, -1.6201171875, -0.894287109375, -0.16845703125, 0.557373046875, 1.283203125, 2.009033203125, 2.73486328125, 3.460693359375, 4.1865234375, 4.912353515625, 5.63818359375, 6.364013671875, 7.08984375, 7.815673828125, 8.54150390625, 9.267333984375, 9.9931640625, 10.718994140625, 11.44482421875, 12.170654296875, 12.896484375, 13.622314453125, 14.34814453125, 15.073974609375, 15.7998046875, 16.525634765625, 17.25146484375, 17.977294921875, 18.703125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 9.0, 13.0, 8.0, 14.0, 12.0, 32.0, 32.0, 27.0, 61.0, 37.0, 54.0, 104.0, 182.0, 267.0, 792.0, 4169.0, 2836546.0, 299229.0, 2696.0, 615.0, 225.0, 148.0, 82.0, 61.0, 50.0, 37.0, 29.0, 32.0, 25.0, 12.0, 18.0, 13.0, 7.0, 7.0, 9.0, 9.0, 8.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.03125, -47.13818359375, -45.2451171875, -43.35205078125, -41.458984375, -39.56591796875, -37.6728515625, -35.77978515625, -33.88671875, -31.99365234375, -30.1005859375, -28.20751953125, -26.314453125, -24.42138671875, -22.5283203125, -20.63525390625, -18.7421875, -16.84912109375, -14.9560546875, -13.06298828125, -11.169921875, -9.27685546875, -7.3837890625, -5.49072265625, -3.59765625, -1.70458984375, 0.1884765625, 2.08154296875, 3.974609375, 5.86767578125, 7.7607421875, 9.65380859375, 11.546875, 13.43994140625, 15.3330078125, 17.22607421875, 19.119140625, 21.01220703125, 22.9052734375, 24.79833984375, 26.69140625, 28.58447265625, 30.4775390625, 32.37060546875, 34.263671875, 36.15673828125, 38.0498046875, 39.94287109375, 41.8359375, 43.72900390625, 45.6220703125, 47.51513671875, 49.408203125, 51.30126953125, 53.1943359375, 55.08740234375, 56.98046875, 58.87353515625, 60.7666015625, 62.65966796875, 64.552734375, 66.44580078125, 68.3388671875, 70.23193359375, 72.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 71.0, 221.0, 365.0, 251.0, 85.0, 15.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.70166301727295, -7.986354827880859, -6.2710466384887695, -4.555738925933838, -2.840430736541748, -1.1251230239868164, 0.5901851654052734, 2.3054933547973633, 4.020801544189453, 5.736109733581543, 7.451417922973633, 9.166725158691406, 10.882034301757812, 12.597341537475586, 14.312649726867676, 16.027957916259766, 17.743267059326172, 19.458574295043945, 21.17388343811035, 22.889190673828125, 24.60449981689453, 26.319807052612305, 28.035114288330078, 29.750423431396484, 31.465730667114258, 33.18103790283203, 34.89634704589844, 36.611656188964844, 38.326961517333984, 40.04227066040039, 41.7575798034668, 43.47288513183594, 45.18819808959961, 46.903507232666016, 48.618812561035156, 50.33412170410156, 52.04943084716797, 53.764739990234375, 55.480045318603516, 57.19535446166992, 58.91066360473633, 60.625972747802734, 62.341278076171875, 64.05658721923828, 65.77189636230469, 67.4872055053711, 69.2025146484375, 70.91781616210938, 72.63312530517578, 74.34843444824219, 76.0637435913086, 77.779052734375, 79.49435424804688, 81.20966339111328, 82.92497253417969, 84.6402816772461, 86.3555908203125, 88.0708999633789, 89.78620910644531, 91.50151824951172, 93.2168197631836, 94.93212890625, 96.6474380493164, 98.36274719238281, 100.07805633544922]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 11.0, 5.0, 7.0, 5.0, 13.0, 22.0, 14.0, 22.0, 24.0, 26.0, 23.0, 24.0, 26.0, 25.0, 27.0, 34.0, 37.0, 40.0, 39.0, 43.0, 38.0, 37.0, 36.0, 30.0, 40.0, 37.0, 29.0, 25.0, 34.0, 21.0, 31.0, 14.0, 16.0, 23.0, 12.0, 17.0, 16.0, 13.0, 10.0, 5.0, 7.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-54.41594696044922, -52.89585494995117, -51.37575912475586, -49.85566711425781, -48.3355712890625, -46.81547927856445, -45.295387268066406, -43.775291442871094, -42.25519943237305, -40.735107421875, -39.21501159667969, -37.69491958618164, -36.17482376098633, -34.65473175048828, -33.13463592529297, -31.614543914794922, -30.094449996948242, -28.574356079101562, -27.054262161254883, -25.534168243408203, -24.014076232910156, -22.493982315063477, -20.973888397216797, -19.45379638671875, -17.933700561523438, -16.413606643676758, -14.893513679504395, -13.373419761657715, -11.853326797485352, -10.333232879638672, -8.813138961791992, -7.293045997619629, -5.772953033447266, -4.252859592437744, -2.7327659130096436, -1.212672233581543, 0.3074212074279785, 1.8275146484375, 3.3476085662841797, 4.867701530456543, 6.387795448303223, 7.907888889312744, 9.427982330322266, 10.948076248168945, 12.468170166015625, 13.988263130187988, 15.508357048034668, 17.02845001220703, 18.54854393005371, 20.06863784790039, 21.58873176574707, 23.10882568359375, 24.628917694091797, 26.149011611938477, 27.669105529785156, 29.189197540283203, 30.709293365478516, 32.22938537597656, 33.749481201171875, 35.26957321166992, 36.789669036865234, 38.30976104736328, 39.829856872558594, 41.34994888305664, 42.87004089355469]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 11.0, 11.0, 8.0, 16.0, 16.0, 17.0, 25.0, 30.0, 27.0, 35.0, 30.0, 35.0, 49.0, 52.0, 38.0, 45.0, 48.0, 47.0, 46.0, 47.0, 40.0, 39.0, 31.0, 37.0, 31.0, 33.0, 23.0, 18.0, 20.0, 17.0, 14.0, 14.0, 9.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.5823974609375, -7.328857421875, -7.0753173828125, -6.82177734375, -6.5682373046875, -6.314697265625, -6.0611572265625, -5.8076171875, -5.5540771484375, -5.300537109375, -5.0469970703125, -4.79345703125, -4.5399169921875, -4.286376953125, -4.0328369140625, -3.779296875, -3.5257568359375, -3.272216796875, -3.0186767578125, -2.76513671875, -2.5115966796875, -2.258056640625, -2.0045166015625, -1.7509765625, -1.4974365234375, -1.243896484375, -0.9903564453125, -0.73681640625, -0.4832763671875, -0.229736328125, 0.0238037109375, 0.27734375, 0.5308837890625, 0.784423828125, 1.0379638671875, 1.29150390625, 1.5450439453125, 1.798583984375, 2.0521240234375, 2.3056640625, 2.5592041015625, 2.812744140625, 3.0662841796875, 3.31982421875, 3.5733642578125, 3.826904296875, 4.0804443359375, 4.333984375, 4.5875244140625, 4.841064453125, 5.0946044921875, 5.34814453125, 5.6016845703125, 5.855224609375, 6.1087646484375, 6.3623046875, 6.6158447265625, 6.869384765625, 7.1229248046875, 7.37646484375, 7.6300048828125, 7.883544921875, 8.1370849609375, 8.390625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 4.0, 8.0, 12.0, 14.0, 21.0, 25.0, 28.0, 44.0, 61.0, 75.0, 103.0, 135.0, 173.0, 260.0, 361.0, 717.0, 1927.0, 12659.0, 258445.0, 2465143.0, 1373253.0, 72717.0, 5140.0, 1198.0, 532.0, 352.0, 211.0, 169.0, 106.0, 100.0, 55.0, 75.0, 43.0, 21.0, 19.0, 15.0, 11.0, 7.0, 11.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.140625, -14.649169921875, -14.15771484375, -13.666259765625, -13.1748046875, -12.683349609375, -12.19189453125, -11.700439453125, -11.208984375, -10.717529296875, -10.22607421875, -9.734619140625, -9.2431640625, -8.751708984375, -8.26025390625, -7.768798828125, -7.27734375, -6.785888671875, -6.29443359375, -5.802978515625, -5.3115234375, -4.820068359375, -4.32861328125, -3.837158203125, -3.345703125, -2.854248046875, -2.36279296875, -1.871337890625, -1.3798828125, -0.888427734375, -0.39697265625, 0.094482421875, 0.5859375, 1.077392578125, 1.56884765625, 2.060302734375, 2.5517578125, 3.043212890625, 3.53466796875, 4.026123046875, 4.517578125, 5.009033203125, 5.50048828125, 5.991943359375, 6.4833984375, 6.974853515625, 7.46630859375, 7.957763671875, 8.44921875, 8.940673828125, 9.43212890625, 9.923583984375, 10.4150390625, 10.906494140625, 11.39794921875, 11.889404296875, 12.380859375, 12.872314453125, 13.36376953125, 13.855224609375, 14.3466796875, 14.838134765625, 15.32958984375, 15.821044921875, 16.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 5.0, 10.0, 15.0, 15.0, 40.0, 81.0, 120.0, 237.0, 457.0, 705.0, 750.0, 645.0, 400.0, 242.0, 131.0, 83.0, 48.0, 29.0, 18.0, 7.0, 8.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.85693359375, -17.3076171875, -16.75830078125, -16.208984375, -15.65966796875, -15.1103515625, -14.56103515625, -14.01171875, -13.46240234375, -12.9130859375, -12.36376953125, -11.814453125, -11.26513671875, -10.7158203125, -10.16650390625, -9.6171875, -9.06787109375, -8.5185546875, -7.96923828125, -7.419921875, -6.87060546875, -6.3212890625, -5.77197265625, -5.22265625, -4.67333984375, -4.1240234375, -3.57470703125, -3.025390625, -2.47607421875, -1.9267578125, -1.37744140625, -0.828125, -0.27880859375, 0.2705078125, 0.81982421875, 1.369140625, 1.91845703125, 2.4677734375, 3.01708984375, 3.56640625, 4.11572265625, 4.6650390625, 5.21435546875, 5.763671875, 6.31298828125, 6.8623046875, 7.41162109375, 7.9609375, 8.51025390625, 9.0595703125, 9.60888671875, 10.158203125, 10.70751953125, 11.2568359375, 11.80615234375, 12.35546875, 12.90478515625, 13.4541015625, 14.00341796875, 14.552734375, 15.10205078125, 15.6513671875, 16.20068359375, 16.75]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 11.0, 17.0, 12.0, 23.0, 41.0, 75.0, 108.0, 185.0, 314.0, 773.0, 2473.0, 56099.0, 4059737.0, 70009.0, 2849.0, 802.0, 356.0, 163.0, 92.0, 46.0, 36.0, 13.0, 17.0, 9.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0625, -43.5859375, -42.109375, -40.6328125, -39.15625, -37.6796875, -36.203125, -34.7265625, -33.25, -31.7734375, -30.296875, -28.8203125, -27.34375, -25.8671875, -24.390625, -22.9140625, -21.4375, -19.9609375, -18.484375, -17.0078125, -15.53125, -14.0546875, -12.578125, -11.1015625, -9.625, -8.1484375, -6.671875, -5.1953125, -3.71875, -2.2421875, -0.765625, 0.7109375, 2.1875, 3.6640625, 5.140625, 6.6171875, 8.09375, 9.5703125, 11.046875, 12.5234375, 14.0, 15.4765625, 16.953125, 18.4296875, 19.90625, 21.3828125, 22.859375, 24.3359375, 25.8125, 27.2890625, 28.765625, 30.2421875, 31.71875, 33.1953125, 34.671875, 36.1484375, 37.625, 39.1015625, 40.578125, 42.0546875, 43.53125, 45.0078125, 46.484375, 47.9609375, 49.4375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [11.0, 94.0, 322.0, 421.0, 150.0, 12.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.007353782653809, -9.532444953918457, -5.0575361251831055, -0.5826272964477539, 3.8922815322875977, 8.36719036102295, 12.8420991897583, 17.31700897216797, 21.791915893554688, 26.26682472229004, 30.74173355102539, 35.216644287109375, 39.691551208496094, 44.16645812988281, 48.6413688659668, 53.11627960205078, 57.5911865234375, 62.06609344482422, 66.54100036621094, 71.01591491699219, 75.4908218383789, 79.96572875976562, 84.44064331054688, 88.9155502319336, 93.39045715332031, 97.86536407470703, 102.34027099609375, 106.815185546875, 111.29009246826172, 115.76499938964844, 120.23991394042969, 124.7148208618164, 129.18972778320312, 133.66464233398438, 138.13954162597656, 142.6144561767578, 147.08935546875, 151.56427001953125, 156.0391845703125, 160.5140838623047, 164.98899841308594, 169.4639129638672, 173.93881225585938, 178.41372680664062, 182.88864135742188, 187.36354064941406, 191.8384552001953, 196.3133544921875, 200.78826904296875, 205.26318359375, 209.7380828857422, 214.21299743652344, 218.68789672851562, 223.16281127929688, 227.63772583007812, 232.1126251220703, 236.58753967285156, 241.0624542236328, 245.537353515625, 250.01226806640625, 254.4871826171875, 258.96209716796875, 263.4369812011719, 267.9118957519531, 272.3868103027344]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 1.0, 3.0, 8.0, 9.0, 11.0, 5.0, 16.0, 15.0, 20.0, 15.0, 23.0, 18.0, 27.0, 24.0, 39.0, 39.0, 41.0, 45.0, 43.0, 52.0, 34.0, 37.0, 54.0, 38.0, 30.0, 34.0, 44.0, 28.0, 27.0, 34.0, 34.0, 26.0, 26.0, 17.0, 13.0, 10.0, 14.0, 18.0, 6.0, 10.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.04771423339844, -38.866085052490234, -37.684452056884766, -36.50282287597656, -35.321189880371094, -34.13956069946289, -32.95792770385742, -31.77629852294922, -30.59466552734375, -29.413034439086914, -28.231403350830078, -27.049772262573242, -25.868141174316406, -24.68651008605957, -23.504878997802734, -22.32324981689453, -21.141618728637695, -19.95998764038086, -18.778356552124023, -17.596725463867188, -16.41509437561035, -15.233463287353516, -14.051833152770996, -12.87020206451416, -11.688570976257324, -10.506939888000488, -9.325308799743652, -8.143678665161133, -6.962047100067139, -5.780416011810303, -4.598785400390625, -3.417154312133789, -2.235523223876953, -1.0538922548294067, 0.12773871421813965, 1.3093695640563965, 2.4910006523132324, 3.6726317405700684, 4.854262351989746, 6.035893440246582, 7.217524528503418, 8.399155616760254, 9.58078670501709, 10.76241683959961, 11.944047927856445, 13.125679016113281, 14.307310104370117, 15.488941192626953, 16.67057228088379, 17.852203369140625, 19.03383445739746, 20.215465545654297, 21.397096633911133, 22.57872772216797, 23.760356903076172, 24.94198989868164, 26.123619079589844, 27.30525016784668, 28.486881256103516, 29.66851234436035, 30.850143432617188, 32.03177261352539, 33.21340560913086, 34.39503479003906, 35.57666778564453]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 12.0, 13.0, 8.0, 15.0, 17.0, 15.0, 31.0, 28.0, 44.0, 41.0, 47.0, 34.0, 36.0, 38.0, 47.0, 52.0, 53.0, 38.0, 53.0, 37.0, 45.0, 36.0, 41.0, 27.0, 24.0, 23.0, 25.0, 32.0, 19.0, 9.0, 11.0, 15.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5015869140625, -6.245361328125, -5.9891357421875, -5.73291015625, -5.4766845703125, -5.220458984375, -4.9642333984375, -4.7080078125, -4.4517822265625, -4.195556640625, -3.9393310546875, -3.68310546875, -3.4268798828125, -3.170654296875, -2.9144287109375, -2.658203125, -2.4019775390625, -2.145751953125, -1.8895263671875, -1.63330078125, -1.3770751953125, -1.120849609375, -0.8646240234375, -0.6083984375, -0.3521728515625, -0.095947265625, 0.1602783203125, 0.41650390625, 0.6727294921875, 0.928955078125, 1.1851806640625, 1.44140625, 1.6976318359375, 1.953857421875, 2.2100830078125, 2.46630859375, 2.7225341796875, 2.978759765625, 3.2349853515625, 3.4912109375, 3.7474365234375, 4.003662109375, 4.2598876953125, 4.51611328125, 4.7723388671875, 5.028564453125, 5.2847900390625, 5.541015625, 5.7972412109375, 6.053466796875, 6.3096923828125, 6.56591796875, 6.8221435546875, 7.078369140625, 7.3345947265625, 7.5908203125, 7.8470458984375, 8.103271484375, 8.3594970703125, 8.61572265625, 8.8719482421875, 9.128173828125, 9.3843994140625, 9.640625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 5.0, 4.0, 9.0, 3.0, 10.0, 14.0, 23.0, 37.0, 61.0, 109.0, 164.0, 275.0, 450.0, 738.0, 1140.0, 1921.0, 3089.0, 5185.0, 8344.0, 13368.0, 22409.0, 37621.0, 64792.0, 120038.0, 305346.0, 221386.0, 101796.0, 56419.0, 32765.0, 19789.0, 12076.0, 7426.0, 4566.0, 2740.0, 1702.0, 1027.0, 658.0, 407.0, 246.0, 144.0, 91.0, 58.0, 38.0, 23.0, 16.0, 8.0, 5.0, 7.0, 0.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.771484375, -1.714111328125, -1.65673828125, -1.599365234375, -1.5419921875, -1.484619140625, -1.42724609375, -1.369873046875, -1.3125, -1.255126953125, -1.19775390625, -1.140380859375, -1.0830078125, -1.025634765625, -0.96826171875, -0.910888671875, -0.853515625, -0.796142578125, -0.73876953125, -0.681396484375, -0.6240234375, -0.566650390625, -0.50927734375, -0.451904296875, -0.39453125, -0.337158203125, -0.27978515625, -0.222412109375, -0.1650390625, -0.107666015625, -0.05029296875, 0.007080078125, 0.064453125, 0.121826171875, 0.17919921875, 0.236572265625, 0.2939453125, 0.351318359375, 0.40869140625, 0.466064453125, 0.5234375, 0.580810546875, 0.63818359375, 0.695556640625, 0.7529296875, 0.810302734375, 0.86767578125, 0.925048828125, 0.982421875, 1.039794921875, 1.09716796875, 1.154541015625, 1.2119140625, 1.269287109375, 1.32666015625, 1.384033203125, 1.44140625, 1.498779296875, 1.55615234375, 1.613525390625, 1.6708984375, 1.728271484375, 1.78564453125, 1.843017578125, 1.900390625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 8.0, 8.0, 22.0, 18.0, 13.0, 16.0, 16.0, 25.0, 33.0, 24.0, 20.0, 38.0, 31.0, 41.0, 43.0, 33.0, 42.0, 1066.0, 54.0, 34.0, 45.0, 42.0, 41.0, 24.0, 29.0, 34.0, 25.0, 26.0, 23.0, 30.0, 18.0, 14.0, 11.0, 18.0, 9.0, 5.0, 9.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.23828125, -4.0950927734375, -3.951904296875, -3.8087158203125, -3.66552734375, -3.5223388671875, -3.379150390625, -3.2359619140625, -3.0927734375, -2.9495849609375, -2.806396484375, -2.6632080078125, -2.52001953125, -2.3768310546875, -2.233642578125, -2.0904541015625, -1.947265625, -1.8040771484375, -1.660888671875, -1.5177001953125, -1.37451171875, -1.2313232421875, -1.088134765625, -0.9449462890625, -0.8017578125, -0.6585693359375, -0.515380859375, -0.3721923828125, -0.22900390625, -0.0858154296875, 0.057373046875, 0.2005615234375, 0.34375, 0.4869384765625, 0.630126953125, 0.7733154296875, 0.91650390625, 1.0596923828125, 1.202880859375, 1.3460693359375, 1.4892578125, 1.6324462890625, 1.775634765625, 1.9188232421875, 2.06201171875, 2.2052001953125, 2.348388671875, 2.4915771484375, 2.634765625, 2.7779541015625, 2.921142578125, 3.0643310546875, 3.20751953125, 3.3507080078125, 3.493896484375, 3.6370849609375, 3.7802734375, 3.9234619140625, 4.066650390625, 4.2098388671875, 4.35302734375, 4.4962158203125, 4.639404296875, 4.7825927734375, 4.92578125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 11.0, 12.0, 10.0, 31.0, 30.0, 40.0, 77.0, 89.0, 159.0, 228.0, 370.0, 579.0, 892.0, 1339.0, 2096.0, 3499.0, 5621.0, 9043.0, 15098.0, 25306.0, 43607.0, 78531.0, 160997.0, 1428892.0, 145527.0, 72884.0, 40926.0, 24274.0, 14242.0, 8560.0, 5352.0, 3175.0, 2031.0, 1243.0, 811.0, 533.0, 329.0, 197.0, 172.0, 107.0, 75.0, 41.0, 29.0, 28.0, 12.0, 6.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.9814453125, -1.923919677734375, -1.86639404296875, -1.808868408203125, -1.7513427734375, -1.693817138671875, -1.63629150390625, -1.578765869140625, -1.521240234375, -1.463714599609375, -1.40618896484375, -1.348663330078125, -1.2911376953125, -1.233612060546875, -1.17608642578125, -1.118560791015625, -1.06103515625, -1.003509521484375, -0.94598388671875, -0.888458251953125, -0.8309326171875, -0.773406982421875, -0.71588134765625, -0.658355712890625, -0.600830078125, -0.543304443359375, -0.48577880859375, -0.428253173828125, -0.3707275390625, -0.313201904296875, -0.25567626953125, -0.198150634765625, -0.140625, -0.083099365234375, -0.02557373046875, 0.031951904296875, 0.0894775390625, 0.147003173828125, 0.20452880859375, 0.262054443359375, 0.319580078125, 0.377105712890625, 0.43463134765625, 0.492156982421875, 0.5496826171875, 0.607208251953125, 0.66473388671875, 0.722259521484375, 0.77978515625, 0.837310791015625, 0.89483642578125, 0.952362060546875, 1.0098876953125, 1.067413330078125, 1.12493896484375, 1.182464599609375, 1.239990234375, 1.297515869140625, 1.35504150390625, 1.412567138671875, 1.4700927734375, 1.527618408203125, 1.58514404296875, 1.642669677734375, 1.7001953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 14.0, 10.0, 12.0, 24.0, 24.0, 22.0, 35.0, 29.0, 47.0, 68.0, 67.0, 113.0, 116.0, 95.0, 63.0, 51.0, 38.0, 20.0, 30.0, 21.0, 18.0, 11.0, 13.0, 6.0, 4.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013217926025390625, -0.001272827386856079, -0.0012238621711730957, -0.0011748969554901123, -0.001125931739807129, -0.0010769665241241455, -0.0010280013084411621, -0.0009790360927581787, -0.0009300708770751953, -0.0008811056613922119, -0.0008321404457092285, -0.0007831752300262451, -0.0007342100143432617, -0.0006852447986602783, -0.0006362795829772949, -0.0005873143672943115, -0.0005383491516113281, -0.0004893839359283447, -0.00044041872024536133, -0.00039145350456237793, -0.00034248828887939453, -0.00029352307319641113, -0.00024455785751342773, -0.00019559264183044434, -0.00014662742614746094, -9.766221046447754e-05, -4.869699478149414e-05, 2.682209014892578e-07, 4.9233436584472656e-05, 9.819865226745605e-05, 0.00014716386795043945, 0.00019612908363342285, 0.00024509429931640625, 0.00029405951499938965, 0.00034302473068237305, 0.00039198994636535645, 0.00044095516204833984, 0.0004899203777313232, 0.0005388855934143066, 0.00058785080909729, 0.0006368160247802734, 0.0006857812404632568, 0.0007347464561462402, 0.0007837116718292236, 0.000832676887512207, 0.0008816421031951904, 0.0009306073188781738, 0.0009795725345611572, 0.0010285377502441406, 0.001077502965927124, 0.0011264681816101074, 0.0011754333972930908, 0.0012243986129760742, 0.0012733638286590576, 0.001322329044342041, 0.0013712942600250244, 0.0014202594757080078, 0.0014692246913909912, 0.0015181899070739746, 0.001567155122756958, 0.0016161203384399414, 0.0016650855541229248, 0.0017140507698059082, 0.0017630159854888916, 0.001811981201171875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 8.0, 8.0, 15.0, 23.0, 6.0, 15.0, 24.0, 33.0, 45.0, 65.0, 66.0, 99.0, 151.0, 241.0, 489.0, 1111.0, 160235.0, 883009.0, 1465.0, 552.0, 245.0, 158.0, 102.0, 91.0, 69.0, 42.0, 45.0, 32.0, 22.0, 18.0, 8.0, 9.0, 5.0, 5.0, 7.0, 9.0, 3.0, 2.0, 6.0, 4.0, 2.0, 5.0, 3.0, 4.0], "bins": [-0.03240966796875, -0.03153586387634277, -0.030662059783935547, -0.02978825569152832, -0.028914451599121094, -0.028040647506713867, -0.02716684341430664, -0.026293039321899414, -0.025419235229492188, -0.02454543113708496, -0.023671627044677734, -0.022797822952270508, -0.02192401885986328, -0.021050214767456055, -0.020176410675048828, -0.0193026065826416, -0.018428802490234375, -0.01755499839782715, -0.016681194305419922, -0.015807390213012695, -0.014933586120605469, -0.014059782028198242, -0.013185977935791016, -0.012312173843383789, -0.011438369750976562, -0.010564565658569336, -0.00969076156616211, -0.008816957473754883, -0.007943153381347656, -0.00706934928894043, -0.006195545196533203, -0.0053217411041259766, -0.00444793701171875, -0.0035741329193115234, -0.002700328826904297, -0.0018265247344970703, -0.0009527206420898438, -7.891654968261719e-05, 0.0007948875427246094, 0.001668691635131836, 0.0025424957275390625, 0.003416299819946289, 0.004290103912353516, 0.005163908004760742, 0.006037712097167969, 0.006911516189575195, 0.007785320281982422, 0.008659124374389648, 0.009532928466796875, 0.010406732559204102, 0.011280536651611328, 0.012154340744018555, 0.013028144836425781, 0.013901948928833008, 0.014775753021240234, 0.01564955711364746, 0.016523361206054688, 0.017397165298461914, 0.01827096939086914, 0.019144773483276367, 0.020018577575683594, 0.02089238166809082, 0.021766185760498047, 0.022639989852905273, 0.0235137939453125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 164.0, 494.0, 295.0, 37.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0047285594046115875, -0.004638840910047293, -0.004549122415482998, -0.004459403920918703, -0.004369685426354408, -0.0042799669317901134, -0.004190248437225819, -0.004100529942661524, -0.004010811448097229, -0.003921092953532934, -0.0038313744589686394, -0.0037416559644043446, -0.0036519374698400497, -0.003562218975275755, -0.00347250048071146, -0.0033827819861471653, -0.003293063724413514, -0.0032033452298492193, -0.0031136267352849245, -0.0030239082407206297, -0.002934189746156335, -0.00284447125159204, -0.002754752989858389, -0.002665034495294094, -0.0025753160007297993, -0.0024855975061655045, -0.0023958790116012096, -0.002306160517036915, -0.00221644202247262, -0.002126723527908325, -0.0020370050333440304, -0.0019472866551950574, -0.0018575682770460844, -0.0017678497824817896, -0.0016781312879174948, -0.0015884127933532, -0.0014986942987889051, -0.0014089758042246103, -0.0013192574260756373, -0.0012295389315113425, -0.0011398204369470477, -0.001050101942382753, -0.0009603834478184581, -0.0008706650114618242, -0.0007809465168975294, -0.0006912280223332345, -0.0006015095859766006, -0.0005117910914123058, -0.000422072596848011, -0.0003323541022837162, -0.00024263563682325184, -0.00015291717136278749, -6.319867679849267e-05, 2.6519817765802145e-05, 0.00011623825412243605, 0.00020595674868673086, 0.0002956752432510257, 0.0003853937378153205, 0.00047511220327578485, 0.0005648306687362492, 0.000654549163300544, 0.0007442676578648388, 0.0008339860942214727, 0.0009237045887857676, 0.0010134230833500624]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 5.0, 4.0, 5.0, 10.0, 11.0, 7.0, 14.0, 19.0, 18.0, 21.0, 20.0, 19.0, 28.0, 26.0, 27.0, 47.0, 43.0, 42.0, 38.0, 38.0, 44.0, 31.0, 43.0, 37.0, 43.0, 36.0, 23.0, 30.0, 31.0, 41.0, 27.0, 27.0, 26.0, 14.0, 14.0, 13.0, 17.0, 11.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.0006949305534362793, -0.0006743390113115311, -0.0006537474691867828, -0.0006331559270620346, -0.0006125643849372864, -0.0005919728428125381, -0.0005713813006877899, -0.0005507897585630417, -0.0005301982164382935, -0.0005096066743135452, -0.000489015132188797, -0.00046842359006404877, -0.00044783204793930054, -0.0004272405058145523, -0.0004066489636898041, -0.00038605742156505585, -0.0003654658794403076, -0.0003448743373155594, -0.00032428279519081116, -0.00030369125306606293, -0.0002830997109413147, -0.00026250816881656647, -0.00024191662669181824, -0.00022132508456707, -0.00020073354244232178, -0.00018014200031757355, -0.00015955045819282532, -0.0001389589160680771, -0.00011836737394332886, -9.777583181858063e-05, -7.71842896938324e-05, -5.659274756908417e-05, -3.600120544433594e-05, -1.5409663319587708e-05, 5.1818788051605225e-06, 2.5773420929908752e-05, 4.636496305465698e-05, 6.695650517940521e-05, 8.754804730415344e-05, 0.00010813958942890167, 0.0001287311315536499, 0.00014932267367839813, 0.00016991421580314636, 0.0001905057579278946, 0.00021109730005264282, 0.00023168884217739105, 0.0002522803843021393, 0.0002728719264268875, 0.00029346346855163574, 0.00031405501067638397, 0.0003346465528011322, 0.00035523809492588043, 0.00037582963705062866, 0.0003964211791753769, 0.0004170127213001251, 0.00043760426342487335, 0.0004581958055496216, 0.0004787873476743698, 0.000499378889799118, 0.0005199704319238663, 0.0005405619740486145, 0.0005611535161733627, 0.000581745058298111, 0.0006023366004228592, 0.0006229281425476074]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 12.0, 13.0, 8.0, 15.0, 17.0, 15.0, 31.0, 28.0, 44.0, 41.0, 47.0, 34.0, 36.0, 38.0, 47.0, 52.0, 53.0, 38.0, 53.0, 37.0, 45.0, 36.0, 41.0, 27.0, 24.0, 23.0, 25.0, 32.0, 19.0, 9.0, 11.0, 15.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5015869140625, -6.245361328125, -5.9891357421875, -5.73291015625, -5.4766845703125, -5.220458984375, -4.9642333984375, -4.7080078125, -4.4517822265625, -4.195556640625, -3.9393310546875, -3.68310546875, -3.4268798828125, -3.170654296875, -2.9144287109375, -2.658203125, -2.4019775390625, -2.145751953125, -1.8895263671875, -1.63330078125, -1.3770751953125, -1.120849609375, -0.8646240234375, -0.6083984375, -0.3521728515625, -0.095947265625, 0.1602783203125, 0.41650390625, 0.6727294921875, 0.928955078125, 1.1851806640625, 1.44140625, 1.6976318359375, 1.953857421875, 2.2100830078125, 2.46630859375, 2.7225341796875, 2.978759765625, 3.2349853515625, 3.4912109375, 3.7474365234375, 4.003662109375, 4.2598876953125, 4.51611328125, 4.7723388671875, 5.028564453125, 5.2847900390625, 5.541015625, 5.7972412109375, 6.053466796875, 6.3096923828125, 6.56591796875, 6.8221435546875, 7.078369140625, 7.3345947265625, 7.5908203125, 7.8470458984375, 8.103271484375, 8.3594970703125, 8.61572265625, 8.8719482421875, 9.128173828125, 9.3843994140625, 9.640625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 11.0, 13.0, 15.0, 31.0, 37.0, 44.0, 57.0, 96.0, 128.0, 188.0, 276.0, 527.0, 893.0, 2010.0, 5105.0, 14828.0, 50324.0, 179389.0, 475755.0, 226869.0, 62612.0, 18207.0, 6239.0, 2345.0, 1069.0, 484.0, 313.0, 180.0, 149.0, 83.0, 78.0, 61.0, 38.0, 27.0, 24.0, 14.0, 12.0, 11.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.75927734375, -7.4560546875, -7.15283203125, -6.849609375, -6.54638671875, -6.2431640625, -5.93994140625, -5.63671875, -5.33349609375, -5.0302734375, -4.72705078125, -4.423828125, -4.12060546875, -3.8173828125, -3.51416015625, -3.2109375, -2.90771484375, -2.6044921875, -2.30126953125, -1.998046875, -1.69482421875, -1.3916015625, -1.08837890625, -0.78515625, -0.48193359375, -0.1787109375, 0.12451171875, 0.427734375, 0.73095703125, 1.0341796875, 1.33740234375, 1.640625, 1.94384765625, 2.2470703125, 2.55029296875, 2.853515625, 3.15673828125, 3.4599609375, 3.76318359375, 4.06640625, 4.36962890625, 4.6728515625, 4.97607421875, 5.279296875, 5.58251953125, 5.8857421875, 6.18896484375, 6.4921875, 6.79541015625, 7.0986328125, 7.40185546875, 7.705078125, 8.00830078125, 8.3115234375, 8.61474609375, 8.91796875, 9.22119140625, 9.5244140625, 9.82763671875, 10.130859375, 10.43408203125, 10.7373046875, 11.04052734375, 11.34375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 8.0, 8.0, 5.0, 10.0, 18.0, 22.0, 17.0, 16.0, 20.0, 30.0, 31.0, 33.0, 43.0, 48.0, 57.0, 83.0, 132.0, 370.0, 1461.0, 147.0, 87.0, 50.0, 45.0, 39.0, 47.0, 34.0, 37.0, 30.0, 31.0, 12.0, 12.0, 13.0, 6.0, 13.0, 4.0, 9.0, 8.0, 0.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.233154296875, -21.56005859375, -20.886962890625, -20.2138671875, -19.540771484375, -18.86767578125, -18.194580078125, -17.521484375, -16.848388671875, -16.17529296875, -15.502197265625, -14.8291015625, -14.156005859375, -13.48291015625, -12.809814453125, -12.13671875, -11.463623046875, -10.79052734375, -10.117431640625, -9.4443359375, -8.771240234375, -8.09814453125, -7.425048828125, -6.751953125, -6.078857421875, -5.40576171875, -4.732666015625, -4.0595703125, -3.386474609375, -2.71337890625, -2.040283203125, -1.3671875, -0.694091796875, -0.02099609375, 0.652099609375, 1.3251953125, 1.998291015625, 2.67138671875, 3.344482421875, 4.017578125, 4.690673828125, 5.36376953125, 6.036865234375, 6.7099609375, 7.383056640625, 8.05615234375, 8.729248046875, 9.40234375, 10.075439453125, 10.74853515625, 11.421630859375, 12.0947265625, 12.767822265625, 13.44091796875, 14.114013671875, 14.787109375, 15.460205078125, 16.13330078125, 16.806396484375, 17.4794921875, 18.152587890625, 18.82568359375, 19.498779296875, 20.171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 7.0, 9.0, 8.0, 15.0, 23.0, 28.0, 48.0, 58.0, 80.0, 155.0, 256.0, 415.0, 858.0, 3857.0, 641531.0, 2488941.0, 7203.0, 966.0, 502.0, 265.0, 164.0, 98.0, 71.0, 35.0, 30.0, 18.0, 15.0, 10.0, 7.0, 6.0, 6.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-51.8125, -50.41552734375, -49.0185546875, -47.62158203125, -46.224609375, -44.82763671875, -43.4306640625, -42.03369140625, -40.63671875, -39.23974609375, -37.8427734375, -36.44580078125, -35.048828125, -33.65185546875, -32.2548828125, -30.85791015625, -29.4609375, -28.06396484375, -26.6669921875, -25.27001953125, -23.873046875, -22.47607421875, -21.0791015625, -19.68212890625, -18.28515625, -16.88818359375, -15.4912109375, -14.09423828125, -12.697265625, -11.30029296875, -9.9033203125, -8.50634765625, -7.109375, -5.71240234375, -4.3154296875, -2.91845703125, -1.521484375, -0.12451171875, 1.2724609375, 2.66943359375, 4.06640625, 5.46337890625, 6.8603515625, 8.25732421875, 9.654296875, 11.05126953125, 12.4482421875, 13.84521484375, 15.2421875, 16.63916015625, 18.0361328125, 19.43310546875, 20.830078125, 22.22705078125, 23.6240234375, 25.02099609375, 26.41796875, 27.81494140625, 29.2119140625, 30.60888671875, 32.005859375, 33.40283203125, 34.7998046875, 36.19677734375, 37.59375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 98.0, 528.0, 359.0, 17.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.33464050292969, -120.4271011352539, -116.51956176757812, -112.61202239990234, -108.70448303222656, -104.79693603515625, -100.88939666748047, -96.98185729980469, -93.0743179321289, -89.16677856445312, -85.25923919677734, -81.35169982910156, -77.44415283203125, -73.53662109375, -69.62907409667969, -65.7215347290039, -61.813995361328125, -57.906455993652344, -53.99891662597656, -50.091373443603516, -46.183834075927734, -42.27629470825195, -38.368751525878906, -34.461212158203125, -30.553672790527344, -26.646133422851562, -22.73859214782715, -18.831050872802734, -14.923511505126953, -11.015972137451172, -7.108430862426758, -3.2008895874023438, 0.7066497802734375, 4.614190101623535, 8.521730422973633, 12.42927074432373, 16.336811065673828, 20.24435043334961, 24.151891708374023, 28.059432983398438, 31.96697235107422, 35.87451171875, 39.78205108642578, 43.68959426879883, 47.59713363647461, 51.50467300415039, 55.41221618652344, 59.31975555419922, 63.227294921875, 67.13483428955078, 71.04237365722656, 74.94991302490234, 78.85745239257812, 82.76499938964844, 86.67253875732422, 90.580078125, 94.48761749267578, 98.39515686035156, 102.30269622802734, 106.21023559570312, 110.11778259277344, 114.02531433105469, 117.932861328125, 121.84040069580078, 125.74794006347656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 9.0, 2.0, 8.0, 8.0, 11.0, 14.0, 15.0, 21.0, 23.0, 26.0, 21.0, 24.0, 29.0, 31.0, 37.0, 48.0, 33.0, 43.0, 32.0, 49.0, 49.0, 52.0, 47.0, 43.0, 38.0, 33.0, 33.0, 29.0, 42.0, 30.0, 24.0, 11.0, 17.0, 15.0, 14.0, 8.0, 1.0, 11.0, 3.0, 6.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-52.30714797973633, -50.89025115966797, -49.473358154296875, -48.056461334228516, -46.639564514160156, -45.22267150878906, -43.8057746887207, -42.388877868652344, -40.97198486328125, -39.55508804321289, -38.1381950378418, -36.72129821777344, -35.304405212402344, -33.887508392333984, -32.470611572265625, -31.0537166595459, -29.636821746826172, -28.219926834106445, -26.80303192138672, -25.38613510131836, -23.969240188598633, -22.552345275878906, -21.135448455810547, -19.71855354309082, -18.301658630371094, -16.884763717651367, -15.467867851257324, -14.050971984863281, -12.634077072143555, -11.217182159423828, -9.800286293029785, -8.383390426635742, -6.966499328613281, -5.5496039390563965, -4.132708549499512, -2.715813159942627, -1.2989177703857422, 0.11797761917114258, 1.5348730087280273, 2.9517688751220703, 4.368663787841797, 5.785559177398682, 7.202454566955566, 8.61935043334961, 10.036245346069336, 11.453140258789062, 12.870036125183105, 14.286931991577148, 15.703826904296875, 17.1207218170166, 18.537616729736328, 19.954513549804688, 21.371408462524414, 22.78830337524414, 24.2052001953125, 25.622095108032227, 27.038990020751953, 28.45588493347168, 29.872779846191406, 31.289676666259766, 32.706573486328125, 34.12346649169922, 35.54036331176758, 36.95726013183594, 38.37415313720703]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 7.0, 18.0, 17.0, 23.0, 21.0, 36.0, 27.0, 43.0, 39.0, 48.0, 47.0, 41.0, 45.0, 65.0, 50.0, 57.0, 48.0, 51.0, 37.0, 47.0, 32.0, 33.0, 26.0, 30.0, 16.0, 14.0, 17.0, 8.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8984375, -7.60888671875, -7.3193359375, -7.02978515625, -6.740234375, -6.45068359375, -6.1611328125, -5.87158203125, -5.58203125, -5.29248046875, -5.0029296875, -4.71337890625, -4.423828125, -4.13427734375, -3.8447265625, -3.55517578125, -3.265625, -2.97607421875, -2.6865234375, -2.39697265625, -2.107421875, -1.81787109375, -1.5283203125, -1.23876953125, -0.94921875, -0.65966796875, -0.3701171875, -0.08056640625, 0.208984375, 0.49853515625, 0.7880859375, 1.07763671875, 1.3671875, 1.65673828125, 1.9462890625, 2.23583984375, 2.525390625, 2.81494140625, 3.1044921875, 3.39404296875, 3.68359375, 3.97314453125, 4.2626953125, 4.55224609375, 4.841796875, 5.13134765625, 5.4208984375, 5.71044921875, 6.0, 6.28955078125, 6.5791015625, 6.86865234375, 7.158203125, 7.44775390625, 7.7373046875, 8.02685546875, 8.31640625, 8.60595703125, 8.8955078125, 9.18505859375, 9.474609375, 9.76416015625, 10.0537109375, 10.34326171875, 10.6328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 7.0, 7.0, 11.0, 12.0, 18.0, 17.0, 22.0, 32.0, 52.0, 48.0, 105.0, 149.0, 246.0, 517.0, 1191.0, 4381.0, 24339.0, 267051.0, 1757420.0, 1838396.0, 269411.0, 24266.0, 4000.0, 1240.0, 508.0, 300.0, 162.0, 97.0, 75.0, 40.0, 33.0, 26.0, 21.0, 12.0, 10.0, 9.0, 11.0, 6.0, 10.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -12.0413818359375, -11.653076171875, -11.2647705078125, -10.87646484375, -10.4881591796875, -10.099853515625, -9.7115478515625, -9.3232421875, -8.9349365234375, -8.546630859375, -8.1583251953125, -7.77001953125, -7.3817138671875, -6.993408203125, -6.6051025390625, -6.216796875, -5.8284912109375, -5.440185546875, -5.0518798828125, -4.66357421875, -4.2752685546875, -3.886962890625, -3.4986572265625, -3.1103515625, -2.7220458984375, -2.333740234375, -1.9454345703125, -1.55712890625, -1.1688232421875, -0.780517578125, -0.3922119140625, -0.00390625, 0.3843994140625, 0.772705078125, 1.1610107421875, 1.54931640625, 1.9376220703125, 2.325927734375, 2.7142333984375, 3.1025390625, 3.4908447265625, 3.879150390625, 4.2674560546875, 4.65576171875, 5.0440673828125, 5.432373046875, 5.8206787109375, 6.208984375, 6.5972900390625, 6.985595703125, 7.3739013671875, 7.76220703125, 8.1505126953125, 8.538818359375, 8.9271240234375, 9.3154296875, 9.7037353515625, 10.092041015625, 10.4803466796875, 10.86865234375, 11.2569580078125, 11.645263671875, 12.0335693359375, 12.421875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 12.0, 19.0, 31.0, 27.0, 54.0, 67.0, 88.0, 161.0, 247.0, 300.0, 411.0, 492.0, 495.0, 464.0, 343.0, 245.0, 179.0, 114.0, 72.0, 51.0, 40.0, 26.0, 19.0, 21.0, 8.0, 9.0, 16.0, 6.0, 4.0, 2.0, 6.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.0234375, -9.7015380859375, -9.379638671875, -9.0577392578125, -8.73583984375, -8.4139404296875, -8.092041015625, -7.7701416015625, -7.4482421875, -7.1263427734375, -6.804443359375, -6.4825439453125, -6.16064453125, -5.8387451171875, -5.516845703125, -5.1949462890625, -4.873046875, -4.5511474609375, -4.229248046875, -3.9073486328125, -3.58544921875, -3.2635498046875, -2.941650390625, -2.6197509765625, -2.2978515625, -1.9759521484375, -1.654052734375, -1.3321533203125, -1.01025390625, -0.6883544921875, -0.366455078125, -0.0445556640625, 0.27734375, 0.5992431640625, 0.921142578125, 1.2430419921875, 1.56494140625, 1.8868408203125, 2.208740234375, 2.5306396484375, 2.8525390625, 3.1744384765625, 3.496337890625, 3.8182373046875, 4.14013671875, 4.4620361328125, 4.783935546875, 5.1058349609375, 5.427734375, 5.7496337890625, 6.071533203125, 6.3934326171875, 6.71533203125, 7.0372314453125, 7.359130859375, 7.6810302734375, 8.0029296875, 8.3248291015625, 8.646728515625, 8.9686279296875, 9.29052734375, 9.6124267578125, 9.934326171875, 10.2562255859375, 10.578125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 3.0, 9.0, 12.0, 12.0, 9.0, 13.0, 26.0, 31.0, 36.0, 51.0, 78.0, 104.0, 157.0, 253.0, 513.0, 1135.0, 3220.0, 12403.0, 73656.0, 839601.0, 2909842.0, 304459.0, 36760.0, 7676.0, 2222.0, 915.0, 389.0, 205.0, 130.0, 92.0, 63.0, 51.0, 31.0, 25.0, 19.0, 21.0, 8.0, 9.0, 10.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.15625, -15.6712646484375, -15.186279296875, -14.7012939453125, -14.21630859375, -13.7313232421875, -13.246337890625, -12.7613525390625, -12.2763671875, -11.7913818359375, -11.306396484375, -10.8214111328125, -10.33642578125, -9.8514404296875, -9.366455078125, -8.8814697265625, -8.396484375, -7.9114990234375, -7.426513671875, -6.9415283203125, -6.45654296875, -5.9715576171875, -5.486572265625, -5.0015869140625, -4.5166015625, -4.0316162109375, -3.546630859375, -3.0616455078125, -2.57666015625, -2.0916748046875, -1.606689453125, -1.1217041015625, -0.63671875, -0.1517333984375, 0.333251953125, 0.8182373046875, 1.30322265625, 1.7882080078125, 2.273193359375, 2.7581787109375, 3.2431640625, 3.7281494140625, 4.213134765625, 4.6981201171875, 5.18310546875, 5.6680908203125, 6.153076171875, 6.6380615234375, 7.123046875, 7.6080322265625, 8.093017578125, 8.5780029296875, 9.06298828125, 9.5479736328125, 10.032958984375, 10.5179443359375, 11.0029296875, 11.4879150390625, 11.972900390625, 12.4578857421875, 12.94287109375, 13.4278564453125, 13.912841796875, 14.3978271484375, 14.8828125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 23.0, 105.0, 276.0, 365.0, 173.0, 52.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.252296447753906, -29.078163146972656, -25.90403175354004, -22.729900360107422, -19.555767059326172, -16.381633758544922, -13.207502365112305, -10.033370971679688, -6.8592376708984375, -3.685105323791504, -0.5109729766845703, 2.6631593704223633, 5.837291717529297, 9.01142406463623, 12.185556411743164, 15.359687805175781, 18.53382110595703, 21.70795440673828, 24.8820858001709, 28.056217193603516, 31.230350494384766, 34.404483795166016, 37.57861328125, 40.75274658203125, 43.9268798828125, 47.10101318359375, 50.275146484375, 53.449275970458984, 56.623409271240234, 59.797542572021484, 62.97167205810547, 66.14580535888672, 69.31993103027344, 72.49406433105469, 75.66819763183594, 78.84233093261719, 82.01646423339844, 85.19058990478516, 88.3647232055664, 91.53885650634766, 94.7129898071289, 97.88712310791016, 101.0612564086914, 104.23538970947266, 107.40951538085938, 110.58364868164062, 113.75778198242188, 116.93191528320312, 120.10604858398438, 123.28018188476562, 126.45431518554688, 129.62844848632812, 132.80258178710938, 135.97671508789062, 139.15084838867188, 142.32498168945312, 145.49911499023438, 148.67324829101562, 151.84738159179688, 155.02151489257812, 158.19564819335938, 161.36978149414062, 164.54391479492188, 167.71804809570312, 170.8921661376953]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 11.0, 12.0, 15.0, 14.0, 18.0, 28.0, 32.0, 24.0, 33.0, 33.0, 36.0, 48.0, 39.0, 75.0, 31.0, 49.0, 51.0, 48.0, 38.0, 39.0, 33.0, 30.0, 33.0, 50.0, 28.0, 27.0, 15.0, 18.0, 20.0, 13.0, 16.0, 7.0, 4.0, 8.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.34954833984375, -40.12251281738281, -38.89547348022461, -37.66843795776367, -36.44139862060547, -35.21436309814453, -33.98732376098633, -32.76028823852539, -31.53325080871582, -30.30621337890625, -29.07917594909668, -27.85213851928711, -26.625102996826172, -25.39806365966797, -24.17102813720703, -22.94399070739746, -21.71695327758789, -20.48991584777832, -19.26287841796875, -18.03584098815918, -16.80880355834961, -15.581767082214355, -14.354730606079102, -13.127693176269531, -11.900655746459961, -10.67361831665039, -9.44658088684082, -8.219544410705566, -6.992506980895996, -5.765469551086426, -4.538432598114014, -3.3113956451416016, -2.0843582153320312, -0.85732102394104, 0.36971616744995117, 1.5967533588409424, 2.8237905502319336, 4.050827980041504, 5.277864933013916, 6.504901885986328, 7.731939315795898, 8.958976745605469, 10.186014175415039, 11.413050651550293, 12.640088081359863, 13.867125511169434, 15.094161987304688, 16.321199417114258, 17.548236846923828, 18.7752742767334, 20.00231170654297, 21.22934913635254, 22.45638656616211, 23.683422088623047, 24.910459518432617, 26.137496948242188, 27.364534378051758, 28.591571807861328, 29.8186092376709, 31.04564666748047, 32.272682189941406, 33.49972152709961, 34.72675704956055, 35.95379638671875, 37.18083190917969]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 4.0, 2.0, 5.0, 13.0, 9.0, 12.0, 8.0, 14.0, 16.0, 23.0, 18.0, 35.0, 27.0, 41.0, 36.0, 33.0, 49.0, 54.0, 39.0, 50.0, 38.0, 48.0, 41.0, 34.0, 40.0, 38.0, 45.0, 32.0, 25.0, 19.0, 28.0, 19.0, 18.0, 23.0, 10.0, 7.0, 11.0, 11.0, 10.0, 4.0, 4.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.82061767578125, -6.5748291015625, -6.32904052734375, -6.083251953125, -5.83746337890625, -5.5916748046875, -5.34588623046875, -5.10009765625, -4.85430908203125, -4.6085205078125, -4.36273193359375, -4.116943359375, -3.87115478515625, -3.6253662109375, -3.37957763671875, -3.1337890625, -2.88800048828125, -2.6422119140625, -2.39642333984375, -2.150634765625, -1.90484619140625, -1.6590576171875, -1.41326904296875, -1.16748046875, -0.92169189453125, -0.6759033203125, -0.43011474609375, -0.184326171875, 0.06146240234375, 0.3072509765625, 0.55303955078125, 0.798828125, 1.04461669921875, 1.2904052734375, 1.53619384765625, 1.781982421875, 2.02777099609375, 2.2735595703125, 2.51934814453125, 2.76513671875, 3.01092529296875, 3.2567138671875, 3.50250244140625, 3.748291015625, 3.99407958984375, 4.2398681640625, 4.48565673828125, 4.7314453125, 4.97723388671875, 5.2230224609375, 5.46881103515625, 5.714599609375, 5.96038818359375, 6.2061767578125, 6.45196533203125, 6.69775390625, 6.94354248046875, 7.1893310546875, 7.43511962890625, 7.680908203125, 7.92669677734375, 8.1724853515625, 8.41827392578125, 8.6640625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 18.0, 21.0, 24.0, 36.0, 56.0, 103.0, 149.0, 272.0, 352.0, 534.0, 813.0, 1307.0, 1978.0, 2791.0, 4507.0, 6986.0, 10679.0, 17438.0, 28368.0, 49150.0, 90002.0, 200342.0, 351851.0, 121930.0, 63948.0, 36240.0, 21625.0, 13290.0, 8347.0, 5431.0, 3400.0, 2283.0, 1538.0, 958.0, 586.0, 418.0, 294.0, 163.0, 122.0, 74.0, 44.0, 28.0, 19.0, 12.0, 11.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0078125, -1.9473724365234375, -1.886932373046875, -1.8264923095703125, -1.76605224609375, -1.7056121826171875, -1.645172119140625, -1.5847320556640625, -1.5242919921875, -1.4638519287109375, -1.403411865234375, -1.3429718017578125, -1.28253173828125, -1.2220916748046875, -1.161651611328125, -1.1012115478515625, -1.040771484375, -0.9803314208984375, -0.919891357421875, -0.8594512939453125, -0.79901123046875, -0.7385711669921875, -0.678131103515625, -0.6176910400390625, -0.5572509765625, -0.4968109130859375, -0.436370849609375, -0.3759307861328125, -0.31549072265625, -0.2550506591796875, -0.194610595703125, -0.1341705322265625, -0.07373046875, -0.0132904052734375, 0.047149658203125, 0.1075897216796875, 0.16802978515625, 0.2284698486328125, 0.288909912109375, 0.3493499755859375, 0.4097900390625, 0.4702301025390625, 0.530670166015625, 0.5911102294921875, 0.65155029296875, 0.7119903564453125, 0.772430419921875, 0.8328704833984375, 0.893310546875, 0.9537506103515625, 1.014190673828125, 1.0746307373046875, 1.13507080078125, 1.1955108642578125, 1.255950927734375, 1.3163909912109375, 1.3768310546875, 1.4372711181640625, 1.497711181640625, 1.5581512451171875, 1.61859130859375, 1.6790313720703125, 1.739471435546875, 1.7999114990234375, 1.8603515625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 6.0, 10.0, 4.0, 21.0, 15.0, 12.0, 22.0, 27.0, 21.0, 20.0, 25.0, 20.0, 36.0, 53.0, 33.0, 35.0, 32.0, 36.0, 1072.0, 50.0, 40.0, 58.0, 39.0, 37.0, 35.0, 35.0, 32.0, 24.0, 24.0, 27.0, 22.0, 19.0, 16.0, 9.0, 4.0, 13.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0], "bins": [-5.1484375, -4.998779296875, -4.84912109375, -4.699462890625, -4.5498046875, -4.400146484375, -4.25048828125, -4.100830078125, -3.951171875, -3.801513671875, -3.65185546875, -3.502197265625, -3.3525390625, -3.202880859375, -3.05322265625, -2.903564453125, -2.75390625, -2.604248046875, -2.45458984375, -2.304931640625, -2.1552734375, -2.005615234375, -1.85595703125, -1.706298828125, -1.556640625, -1.406982421875, -1.25732421875, -1.107666015625, -0.9580078125, -0.808349609375, -0.65869140625, -0.509033203125, -0.359375, -0.209716796875, -0.06005859375, 0.089599609375, 0.2392578125, 0.388916015625, 0.53857421875, 0.688232421875, 0.837890625, 0.987548828125, 1.13720703125, 1.286865234375, 1.4365234375, 1.586181640625, 1.73583984375, 1.885498046875, 2.03515625, 2.184814453125, 2.33447265625, 2.484130859375, 2.6337890625, 2.783447265625, 2.93310546875, 3.082763671875, 3.232421875, 3.382080078125, 3.53173828125, 3.681396484375, 3.8310546875, 3.980712890625, 4.13037109375, 4.280029296875, 4.4296875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 16.0, 13.0, 13.0, 24.0, 42.0, 55.0, 78.0, 98.0, 178.0, 285.0, 374.0, 551.0, 908.0, 1477.0, 2415.0, 3707.0, 6157.0, 10055.0, 17031.0, 28729.0, 50807.0, 95651.0, 227781.0, 1390705.0, 115626.0, 60479.0, 34160.0, 19567.0, 11544.0, 7034.0, 4220.0, 2577.0, 1706.0, 1079.0, 659.0, 440.0, 299.0, 224.0, 118.0, 76.0, 59.0, 29.0, 32.0, 13.0, 16.0, 8.0, 15.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7373046875, -1.6776885986328125, -1.618072509765625, -1.5584564208984375, -1.49884033203125, -1.4392242431640625, -1.379608154296875, -1.3199920654296875, -1.2603759765625, -1.2007598876953125, -1.141143798828125, -1.0815277099609375, -1.02191162109375, -0.9622955322265625, -0.902679443359375, -0.8430633544921875, -0.783447265625, -0.7238311767578125, -0.664215087890625, -0.6045989990234375, -0.54498291015625, -0.4853668212890625, -0.425750732421875, -0.3661346435546875, -0.3065185546875, -0.2469024658203125, -0.187286376953125, -0.1276702880859375, -0.06805419921875, -0.0084381103515625, 0.051177978515625, 0.1107940673828125, 0.17041015625, 0.2300262451171875, 0.289642333984375, 0.3492584228515625, 0.40887451171875, 0.4684906005859375, 0.528106689453125, 0.5877227783203125, 0.6473388671875, 0.7069549560546875, 0.766571044921875, 0.8261871337890625, 0.88580322265625, 0.9454193115234375, 1.005035400390625, 1.0646514892578125, 1.124267578125, 1.1838836669921875, 1.243499755859375, 1.3031158447265625, 1.36273193359375, 1.4223480224609375, 1.481964111328125, 1.5415802001953125, 1.6011962890625, 1.6608123779296875, 1.720428466796875, 1.7800445556640625, 1.83966064453125, 1.8992767333984375, 1.958892822265625, 2.0185089111328125, 2.078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 11.0, 5.0, 8.0, 8.0, 15.0, 15.0, 21.0, 26.0, 36.0, 56.0, 63.0, 94.0, 101.0, 105.0, 112.0, 62.0, 60.0, 30.0, 28.0, 27.0, 19.0, 11.0, 14.0, 11.0, 7.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001430511474609375, -0.0013874918222427368, -0.0013444721698760986, -0.0013014525175094604, -0.0012584328651428223, -0.001215413212776184, -0.001172393560409546, -0.0011293739080429077, -0.0010863542556762695, -0.0010433346033096313, -0.0010003149509429932, -0.000957295298576355, -0.0009142756462097168, -0.0008712559938430786, -0.0008282363414764404, -0.0007852166891098022, -0.0007421970367431641, -0.0006991773843765259, -0.0006561577320098877, -0.0006131380796432495, -0.0005701184272766113, -0.0005270987749099731, -0.00048407912254333496, -0.0004410594701766968, -0.0003980398178100586, -0.0003550201654434204, -0.0003120005130767822, -0.00026898086071014404, -0.00022596120834350586, -0.00018294155597686768, -0.0001399219036102295, -9.690225124359131e-05, -5.3882598876953125e-05, -1.0862946510314941e-05, 3.215670585632324e-05, 7.517635822296143e-05, 0.00011819601058959961, 0.0001612156629562378, 0.00020423531532287598, 0.00024725496768951416, 0.00029027462005615234, 0.00033329427242279053, 0.0003763139247894287, 0.0004193335771560669, 0.0004623532295227051, 0.0005053728818893433, 0.0005483925342559814, 0.0005914121866226196, 0.0006344318389892578, 0.000677451491355896, 0.0007204711437225342, 0.0007634907960891724, 0.0008065104484558105, 0.0008495301008224487, 0.0008925497531890869, 0.0009355694055557251, 0.0009785890579223633, 0.0010216087102890015, 0.0010646283626556396, 0.0011076480150222778, 0.001150667667388916, 0.0011936873197555542, 0.0012367069721221924, 0.0012797266244888306, 0.0013227462768554688]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 6.0, 9.0, 11.0, 15.0, 16.0, 26.0, 37.0, 63.0, 55.0, 102.0, 144.0, 253.0, 515.0, 1769.0, 947308.0, 96011.0, 1038.0, 405.0, 243.0, 145.0, 90.0, 61.0, 46.0, 27.0, 23.0, 21.0, 17.0, 11.0, 12.0, 11.0, 4.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.025848388671875, -0.02501058578491211, -0.02417278289794922, -0.023334980010986328, -0.022497177124023438, -0.021659374237060547, -0.020821571350097656, -0.019983768463134766, -0.019145965576171875, -0.018308162689208984, -0.017470359802246094, -0.016632556915283203, -0.015794754028320312, -0.014956951141357422, -0.014119148254394531, -0.01328134536743164, -0.01244354248046875, -0.01160573959350586, -0.010767936706542969, -0.009930133819580078, -0.009092330932617188, -0.008254528045654297, -0.007416725158691406, -0.006578922271728516, -0.005741119384765625, -0.004903316497802734, -0.004065513610839844, -0.003227710723876953, -0.0023899078369140625, -0.0015521049499511719, -0.0007143020629882812, 0.00012350082397460938, 0.0009613037109375, 0.0017991065979003906, 0.0026369094848632812, 0.003474712371826172, 0.0043125152587890625, 0.005150318145751953, 0.005988121032714844, 0.006825923919677734, 0.007663726806640625, 0.008501529693603516, 0.009339332580566406, 0.010177135467529297, 0.011014938354492188, 0.011852741241455078, 0.012690544128417969, 0.01352834701538086, 0.01436614990234375, 0.01520395278930664, 0.01604175567626953, 0.016879558563232422, 0.017717361450195312, 0.018555164337158203, 0.019392967224121094, 0.020230770111083984, 0.021068572998046875, 0.021906375885009766, 0.022744178771972656, 0.023581981658935547, 0.024419784545898438, 0.025257587432861328, 0.02609539031982422, 0.02693319320678711, 0.02777099609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 16.0, 43.0, 137.0, 243.0, 319.0, 157.0, 64.0, 24.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042936060344800353, -0.0003769064205698669, -0.0003244522667955607, -0.00027199811302125454, -0.0002195439301431179, -0.00016708974726498127, -0.00011463559349067509, -6.218143971636891e-05, -9.727256838232279e-06, 4.272691148798913e-05, 9.518107981421053e-05, 0.00014763524814043194, 0.00020008941646665335, 0.00025254359934479, 0.00030499775311909616, 0.00035745190689340234, 0.00040990608977153897, 0.0004623602726496756, 0.0005148143973201513, 0.000567268580198288, 0.0006197227630764246, 0.0006721769459545612, 0.0007246311288326979, 0.0007770852535031736, 0.0008295394363813102, 0.0008819936192594469, 0.0009344477439299226, 0.0009869019268080592, 0.0010393561096861959, 0.0010918102925643325, 0.0011442644754424691, 0.001196718541905284, 0.0012491727247834206, 0.0013016269076615572, 0.0013540810905396938, 0.0014065352734178305, 0.001458989456295967, 0.0015114436391741037, 0.0015638977056369185, 0.0016163518885150552, 0.0016688060713931918, 0.0017212602542713284, 0.001773714437149465, 0.0018261686200276017, 0.0018786226864904165, 0.0019310768693685532, 0.00198353105224669, 0.0020359852351248264, 0.002088439418002963, 0.0021408936008810997, 0.0021933477837592363, 0.002245801966637373, 0.0022982561495155096, 0.0023507103323936462, 0.002403164515271783, 0.0024556186981499195, 0.0025080726481974125, 0.002560526831075549, 0.0026129810139536858, 0.0026654351968318224, 0.002717889379709959, 0.0027703435625880957, 0.0028227977454662323, 0.0028752516955137253, 0.0029277061112225056]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 15.0, 11.0, 13.0, 20.0, 14.0, 19.0, 17.0, 17.0, 21.0, 32.0, 36.0, 31.0, 36.0, 31.0, 46.0, 31.0, 57.0, 50.0, 32.0, 42.0, 36.0, 33.0, 37.0, 32.0, 35.0, 36.0, 29.0, 24.0, 20.0, 25.0, 19.0, 13.0, 20.0, 15.0, 7.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006527304649353027, -0.0006332546472549438, -0.000613778829574585, -0.0005943030118942261, -0.0005748271942138672, -0.0005553513765335083, -0.0005358755588531494, -0.0005163997411727905, -0.0004969239234924316, -0.00047744810581207275, -0.00045797228813171387, -0.000438496470451355, -0.0004190206527709961, -0.0003995448350906372, -0.0003800690174102783, -0.00036059319972991943, -0.00034111738204956055, -0.00032164156436920166, -0.0003021657466888428, -0.0002826899290084839, -0.000263214111328125, -0.0002437382936477661, -0.00022426247596740723, -0.00020478665828704834, -0.00018531084060668945, -0.00016583502292633057, -0.00014635920524597168, -0.0001268833875656128, -0.0001074075698852539, -8.793175220489502e-05, -6.845593452453613e-05, -4.8980116844177246e-05, -2.950429916381836e-05, -1.0028481483459473e-05, 9.447336196899414e-06, 2.89231538772583e-05, 4.839897155761719e-05, 6.787478923797607e-05, 8.735060691833496e-05, 0.00010682642459869385, 0.00012630224227905273, 0.00014577805995941162, 0.0001652538776397705, 0.0001847296953201294, 0.00020420551300048828, 0.00022368133068084717, 0.00024315714836120605, 0.00026263296604156494, 0.00028210878372192383, 0.0003015846014022827, 0.0003210604190826416, 0.0003405362367630005, 0.0003600120544433594, 0.00037948787212371826, 0.00039896368980407715, 0.00041843950748443604, 0.0004379153251647949, 0.0004573911428451538, 0.0004768669605255127, 0.0004963427782058716, 0.0005158185958862305, 0.0005352944135665894, 0.0005547702312469482, 0.0005742460489273071, 0.000593721866607666]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 4.0, 2.0, 5.0, 13.0, 9.0, 12.0, 8.0, 14.0, 16.0, 23.0, 18.0, 35.0, 27.0, 41.0, 36.0, 33.0, 49.0, 54.0, 39.0, 50.0, 38.0, 48.0, 41.0, 34.0, 40.0, 38.0, 45.0, 32.0, 25.0, 19.0, 28.0, 19.0, 18.0, 23.0, 10.0, 7.0, 11.0, 11.0, 10.0, 4.0, 4.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.82061767578125, -6.5748291015625, -6.32904052734375, -6.083251953125, -5.83746337890625, -5.5916748046875, -5.34588623046875, -5.10009765625, -4.85430908203125, -4.6085205078125, -4.36273193359375, -4.116943359375, -3.87115478515625, -3.6253662109375, -3.37957763671875, -3.1337890625, -2.88800048828125, -2.6422119140625, -2.39642333984375, -2.150634765625, -1.90484619140625, -1.6590576171875, -1.41326904296875, -1.16748046875, -0.92169189453125, -0.6759033203125, -0.43011474609375, -0.184326171875, 0.06146240234375, 0.3072509765625, 0.55303955078125, 0.798828125, 1.04461669921875, 1.2904052734375, 1.53619384765625, 1.781982421875, 2.02777099609375, 2.2735595703125, 2.51934814453125, 2.76513671875, 3.01092529296875, 3.2567138671875, 3.50250244140625, 3.748291015625, 3.99407958984375, 4.2398681640625, 4.48565673828125, 4.7314453125, 4.97723388671875, 5.2230224609375, 5.46881103515625, 5.714599609375, 5.96038818359375, 6.2061767578125, 6.45196533203125, 6.69775390625, 6.94354248046875, 7.1893310546875, 7.43511962890625, 7.680908203125, 7.92669677734375, 8.1724853515625, 8.41827392578125, 8.6640625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 8.0, 8.0, 15.0, 11.0, 20.0, 31.0, 47.0, 53.0, 91.0, 98.0, 102.0, 157.0, 228.0, 318.0, 443.0, 657.0, 1247.0, 2224.0, 5696.0, 19549.0, 75006.0, 259103.0, 428283.0, 182775.0, 50066.0, 13111.0, 4287.0, 1874.0, 994.0, 550.0, 391.0, 278.0, 214.0, 141.0, 122.0, 87.0, 68.0, 52.0, 35.0, 33.0, 25.0, 20.0, 15.0, 10.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0], "bins": [-10.5546875, -10.256103515625, -9.95751953125, -9.658935546875, -9.3603515625, -9.061767578125, -8.76318359375, -8.464599609375, -8.166015625, -7.867431640625, -7.56884765625, -7.270263671875, -6.9716796875, -6.673095703125, -6.37451171875, -6.075927734375, -5.77734375, -5.478759765625, -5.18017578125, -4.881591796875, -4.5830078125, -4.284423828125, -3.98583984375, -3.687255859375, -3.388671875, -3.090087890625, -2.79150390625, -2.492919921875, -2.1943359375, -1.895751953125, -1.59716796875, -1.298583984375, -1.0, -0.701416015625, -0.40283203125, -0.104248046875, 0.1943359375, 0.492919921875, 0.79150390625, 1.090087890625, 1.388671875, 1.687255859375, 1.98583984375, 2.284423828125, 2.5830078125, 2.881591796875, 3.18017578125, 3.478759765625, 3.77734375, 4.075927734375, 4.37451171875, 4.673095703125, 4.9716796875, 5.270263671875, 5.56884765625, 5.867431640625, 6.166015625, 6.464599609375, 6.76318359375, 7.061767578125, 7.3603515625, 7.658935546875, 7.95751953125, 8.256103515625, 8.5546875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 3.0, 8.0, 6.0, 12.0, 12.0, 14.0, 29.0, 21.0, 21.0, 38.0, 37.0, 27.0, 55.0, 53.0, 60.0, 78.0, 112.0, 274.0, 1475.0, 199.0, 108.0, 64.0, 60.0, 30.0, 49.0, 31.0, 31.0, 23.0, 19.0, 22.0, 19.0, 12.0, 14.0, 9.0, 6.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.631591796875, -20.98193359375, -20.332275390625, -19.6826171875, -19.032958984375, -18.38330078125, -17.733642578125, -17.083984375, -16.434326171875, -15.78466796875, -15.135009765625, -14.4853515625, -13.835693359375, -13.18603515625, -12.536376953125, -11.88671875, -11.237060546875, -10.58740234375, -9.937744140625, -9.2880859375, -8.638427734375, -7.98876953125, -7.339111328125, -6.689453125, -6.039794921875, -5.39013671875, -4.740478515625, -4.0908203125, -3.441162109375, -2.79150390625, -2.141845703125, -1.4921875, -0.842529296875, -0.19287109375, 0.456787109375, 1.1064453125, 1.756103515625, 2.40576171875, 3.055419921875, 3.705078125, 4.354736328125, 5.00439453125, 5.654052734375, 6.3037109375, 6.953369140625, 7.60302734375, 8.252685546875, 8.90234375, 9.552001953125, 10.20166015625, 10.851318359375, 11.5009765625, 12.150634765625, 12.80029296875, 13.449951171875, 14.099609375, 14.749267578125, 15.39892578125, 16.048583984375, 16.6982421875, 17.347900390625, 17.99755859375, 18.647216796875, 19.296875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 7.0, 6.0, 7.0, 9.0, 14.0, 11.0, 14.0, 24.0, 30.0, 51.0, 73.0, 105.0, 158.0, 217.0, 297.0, 427.0, 769.0, 1707.0, 22685.0, 2749669.0, 361043.0, 5213.0, 1115.0, 624.0, 419.0, 249.0, 178.0, 137.0, 107.0, 81.0, 46.0, 45.0, 34.0, 30.0, 15.0, 17.0, 13.0, 13.0, 5.0, 8.0, 9.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.59765625, -31.5390625, -30.48046875, -29.421875, -28.36328125, -27.3046875, -26.24609375, -25.1875, -24.12890625, -23.0703125, -22.01171875, -20.953125, -19.89453125, -18.8359375, -17.77734375, -16.71875, -15.66015625, -14.6015625, -13.54296875, -12.484375, -11.42578125, -10.3671875, -9.30859375, -8.25, -7.19140625, -6.1328125, -5.07421875, -4.015625, -2.95703125, -1.8984375, -0.83984375, 0.21875, 1.27734375, 2.3359375, 3.39453125, 4.453125, 5.51171875, 6.5703125, 7.62890625, 8.6875, 9.74609375, 10.8046875, 11.86328125, 12.921875, 13.98046875, 15.0390625, 16.09765625, 17.15625, 18.21484375, 19.2734375, 20.33203125, 21.390625, 22.44921875, 23.5078125, 24.56640625, 25.625, 26.68359375, 27.7421875, 28.80078125, 29.859375, 30.91796875, 31.9765625, 33.03515625, 34.09375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 36.0, 612.0, 357.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.7442626953125, -115.21851348876953, -109.69276428222656, -104.1670150756836, -98.64126586914062, -93.11551666259766, -87.58976745605469, -82.06401062011719, -76.53826904296875, -71.01251983642578, -65.48677062988281, -59.961021423339844, -54.435272216796875, -48.909523010253906, -43.38376998901367, -37.8580207824707, -32.33226776123047, -26.8065185546875, -21.28076934814453, -15.75501823425293, -10.229269027709961, -4.703519821166992, 0.8222312927246094, 6.347980499267578, 11.873729705810547, 17.399478912353516, 22.925228118896484, 28.450979232788086, 33.97673034667969, 39.502479553222656, 45.028228759765625, 50.553977966308594, 56.07972717285156, 61.60547637939453, 67.1312255859375, 72.65697479248047, 78.18272399902344, 83.7084732055664, 89.23422241210938, 94.75997924804688, 100.28572082519531, 105.81147003173828, 111.33721923828125, 116.86296844482422, 122.38871765136719, 127.91446685791016, 133.44021606445312, 138.96597290039062, 144.49172973632812, 150.01748657226562, 155.54322814941406, 161.06898498535156, 166.5947265625, 172.1204833984375, 177.64622497558594, 183.17198181152344, 188.69772338867188, 194.22348022460938, 199.7492218017578, 205.2749786376953, 210.80072021484375, 216.32647705078125, 221.8522186279297, 227.3779754638672, 232.90371704101562]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 3.0, 7.0, 16.0, 18.0, 19.0, 27.0, 21.0, 17.0, 27.0, 40.0, 35.0, 31.0, 52.0, 42.0, 42.0, 33.0, 51.0, 50.0, 39.0, 38.0, 47.0, 51.0, 43.0, 30.0, 30.0, 21.0, 27.0, 23.0, 17.0, 16.0, 13.0, 10.0, 16.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-47.08586502075195, -45.65842056274414, -44.230979919433594, -42.80353546142578, -41.37609100341797, -39.948646545410156, -38.52120590209961, -37.0937614440918, -35.66632080078125, -34.23887634277344, -32.81143569946289, -31.383991241455078, -29.956546783447266, -28.529104232788086, -27.101661682128906, -25.674217224121094, -24.24677276611328, -22.8193302154541, -21.39188575744629, -19.96444320678711, -18.536998748779297, -17.109556198120117, -15.682113647460938, -14.254670143127441, -12.827226638793945, -11.39978313446045, -9.972339630126953, -8.544897079467773, -7.117453575134277, -5.690010070800781, -4.262567520141602, -2.8351240158081055, -1.407684326171875, 0.019758939743041992, 1.447202205657959, 2.874645233154297, 4.302088737487793, 5.729532241821289, 7.156974792480469, 8.584418296813965, 10.011861801147461, 11.439305305480957, 12.866748809814453, 14.294191360473633, 15.721634864807129, 17.149078369140625, 18.576520919799805, 20.003963470458984, 21.431407928466797, 22.858850479125977, 24.28629493713379, 25.71373748779297, 27.14118194580078, 28.56862449645996, 29.99606704711914, 31.423511505126953, 32.8509521484375, 34.27839660644531, 35.70583724975586, 37.13328170776367, 38.560726165771484, 39.98816680908203, 41.415611267089844, 42.843055725097656, 44.27050018310547]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 9.0, 4.0, 17.0, 9.0, 17.0, 21.0, 30.0, 22.0, 29.0, 33.0, 35.0, 36.0, 53.0, 46.0, 40.0, 66.0, 50.0, 60.0, 48.0, 40.0, 50.0, 37.0, 26.0, 32.0, 15.0, 35.0, 22.0, 18.0, 15.0, 25.0, 12.0, 15.0, 7.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3828125, -7.1075439453125, -6.832275390625, -6.5570068359375, -6.28173828125, -6.0064697265625, -5.731201171875, -5.4559326171875, -5.1806640625, -4.9053955078125, -4.630126953125, -4.3548583984375, -4.07958984375, -3.8043212890625, -3.529052734375, -3.2537841796875, -2.978515625, -2.7032470703125, -2.427978515625, -2.1527099609375, -1.87744140625, -1.6021728515625, -1.326904296875, -1.0516357421875, -0.7763671875, -0.5010986328125, -0.225830078125, 0.0494384765625, 0.32470703125, 0.5999755859375, 0.875244140625, 1.1505126953125, 1.42578125, 1.7010498046875, 1.976318359375, 2.2515869140625, 2.52685546875, 2.8021240234375, 3.077392578125, 3.3526611328125, 3.6279296875, 3.9031982421875, 4.178466796875, 4.4537353515625, 4.72900390625, 5.0042724609375, 5.279541015625, 5.5548095703125, 5.830078125, 6.1053466796875, 6.380615234375, 6.6558837890625, 6.93115234375, 7.2064208984375, 7.481689453125, 7.7569580078125, 8.0322265625, 8.3074951171875, 8.582763671875, 8.8580322265625, 9.13330078125, 9.4085693359375, 9.683837890625, 9.9591064453125, 10.234375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 8.0, 7.0, 5.0, 12.0, 18.0, 25.0, 31.0, 30.0, 37.0, 48.0, 66.0, 108.0, 118.0, 165.0, 261.0, 325.0, 411.0, 800.0, 1843393.0, 2345912.0, 784.0, 442.0, 309.0, 234.0, 168.0, 136.0, 96.0, 76.0, 49.0, 43.0, 31.0, 21.0, 15.0, 26.0, 12.0, 9.0, 8.0, 10.0, 7.0, 5.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-104.3125, -101.0537109375, -97.794921875, -94.5361328125, -91.27734375, -88.0185546875, -84.759765625, -81.5009765625, -78.2421875, -74.9833984375, -71.724609375, -68.4658203125, -65.20703125, -61.9482421875, -58.689453125, -55.4306640625, -52.171875, -48.9130859375, -45.654296875, -42.3955078125, -39.13671875, -35.8779296875, -32.619140625, -29.3603515625, -26.1015625, -22.8427734375, -19.583984375, -16.3251953125, -13.06640625, -9.8076171875, -6.548828125, -3.2900390625, -0.03125, 3.2275390625, 6.486328125, 9.7451171875, 13.00390625, 16.2626953125, 19.521484375, 22.7802734375, 26.0390625, 29.2978515625, 32.556640625, 35.8154296875, 39.07421875, 42.3330078125, 45.591796875, 48.8505859375, 52.109375, 55.3681640625, 58.626953125, 61.8857421875, 65.14453125, 68.4033203125, 71.662109375, 74.9208984375, 78.1796875, 81.4384765625, 84.697265625, 87.9560546875, 91.21484375, 94.4736328125, 97.732421875, 100.9912109375, 104.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 10.0, 6.0, 8.0, 18.0, 17.0, 12.0, 24.0, 33.0, 48.0, 57.0, 84.0, 118.0, 203.0, 320.0, 444.0, 510.0, 560.0, 465.0, 361.0, 225.0, 142.0, 123.0, 59.0, 46.0, 38.0, 33.0, 26.0, 16.0, 16.0, 6.0, 7.0, 7.0, 5.0, 2.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8125, -10.4554443359375, -10.098388671875, -9.7413330078125, -9.38427734375, -9.0272216796875, -8.670166015625, -8.3131103515625, -7.9560546875, -7.5989990234375, -7.241943359375, -6.8848876953125, -6.52783203125, -6.1707763671875, -5.813720703125, -5.4566650390625, -5.099609375, -4.7425537109375, -4.385498046875, -4.0284423828125, -3.67138671875, -3.3143310546875, -2.957275390625, -2.6002197265625, -2.2431640625, -1.8861083984375, -1.529052734375, -1.1719970703125, -0.81494140625, -0.4578857421875, -0.100830078125, 0.2562255859375, 0.61328125, 0.9703369140625, 1.327392578125, 1.6844482421875, 2.04150390625, 2.3985595703125, 2.755615234375, 3.1126708984375, 3.4697265625, 3.8267822265625, 4.183837890625, 4.5408935546875, 4.89794921875, 5.2550048828125, 5.612060546875, 5.9691162109375, 6.326171875, 6.6832275390625, 7.040283203125, 7.3973388671875, 7.75439453125, 8.1114501953125, 8.468505859375, 8.8255615234375, 9.1826171875, 9.5396728515625, 9.896728515625, 10.2537841796875, 10.61083984375, 10.9678955078125, 11.324951171875, 11.6820068359375, 12.0390625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 9.0, 12.0, 20.0, 25.0, 27.0, 33.0, 44.0, 52.0, 57.0, 127.0, 219.0, 913.0, 31108.0, 4136596.0, 23557.0, 838.0, 206.0, 105.0, 84.0, 54.0, 37.0, 25.0, 35.0, 16.0, 13.0, 11.0, 11.0, 12.0, 3.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.78125, -47.74755859375, -45.7138671875, -43.68017578125, -41.646484375, -39.61279296875, -37.5791015625, -35.54541015625, -33.51171875, -31.47802734375, -29.4443359375, -27.41064453125, -25.376953125, -23.34326171875, -21.3095703125, -19.27587890625, -17.2421875, -15.20849609375, -13.1748046875, -11.14111328125, -9.107421875, -7.07373046875, -5.0400390625, -3.00634765625, -0.97265625, 1.06103515625, 3.0947265625, 5.12841796875, 7.162109375, 9.19580078125, 11.2294921875, 13.26318359375, 15.296875, 17.33056640625, 19.3642578125, 21.39794921875, 23.431640625, 25.46533203125, 27.4990234375, 29.53271484375, 31.56640625, 33.60009765625, 35.6337890625, 37.66748046875, 39.701171875, 41.73486328125, 43.7685546875, 45.80224609375, 47.8359375, 49.86962890625, 51.9033203125, 53.93701171875, 55.970703125, 58.00439453125, 60.0380859375, 62.07177734375, 64.10546875, 66.13916015625, 68.1728515625, 70.20654296875, 72.240234375, 74.27392578125, 76.3076171875, 78.34130859375, 80.375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 39.0, 99.0, 194.0, 277.0, 210.0, 122.0, 38.0, 15.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-46.22077178955078, -43.872989654541016, -41.52520751953125, -39.177425384521484, -36.82964324951172, -34.48185729980469, -32.13407516479492, -29.786293029785156, -27.43851089477539, -25.090728759765625, -22.74294662475586, -20.39516258239746, -18.047380447387695, -15.69959831237793, -13.351815223693848, -11.004032135009766, -8.65625, -6.308467388153076, -3.9606847763061523, -1.6129021644592285, 0.7348804473876953, 3.082662582397461, 5.430445671081543, 7.778228759765625, 10.12601089477539, 12.473793029785156, 14.821576118469238, 17.16935920715332, 19.517141342163086, 21.86492347717285, 24.21270751953125, 26.560489654541016, 28.908279418945312, 31.256061553955078, 33.603843688964844, 35.95162582397461, 38.299407958984375, 40.647193908691406, 42.99497604370117, 45.34275817871094, 47.6905403137207, 50.03832244873047, 52.386104583740234, 54.73388671875, 57.08167266845703, 59.42945098876953, 61.77723693847656, 64.12501525878906, 66.4728012084961, 68.82058715820312, 71.16836547851562, 73.51615142822266, 75.86392974853516, 78.21171569824219, 80.55949401855469, 82.90727996826172, 85.25506591796875, 87.60285186767578, 89.95063018798828, 92.29841613769531, 94.64619445800781, 96.99398040771484, 99.34175872802734, 101.68954467773438, 104.03732299804688]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 4.0, 5.0, 13.0, 10.0, 14.0, 12.0, 24.0, 29.0, 29.0, 19.0, 23.0, 30.0, 25.0, 27.0, 35.0, 30.0, 36.0, 40.0, 33.0, 36.0, 46.0, 35.0, 49.0, 41.0, 31.0, 38.0, 31.0, 21.0, 29.0, 33.0, 31.0, 29.0, 16.0, 13.0, 14.0, 10.0, 10.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.1537971496582, -35.039039611816406, -33.92428207397461, -32.80952453613281, -31.694765090942383, -30.580007553100586, -29.465248107910156, -28.35049057006836, -27.235733032226562, -26.120975494384766, -25.00621795654297, -23.89145851135254, -22.776700973510742, -21.661943435668945, -20.547183990478516, -19.43242645263672, -18.317668914794922, -17.202911376953125, -16.088153839111328, -14.973394393920898, -13.858636856079102, -12.743879318237305, -11.629120826721191, -10.514362335205078, -9.399604797363281, -8.284847259521484, -7.170088768005371, -6.055330753326416, -4.940572738647461, -3.825814723968506, -2.711056709289551, -1.5962986946105957, -0.481536865234375, 0.6332211494445801, 1.7479791641235352, 2.8627371788024902, 3.9774951934814453, 5.0922532081604, 6.2070112228393555, 7.3217692375183105, 8.436527252197266, 9.551284790039062, 10.666043281555176, 11.780801773071289, 12.895559310913086, 14.010316848754883, 15.125075340270996, 16.23983383178711, 17.354591369628906, 18.469348907470703, 19.5841064453125, 20.69886589050293, 21.813623428344727, 22.928380966186523, 24.043140411376953, 25.15789794921875, 26.272655487060547, 27.387413024902344, 28.50217056274414, 29.61693000793457, 30.731687545776367, 31.846445083618164, 32.961204528808594, 34.07596206665039, 35.19071960449219]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 14.0, 18.0, 4.0, 10.0, 19.0, 19.0, 25.0, 33.0, 25.0, 27.0, 27.0, 34.0, 38.0, 42.0, 40.0, 42.0, 42.0, 46.0, 40.0, 48.0, 51.0, 31.0, 38.0, 33.0, 36.0, 17.0, 31.0, 15.0, 23.0, 22.0, 18.0, 16.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.62225341796875, -6.3890380859375, -6.15582275390625, -5.922607421875, -5.68939208984375, -5.4561767578125, -5.22296142578125, -4.98974609375, -4.75653076171875, -4.5233154296875, -4.29010009765625, -4.056884765625, -3.82366943359375, -3.5904541015625, -3.35723876953125, -3.1240234375, -2.89080810546875, -2.6575927734375, -2.42437744140625, -2.191162109375, -1.95794677734375, -1.7247314453125, -1.49151611328125, -1.25830078125, -1.02508544921875, -0.7918701171875, -0.55865478515625, -0.325439453125, -0.09222412109375, 0.1409912109375, 0.37420654296875, 0.607421875, 0.84063720703125, 1.0738525390625, 1.30706787109375, 1.540283203125, 1.77349853515625, 2.0067138671875, 2.23992919921875, 2.47314453125, 2.70635986328125, 2.9395751953125, 3.17279052734375, 3.406005859375, 3.63922119140625, 3.8724365234375, 4.10565185546875, 4.3388671875, 4.57208251953125, 4.8052978515625, 5.03851318359375, 5.271728515625, 5.50494384765625, 5.7381591796875, 5.97137451171875, 6.20458984375, 6.43780517578125, 6.6710205078125, 6.90423583984375, 7.137451171875, 7.37066650390625, 7.6038818359375, 7.83709716796875, 8.0703125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 15.0, 30.0, 30.0, 44.0, 71.0, 108.0, 141.0, 205.0, 304.0, 393.0, 613.0, 928.0, 1348.0, 1899.0, 2774.0, 4146.0, 6303.0, 9041.0, 13847.0, 20802.0, 31433.0, 49884.0, 83988.0, 172683.0, 331891.0, 124924.0, 68136.0, 41514.0, 26990.0, 17700.0, 11881.0, 8054.0, 5140.0, 3626.0, 2411.0, 1686.0, 1128.0, 725.0, 559.0, 338.0, 263.0, 174.0, 112.0, 88.0, 49.0, 41.0, 35.0, 18.0, 15.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.615234375, -1.5636444091796875, -1.512054443359375, -1.4604644775390625, -1.40887451171875, -1.3572845458984375, -1.305694580078125, -1.2541046142578125, -1.2025146484375, -1.1509246826171875, -1.099334716796875, -1.0477447509765625, -0.99615478515625, -0.9445648193359375, -0.892974853515625, -0.8413848876953125, -0.789794921875, -0.7382049560546875, -0.686614990234375, -0.6350250244140625, -0.58343505859375, -0.5318450927734375, -0.480255126953125, -0.4286651611328125, -0.3770751953125, -0.3254852294921875, -0.273895263671875, -0.2223052978515625, -0.17071533203125, -0.1191253662109375, -0.067535400390625, -0.0159454345703125, 0.03564453125, 0.0872344970703125, 0.138824462890625, 0.1904144287109375, 0.24200439453125, 0.2935943603515625, 0.345184326171875, 0.3967742919921875, 0.4483642578125, 0.4999542236328125, 0.551544189453125, 0.6031341552734375, 0.65472412109375, 0.7063140869140625, 0.757904052734375, 0.8094940185546875, 0.861083984375, 0.9126739501953125, 0.964263916015625, 1.0158538818359375, 1.06744384765625, 1.1190338134765625, 1.170623779296875, 1.2222137451171875, 1.2738037109375, 1.3253936767578125, 1.376983642578125, 1.4285736083984375, 1.48016357421875, 1.5317535400390625, 1.583343505859375, 1.6349334716796875, 1.6865234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 5.0, 9.0, 14.0, 14.0, 13.0, 14.0, 22.0, 26.0, 23.0, 36.0, 36.0, 32.0, 30.0, 36.0, 41.0, 40.0, 44.0, 40.0, 1069.0, 52.0, 40.0, 48.0, 28.0, 41.0, 30.0, 32.0, 33.0, 28.0, 22.0, 27.0, 20.0, 12.0, 12.0, 10.0, 11.0, 9.0, 6.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0390625, -4.8841552734375, -4.729248046875, -4.5743408203125, -4.41943359375, -4.2645263671875, -4.109619140625, -3.9547119140625, -3.7998046875, -3.6448974609375, -3.489990234375, -3.3350830078125, -3.18017578125, -3.0252685546875, -2.870361328125, -2.7154541015625, -2.560546875, -2.4056396484375, -2.250732421875, -2.0958251953125, -1.94091796875, -1.7860107421875, -1.631103515625, -1.4761962890625, -1.3212890625, -1.1663818359375, -1.011474609375, -0.8565673828125, -0.70166015625, -0.5467529296875, -0.391845703125, -0.2369384765625, -0.08203125, 0.0728759765625, 0.227783203125, 0.3826904296875, 0.53759765625, 0.6925048828125, 0.847412109375, 1.0023193359375, 1.1572265625, 1.3121337890625, 1.467041015625, 1.6219482421875, 1.77685546875, 1.9317626953125, 2.086669921875, 2.2415771484375, 2.396484375, 2.5513916015625, 2.706298828125, 2.8612060546875, 3.01611328125, 3.1710205078125, 3.325927734375, 3.4808349609375, 3.6357421875, 3.7906494140625, 3.945556640625, 4.1004638671875, 4.25537109375, 4.4102783203125, 4.565185546875, 4.7200927734375, 4.875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 10.0, 5.0, 14.0, 19.0, 17.0, 43.0, 56.0, 91.0, 128.0, 208.0, 319.0, 493.0, 712.0, 1211.0, 2047.0, 3523.0, 5876.0, 10409.0, 17870.0, 32775.0, 59742.0, 115996.0, 1401893.0, 232432.0, 96039.0, 50534.0, 27544.0, 15387.0, 8693.0, 5106.0, 3075.0, 1847.0, 1153.0, 689.0, 421.0, 278.0, 167.0, 108.0, 66.0, 45.0, 38.0, 17.0, 14.0, 13.0, 6.0, 3.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.975067138671875, -1.91107177734375, -1.847076416015625, -1.7830810546875, -1.719085693359375, -1.65509033203125, -1.591094970703125, -1.527099609375, -1.463104248046875, -1.39910888671875, -1.335113525390625, -1.2711181640625, -1.207122802734375, -1.14312744140625, -1.079132080078125, -1.01513671875, -0.951141357421875, -0.88714599609375, -0.823150634765625, -0.7591552734375, -0.695159912109375, -0.63116455078125, -0.567169189453125, -0.503173828125, -0.439178466796875, -0.37518310546875, -0.311187744140625, -0.2471923828125, -0.183197021484375, -0.11920166015625, -0.055206298828125, 0.0087890625, 0.072784423828125, 0.13677978515625, 0.200775146484375, 0.2647705078125, 0.328765869140625, 0.39276123046875, 0.456756591796875, 0.520751953125, 0.584747314453125, 0.64874267578125, 0.712738037109375, 0.7767333984375, 0.840728759765625, 0.90472412109375, 0.968719482421875, 1.03271484375, 1.096710205078125, 1.16070556640625, 1.224700927734375, 1.2886962890625, 1.352691650390625, 1.41668701171875, 1.480682373046875, 1.544677734375, 1.608673095703125, 1.67266845703125, 1.736663818359375, 1.8006591796875, 1.864654541015625, 1.92864990234375, 1.992645263671875, 2.056640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 7.0, 3.0, 6.0, 14.0, 10.0, 13.0, 18.0, 20.0, 33.0, 42.0, 62.0, 82.0, 92.0, 94.0, 82.0, 86.0, 87.0, 54.0, 45.0, 34.0, 23.0, 20.0, 17.0, 11.0, 10.0, 3.0, 10.0, 3.0, 1.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0016574859619140625, -0.0016127228736877441, -0.0015679597854614258, -0.0015231966972351074, -0.001478433609008789, -0.0014336705207824707, -0.0013889074325561523, -0.001344144344329834, -0.0012993812561035156, -0.0012546181678771973, -0.001209855079650879, -0.0011650919914245605, -0.0011203289031982422, -0.0010755658149719238, -0.0010308027267456055, -0.0009860396385192871, -0.0009412765502929688, -0.0008965134620666504, -0.000851750373840332, -0.0008069872856140137, -0.0007622241973876953, -0.000717461109161377, -0.0006726980209350586, -0.0006279349327087402, -0.0005831718444824219, -0.0005384087562561035, -0.0004936456680297852, -0.0004488825798034668, -0.00040411949157714844, -0.0003593564033508301, -0.0003145933151245117, -0.00026983022689819336, -0.000225067138671875, -0.00018030405044555664, -0.00013554096221923828, -9.077787399291992e-05, -4.601478576660156e-05, -1.2516975402832031e-06, 4.3511390686035156e-05, 8.827447891235352e-05, 0.00013303756713867188, 0.00017780065536499023, 0.0002225637435913086, 0.00026732683181762695, 0.0003120899200439453, 0.00035685300827026367, 0.00040161609649658203, 0.0004463791847229004, 0.0004911422729492188, 0.0005359053611755371, 0.0005806684494018555, 0.0006254315376281738, 0.0006701946258544922, 0.0007149577140808105, 0.0007597208023071289, 0.0008044838905334473, 0.0008492469787597656, 0.000894010066986084, 0.0009387731552124023, 0.0009835362434387207, 0.001028299331665039, 0.0010730624198913574, 0.0011178255081176758, 0.0011625885963439941, 0.0012073516845703125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 8.0, 10.0, 11.0, 17.0, 28.0, 30.0, 44.0, 71.0, 88.0, 148.0, 221.0, 415.0, 719.0, 2968.0, 1015491.0, 25935.0, 970.0, 485.0, 289.0, 175.0, 106.0, 82.0, 55.0, 35.0, 24.0, 30.0, 17.0, 13.0, 9.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0204010009765625, -0.019664525985717773, -0.018928050994873047, -0.01819157600402832, -0.017455101013183594, -0.016718626022338867, -0.01598215103149414, -0.015245676040649414, -0.014509201049804688, -0.013772726058959961, -0.013036251068115234, -0.012299776077270508, -0.011563301086425781, -0.010826826095581055, -0.010090351104736328, -0.009353876113891602, -0.008617401123046875, -0.007880926132202148, -0.007144451141357422, -0.006407976150512695, -0.005671501159667969, -0.004935026168823242, -0.004198551177978516, -0.003462076187133789, -0.0027256011962890625, -0.001989126205444336, -0.0012526512145996094, -0.0005161762237548828, 0.00022029876708984375, 0.0009567737579345703, 0.0016932487487792969, 0.0024297237396240234, 0.00316619873046875, 0.0039026737213134766, 0.004639148712158203, 0.00537562370300293, 0.006112098693847656, 0.006848573684692383, 0.007585048675537109, 0.008321523666381836, 0.009057998657226562, 0.009794473648071289, 0.010530948638916016, 0.011267423629760742, 0.012003898620605469, 0.012740373611450195, 0.013476848602294922, 0.014213323593139648, 0.014949798583984375, 0.0156862735748291, 0.016422748565673828, 0.017159223556518555, 0.01789569854736328, 0.018632173538208008, 0.019368648529052734, 0.02010512351989746, 0.020841598510742188, 0.021578073501586914, 0.02231454849243164, 0.023051023483276367, 0.023787498474121094, 0.02452397346496582, 0.025260448455810547, 0.025996923446655273, 0.0267333984375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 58.0, 355.0, 466.0, 106.0, 18.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002323971828445792, -0.0022468899842351675, -0.002169807907193899, -0.0020927260629832745, -0.0020156442187726498, -0.0019385621417313814, -0.0018614802975207567, -0.0017843983368948102, -0.0017073163762688637, -0.0016302344156429172, -0.0015531524550169706, -0.001476070610806346, -0.0013989886501803994, -0.001321906689554453, -0.0012448248453438282, -0.0011677428847178817, -0.0010906609240919352, -0.0010135789634659886, -0.000936497061047703, -0.0008594151586294174, -0.0007823331980034709, -0.0007052512373775244, -0.0006281693349592388, -0.0005510874325409532, -0.00047400547191500664, -0.00039692354039289057, -0.0003198416088707745, -0.00024275967734865844, -0.00016567774582654238, -8.859581430442631e-05, -1.1513882782310247e-05, 6.556801963597536e-05, 0.00014264998026192188, 0.00021973191178403795, 0.000296813843306154, 0.0003738957748282701, 0.00045097770635038614, 0.0005280596669763327, 0.0006051415693946183, 0.0006822234718129039, 0.0007593054324388504, 0.0008363873930647969, 0.0009134692954830825, 0.0009905511979013681, 0.0010676331585273147, 0.0011447151191532612, 0.0012217969633638859, 0.0012988789239898324, 0.001375960884615779, 0.0014530428452417254, 0.001530124805867672, 0.0016072066500782967, 0.0016842886107042432, 0.0017613705713301897, 0.0018384524155408144, 0.001915534376166761, 0.0019926163367927074, 0.002069698181003332, 0.0021467802580446005, 0.002223862102255225, 0.0023009441792964935, 0.0023780260235071182, 0.002455107867717743, 0.0025321897119283676, 0.002609271788969636]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 4.0, 7.0, 8.0, 13.0, 7.0, 11.0, 13.0, 16.0, 22.0, 20.0, 23.0, 17.0, 20.0, 32.0, 18.0, 23.0, 23.0, 37.0, 39.0, 36.0, 34.0, 45.0, 35.0, 24.0, 42.0, 35.0, 43.0, 22.0, 25.0, 28.0, 29.0, 25.0, 28.0, 25.0, 24.0, 16.0, 21.0, 14.0, 9.0, 11.0, 12.0, 19.0, 9.0, 7.0, 2.0, 3.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0], "bins": [-0.0005110502243041992, -0.0004959879443049431, -0.00048092566430568695, -0.0004658633843064308, -0.0004508011043071747, -0.00043573882430791855, -0.0004206765443086624, -0.0004056142643094063, -0.00039055198431015015, -0.000375489704310894, -0.0003604274243116379, -0.00034536514431238174, -0.0003303028643131256, -0.0003152405843138695, -0.00030017830431461334, -0.0002851160243153572, -0.0002700537443161011, -0.00025499146431684494, -0.0002399291843175888, -0.00022486690431833267, -0.00020980462431907654, -0.0001947423443198204, -0.00017968006432056427, -0.00016461778432130814, -0.000149555504322052, -0.00013449322432279587, -0.00011943094432353973, -0.0001043686643242836, -8.930638432502747e-05, -7.424410432577133e-05, -5.91818243265152e-05, -4.4119544327259064e-05, -2.905726432800293e-05, -1.3994984328746796e-05, 1.0672956705093384e-06, 1.6129575669765472e-05, 3.1191855669021606e-05, 4.625413566827774e-05, 6.131641566753387e-05, 7.637869566679001e-05, 9.144097566604614e-05, 0.00010650325566530228, 0.00012156553566455841, 0.00013662781566381454, 0.00015169009566307068, 0.0001667523756623268, 0.00018181465566158295, 0.00019687693566083908, 0.00021193921566009521, 0.00022700149565935135, 0.00024206377565860748, 0.0002571260556578636, 0.00027218833565711975, 0.0002872506156563759, 0.000302312895655632, 0.00031737517565488815, 0.0003324374556541443, 0.0003474997356534004, 0.00036256201565265656, 0.0003776242956519127, 0.0003926865756511688, 0.00040774885565042496, 0.0004228111356496811, 0.0004378734156489372, 0.00045293569564819336]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 13.0, 19.0, 4.0, 10.0, 19.0, 19.0, 25.0, 33.0, 25.0, 27.0, 27.0, 34.0, 38.0, 42.0, 40.0, 42.0, 42.0, 46.0, 40.0, 48.0, 51.0, 31.0, 38.0, 33.0, 36.0, 17.0, 31.0, 15.0, 23.0, 22.0, 18.0, 16.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.62225341796875, -6.3890380859375, -6.15582275390625, -5.922607421875, -5.68939208984375, -5.4561767578125, -5.22296142578125, -4.98974609375, -4.75653076171875, -4.5233154296875, -4.29010009765625, -4.056884765625, -3.82366943359375, -3.5904541015625, -3.35723876953125, -3.1240234375, -2.89080810546875, -2.6575927734375, -2.42437744140625, -2.191162109375, -1.95794677734375, -1.7247314453125, -1.49151611328125, -1.25830078125, -1.02508544921875, -0.7918701171875, -0.55865478515625, -0.325439453125, -0.09222412109375, 0.1409912109375, 0.37420654296875, 0.607421875, 0.84063720703125, 1.0738525390625, 1.30706787109375, 1.540283203125, 1.77349853515625, 2.0067138671875, 2.23992919921875, 2.47314453125, 2.70635986328125, 2.9395751953125, 3.17279052734375, 3.406005859375, 3.63922119140625, 3.8724365234375, 4.10565185546875, 4.3388671875, 4.57208251953125, 4.8052978515625, 5.03851318359375, 5.271728515625, 5.50494384765625, 5.7381591796875, 5.97137451171875, 6.20458984375, 6.43780517578125, 6.6710205078125, 6.90423583984375, 7.137451171875, 7.37066650390625, 7.6038818359375, 7.83709716796875, 8.0703125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 11.0, 9.0, 20.0, 17.0, 21.0, 34.0, 38.0, 69.0, 79.0, 99.0, 134.0, 160.0, 237.0, 339.0, 443.0, 547.0, 791.0, 1021.0, 1482.0, 2707.0, 9650.0, 79444.0, 495377.0, 387555.0, 53669.0, 7099.0, 2218.0, 1405.0, 963.0, 764.0, 536.0, 418.0, 318.0, 194.0, 179.0, 119.0, 107.0, 88.0, 48.0, 38.0, 24.0, 25.0, 13.0, 15.0, 8.0, 6.0, 9.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.8359375, -13.3883056640625, -12.940673828125, -12.4930419921875, -12.04541015625, -11.5977783203125, -11.150146484375, -10.7025146484375, -10.2548828125, -9.8072509765625, -9.359619140625, -8.9119873046875, -8.46435546875, -8.0167236328125, -7.569091796875, -7.1214599609375, -6.673828125, -6.2261962890625, -5.778564453125, -5.3309326171875, -4.88330078125, -4.4356689453125, -3.988037109375, -3.5404052734375, -3.0927734375, -2.6451416015625, -2.197509765625, -1.7498779296875, -1.30224609375, -0.8546142578125, -0.406982421875, 0.0406494140625, 0.48828125, 0.9359130859375, 1.383544921875, 1.8311767578125, 2.27880859375, 2.7264404296875, 3.174072265625, 3.6217041015625, 4.0693359375, 4.5169677734375, 4.964599609375, 5.4122314453125, 5.85986328125, 6.3074951171875, 6.755126953125, 7.2027587890625, 7.650390625, 8.0980224609375, 8.545654296875, 8.9932861328125, 9.44091796875, 9.8885498046875, 10.336181640625, 10.7838134765625, 11.2314453125, 11.6790771484375, 12.126708984375, 12.5743408203125, 13.02197265625, 13.4696044921875, 13.917236328125, 14.3648681640625, 14.8125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 12.0, 14.0, 15.0, 19.0, 25.0, 45.0, 43.0, 65.0, 77.0, 99.0, 215.0, 1678.0, 276.0, 124.0, 70.0, 54.0, 41.0, 57.0, 37.0, 20.0, 21.0, 6.0, 11.0, 6.0, 10.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.578125, -28.612060546875, -27.64599609375, -26.679931640625, -25.7138671875, -24.747802734375, -23.78173828125, -22.815673828125, -21.849609375, -20.883544921875, -19.91748046875, -18.951416015625, -17.9853515625, -17.019287109375, -16.05322265625, -15.087158203125, -14.12109375, -13.155029296875, -12.18896484375, -11.222900390625, -10.2568359375, -9.290771484375, -8.32470703125, -7.358642578125, -6.392578125, -5.426513671875, -4.46044921875, -3.494384765625, -2.5283203125, -1.562255859375, -0.59619140625, 0.369873046875, 1.3359375, 2.302001953125, 3.26806640625, 4.234130859375, 5.2001953125, 6.166259765625, 7.13232421875, 8.098388671875, 9.064453125, 10.030517578125, 10.99658203125, 11.962646484375, 12.9287109375, 13.894775390625, 14.86083984375, 15.826904296875, 16.79296875, 17.759033203125, 18.72509765625, 19.691162109375, 20.6572265625, 21.623291015625, 22.58935546875, 23.555419921875, 24.521484375, 25.487548828125, 26.45361328125, 27.419677734375, 28.3857421875, 29.351806640625, 30.31787109375, 31.283935546875, 32.25]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 10.0, 5.0, 5.0, 7.0, 17.0, 12.0, 18.0, 23.0, 27.0, 47.0, 62.0, 78.0, 122.0, 187.0, 295.0, 499.0, 913.0, 2354.0, 2840822.0, 296095.0, 1937.0, 843.0, 467.0, 281.0, 159.0, 120.0, 70.0, 62.0, 34.0, 30.0, 24.0, 17.0, 14.0, 15.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.6875, -73.31640625, -70.9453125, -68.57421875, -66.203125, -63.83203125, -61.4609375, -59.08984375, -56.71875, -54.34765625, -51.9765625, -49.60546875, -47.234375, -44.86328125, -42.4921875, -40.12109375, -37.75, -35.37890625, -33.0078125, -30.63671875, -28.265625, -25.89453125, -23.5234375, -21.15234375, -18.78125, -16.41015625, -14.0390625, -11.66796875, -9.296875, -6.92578125, -4.5546875, -2.18359375, 0.1875, 2.55859375, 4.9296875, 7.30078125, 9.671875, 12.04296875, 14.4140625, 16.78515625, 19.15625, 21.52734375, 23.8984375, 26.26953125, 28.640625, 31.01171875, 33.3828125, 35.75390625, 38.125, 40.49609375, 42.8671875, 45.23828125, 47.609375, 49.98046875, 52.3515625, 54.72265625, 57.09375, 59.46484375, 61.8359375, 64.20703125, 66.578125, 68.94921875, 71.3203125, 73.69140625, 76.0625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 95.0, 654.0, 237.0, 19.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.23116302490234, -74.19345092773438, -69.15573120117188, -64.1180191040039, -59.080299377441406, -54.04258728027344, -49.0048713684082, -43.96715545654297, -38.929439544677734, -33.8917236328125, -28.854007720947266, -23.816293716430664, -18.77857780456543, -13.740861892700195, -8.703147888183594, -3.6654319763183594, 1.372283935546875, 6.409999370574951, 11.447714805603027, 16.485429763793945, 21.52314567565918, 26.560861587524414, 31.598575592041016, 36.63629150390625, 41.674007415771484, 46.71172332763672, 51.74943923950195, 56.78715515136719, 61.824867248535156, 66.86258697509766, 71.90029907226562, 76.93801879882812, 81.97572326660156, 87.01343536376953, 92.05115509033203, 97.0888671875, 102.1265869140625, 107.16429901123047, 112.20201110839844, 117.23973083496094, 122.27745056152344, 127.3151626586914, 132.35287475585938, 137.39059448242188, 142.42831420898438, 147.46603393554688, 152.5037384033203, 157.5414581298828, 162.57916259765625, 167.61688232421875, 172.6545867919922, 177.6923065185547, 182.7300262451172, 187.7677459716797, 192.80545043945312, 197.84317016601562, 202.88088989257812, 207.91860961914062, 212.95631408691406, 217.99403381347656, 223.03175354003906, 228.06947326660156, 233.107177734375, 238.1448974609375, 243.1826171875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 9.0, 5.0, 9.0, 5.0, 9.0, 10.0, 19.0, 18.0, 15.0, 24.0, 23.0, 28.0, 29.0, 27.0, 31.0, 39.0, 33.0, 41.0, 52.0, 37.0, 42.0, 34.0, 50.0, 44.0, 28.0, 48.0, 44.0, 34.0, 33.0, 28.0, 31.0, 22.0, 22.0, 16.0, 14.0, 13.0, 10.0, 7.0, 4.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.58242416381836, -58.814056396484375, -57.045684814453125, -55.277313232421875, -53.50894546508789, -51.740577697753906, -49.972206115722656, -48.203834533691406, -46.43546676635742, -44.66709899902344, -42.89872741699219, -41.13035583496094, -39.36198806762695, -37.59362030029297, -35.82524871826172, -34.05687713623047, -32.288509368896484, -30.520139694213867, -28.75177001953125, -26.983400344848633, -25.215030670166016, -23.4466609954834, -21.67829132080078, -19.909921646118164, -18.141551971435547, -16.37318229675293, -14.604812622070312, -12.836442947387695, -11.068073272705078, -9.299703598022461, -7.531333923339844, -5.762964248657227, -3.9945945739746094, -2.226224899291992, -0.457855224609375, 1.3105144500732422, 3.0788841247558594, 4.847253799438477, 6.615623474121094, 8.383993148803711, 10.152362823486328, 11.920732498168945, 13.689102172851562, 15.45747184753418, 17.225841522216797, 18.994211196899414, 20.76258087158203, 22.53095054626465, 24.299320220947266, 26.067689895629883, 27.8360595703125, 29.604429244995117, 31.372798919677734, 33.14116668701172, 34.90953826904297, 36.67790985107422, 38.4462776184082, 40.21464538574219, 41.98301696777344, 43.75138854980469, 45.51975631713867, 47.288124084472656, 49.056495666503906, 50.824867248535156, 52.59323501586914]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 11.0, 21.0, 18.0, 18.0, 23.0, 27.0, 26.0, 24.0, 29.0, 37.0, 34.0, 51.0, 36.0, 44.0, 44.0, 55.0, 46.0, 35.0, 41.0, 27.0, 29.0, 35.0, 32.0, 36.0, 34.0, 27.0, 15.0, 16.0, 20.0, 17.0, 12.0, 9.0, 7.0, 14.0, 5.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.1199951171875, -6.880615234375, -6.6412353515625, -6.40185546875, -6.1624755859375, -5.923095703125, -5.6837158203125, -5.4443359375, -5.2049560546875, -4.965576171875, -4.7261962890625, -4.48681640625, -4.2474365234375, -4.008056640625, -3.7686767578125, -3.529296875, -3.2899169921875, -3.050537109375, -2.8111572265625, -2.57177734375, -2.3323974609375, -2.093017578125, -1.8536376953125, -1.6142578125, -1.3748779296875, -1.135498046875, -0.8961181640625, -0.65673828125, -0.4173583984375, -0.177978515625, 0.0614013671875, 0.30078125, 0.5401611328125, 0.779541015625, 1.0189208984375, 1.25830078125, 1.4976806640625, 1.737060546875, 1.9764404296875, 2.2158203125, 2.4552001953125, 2.694580078125, 2.9339599609375, 3.17333984375, 3.4127197265625, 3.652099609375, 3.8914794921875, 4.130859375, 4.3702392578125, 4.609619140625, 4.8489990234375, 5.08837890625, 5.3277587890625, 5.567138671875, 5.8065185546875, 6.0458984375, 6.2852783203125, 6.524658203125, 6.7640380859375, 7.00341796875, 7.2427978515625, 7.482177734375, 7.7215576171875, 7.9609375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 10.0, 10.0, 16.0, 19.0, 27.0, 24.0, 38.0, 44.0, 64.0, 81.0, 126.0, 185.0, 237.0, 480.0, 961.0, 2737.0, 8995.0, 52942.0, 521239.0, 2295847.0, 1154549.0, 131523.0, 16741.0, 4173.0, 1468.0, 673.0, 325.0, 201.0, 134.0, 96.0, 77.0, 50.0, 46.0, 27.0, 31.0, 21.0, 12.0, 13.0, 10.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-14.8359375, -14.42041015625, -14.0048828125, -13.58935546875, -13.173828125, -12.75830078125, -12.3427734375, -11.92724609375, -11.51171875, -11.09619140625, -10.6806640625, -10.26513671875, -9.849609375, -9.43408203125, -9.0185546875, -8.60302734375, -8.1875, -7.77197265625, -7.3564453125, -6.94091796875, -6.525390625, -6.10986328125, -5.6943359375, -5.27880859375, -4.86328125, -4.44775390625, -4.0322265625, -3.61669921875, -3.201171875, -2.78564453125, -2.3701171875, -1.95458984375, -1.5390625, -1.12353515625, -0.7080078125, -0.29248046875, 0.123046875, 0.53857421875, 0.9541015625, 1.36962890625, 1.78515625, 2.20068359375, 2.6162109375, 3.03173828125, 3.447265625, 3.86279296875, 4.2783203125, 4.69384765625, 5.109375, 5.52490234375, 5.9404296875, 6.35595703125, 6.771484375, 7.18701171875, 7.6025390625, 8.01806640625, 8.43359375, 8.84912109375, 9.2646484375, 9.68017578125, 10.095703125, 10.51123046875, 10.9267578125, 11.34228515625, 11.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 5.0, 7.0, 16.0, 27.0, 32.0, 58.0, 99.0, 112.0, 202.0, 345.0, 564.0, 808.0, 606.0, 431.0, 267.0, 164.0, 109.0, 79.0, 48.0, 31.0, 23.0, 14.0, 11.0, 7.0, 0.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.828125, -16.220703125, -15.61328125, -15.005859375, -14.3984375, -13.791015625, -13.18359375, -12.576171875, -11.96875, -11.361328125, -10.75390625, -10.146484375, -9.5390625, -8.931640625, -8.32421875, -7.716796875, -7.109375, -6.501953125, -5.89453125, -5.287109375, -4.6796875, -4.072265625, -3.46484375, -2.857421875, -2.25, -1.642578125, -1.03515625, -0.427734375, 0.1796875, 0.787109375, 1.39453125, 2.001953125, 2.609375, 3.216796875, 3.82421875, 4.431640625, 5.0390625, 5.646484375, 6.25390625, 6.861328125, 7.46875, 8.076171875, 8.68359375, 9.291015625, 9.8984375, 10.505859375, 11.11328125, 11.720703125, 12.328125, 12.935546875, 13.54296875, 14.150390625, 14.7578125, 15.365234375, 15.97265625, 16.580078125, 17.1875, 17.794921875, 18.40234375, 19.009765625, 19.6171875, 20.224609375, 20.83203125, 21.439453125, 22.046875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 16.0, 15.0, 34.0, 48.0, 88.0, 139.0, 248.0, 482.0, 1093.0, 3090.0, 25981.0, 3166873.0, 979806.0, 12284.0, 2301.0, 876.0, 404.0, 189.0, 135.0, 57.0, 40.0, 21.0, 21.0, 2.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -35.84716796875, -34.7568359375, -33.66650390625, -32.576171875, -31.48583984375, -30.3955078125, -29.30517578125, -28.21484375, -27.12451171875, -26.0341796875, -24.94384765625, -23.853515625, -22.76318359375, -21.6728515625, -20.58251953125, -19.4921875, -18.40185546875, -17.3115234375, -16.22119140625, -15.130859375, -14.04052734375, -12.9501953125, -11.85986328125, -10.76953125, -9.67919921875, -8.5888671875, -7.49853515625, -6.408203125, -5.31787109375, -4.2275390625, -3.13720703125, -2.046875, -0.95654296875, 0.1337890625, 1.22412109375, 2.314453125, 3.40478515625, 4.4951171875, 5.58544921875, 6.67578125, 7.76611328125, 8.8564453125, 9.94677734375, 11.037109375, 12.12744140625, 13.2177734375, 14.30810546875, 15.3984375, 16.48876953125, 17.5791015625, 18.66943359375, 19.759765625, 20.85009765625, 21.9404296875, 23.03076171875, 24.12109375, 25.21142578125, 26.3017578125, 27.39208984375, 28.482421875, 29.57275390625, 30.6630859375, 31.75341796875, 32.84375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 30.0, 610.0, 367.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.8099670410156, -322.9875793457031, -312.1651916503906, -301.3428039550781, -290.5204162597656, -279.6980285644531, -268.8756103515625, -258.05322265625, -247.23085021972656, -236.40846252441406, -225.58607482910156, -214.763671875, -203.9412841796875, -193.118896484375, -182.2965087890625, -171.47412109375, -160.6517333984375, -149.829345703125, -139.0069580078125, -128.1845703125, -117.36217498779297, -106.53978729248047, -95.71739196777344, -84.89500427246094, -74.07261657714844, -63.25022888183594, -52.42783737182617, -41.605445861816406, -30.783058166503906, -19.960670471191406, -9.138275146484375, 1.684112548828125, 12.50653076171875, 23.328920364379883, 34.151309967041016, 44.97370147705078, 55.79608917236328, 66.61847686767578, 77.44087219238281, 88.26325988769531, 99.08564758300781, 109.90803527832031, 120.73042297363281, 131.55282592773438, 142.37521362304688, 153.19760131835938, 164.01998901367188, 174.84237670898438, 185.66476440429688, 196.48715209960938, 207.30953979492188, 218.13192749023438, 228.95431518554688, 239.77670288085938, 250.59910583496094, 261.4215087890625, 272.243896484375, 283.0662841796875, 293.888671875, 304.7110595703125, 315.533447265625, 326.3558349609375, 337.17822265625, 348.0006103515625, 358.822998046875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 8.0, 8.0, 6.0, 13.0, 11.0, 12.0, 17.0, 31.0, 25.0, 16.0, 26.0, 31.0, 41.0, 33.0, 36.0, 34.0, 31.0, 35.0, 41.0, 42.0, 38.0, 31.0, 28.0, 41.0, 27.0, 44.0, 25.0, 29.0, 29.0, 25.0, 25.0, 16.0, 24.0, 25.0, 18.0, 13.0, 10.0, 9.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-46.265296936035156, -44.86012268066406, -43.45494842529297, -42.049774169921875, -40.64459991455078, -39.23942565917969, -37.834251403808594, -36.4290771484375, -35.023902893066406, -33.61872863769531, -32.21355438232422, -30.808380126953125, -29.40320587158203, -27.998031616210938, -26.592859268188477, -25.187685012817383, -23.782512664794922, -22.377338409423828, -20.972164154052734, -19.56698989868164, -18.161815643310547, -16.756641387939453, -15.351469039916992, -13.946294784545898, -12.541120529174805, -11.135946273803711, -9.730772018432617, -8.32559871673584, -6.920424461364746, -5.515250205993652, -4.110076904296875, -2.7049026489257812, -1.2997283935546875, 0.10544562339782715, 1.5106196403503418, 2.9157934188842773, 4.320967674255371, 5.726141929626465, 7.131315231323242, 8.536489486694336, 9.94166374206543, 11.346837997436523, 12.752012252807617, 14.157185554504395, 15.562359809875488, 16.967533111572266, 18.37270736694336, 19.777881622314453, 21.183055877685547, 22.58823013305664, 23.993404388427734, 25.398578643798828, 26.803752899169922, 28.208927154541016, 29.614099502563477, 31.01927375793457, 32.42444610595703, 33.829620361328125, 35.23479461669922, 36.63996887207031, 38.045143127441406, 39.4503173828125, 40.855491638183594, 42.26066589355469, 43.66584014892578]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 11.0, 10.0, 12.0, 15.0, 17.0, 23.0, 22.0, 31.0, 30.0, 33.0, 44.0, 42.0, 45.0, 44.0, 44.0, 56.0, 49.0, 59.0, 48.0, 44.0, 46.0, 41.0, 34.0, 40.0, 26.0, 15.0, 18.0, 12.0, 13.0, 15.0, 10.0, 9.0, 7.0, 9.0, 5.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.22357177734375, -5.0213623046875, -4.81915283203125, -4.616943359375, -4.41473388671875, -4.2125244140625, -4.01031494140625, -3.80810546875, -3.60589599609375, -3.4036865234375, -3.20147705078125, -2.999267578125, -2.79705810546875, -2.5948486328125, -2.39263916015625, -2.1904296875, -1.98822021484375, -1.7860107421875, -1.58380126953125, -1.381591796875, -1.17938232421875, -0.9771728515625, -0.77496337890625, -0.57275390625, -0.37054443359375, -0.1683349609375, 0.03387451171875, 0.236083984375, 0.43829345703125, 0.6405029296875, 0.84271240234375, 1.044921875, 1.24713134765625, 1.4493408203125, 1.65155029296875, 1.853759765625, 2.05596923828125, 2.2581787109375, 2.46038818359375, 2.66259765625, 2.86480712890625, 3.0670166015625, 3.26922607421875, 3.471435546875, 3.67364501953125, 3.8758544921875, 4.07806396484375, 4.2802734375, 4.48248291015625, 4.6846923828125, 4.88690185546875, 5.089111328125, 5.29132080078125, 5.4935302734375, 5.69573974609375, 5.89794921875, 6.10015869140625, 6.3023681640625, 6.50457763671875, 6.706787109375, 6.90899658203125, 7.1112060546875, 7.31341552734375, 7.515625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 10.0, 16.0, 24.0, 39.0, 74.0, 78.0, 142.0, 211.0, 318.0, 539.0, 870.0, 1437.0, 2376.0, 3834.0, 6543.0, 10928.0, 19413.0, 36398.0, 72842.0, 165582.0, 423366.0, 154485.0, 68827.0, 34860.0, 18853.0, 10633.0, 6172.0, 3721.0, 2250.0, 1426.0, 833.0, 537.0, 342.0, 216.0, 126.0, 72.0, 57.0, 31.0, 15.0, 13.0, 21.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4718017578125, -1.418212890625, -1.3646240234375, -1.31103515625, -1.2574462890625, -1.203857421875, -1.1502685546875, -1.0966796875, -1.0430908203125, -0.989501953125, -0.9359130859375, -0.88232421875, -0.8287353515625, -0.775146484375, -0.7215576171875, -0.66796875, -0.6143798828125, -0.560791015625, -0.5072021484375, -0.45361328125, -0.4000244140625, -0.346435546875, -0.2928466796875, -0.2392578125, -0.1856689453125, -0.132080078125, -0.0784912109375, -0.02490234375, 0.0286865234375, 0.082275390625, 0.1358642578125, 0.189453125, 0.2430419921875, 0.296630859375, 0.3502197265625, 0.40380859375, 0.4573974609375, 0.510986328125, 0.5645751953125, 0.6181640625, 0.6717529296875, 0.725341796875, 0.7789306640625, 0.83251953125, 0.8861083984375, 0.939697265625, 0.9932861328125, 1.046875, 1.1004638671875, 1.154052734375, 1.2076416015625, 1.26123046875, 1.3148193359375, 1.368408203125, 1.4219970703125, 1.4755859375, 1.5291748046875, 1.582763671875, 1.6363525390625, 1.68994140625, 1.7435302734375, 1.797119140625, 1.8507080078125, 1.904296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 2.0, 13.0, 5.0, 4.0, 11.0, 6.0, 15.0, 17.0, 19.0, 18.0, 17.0, 34.0, 31.0, 34.0, 37.0, 34.0, 44.0, 49.0, 42.0, 42.0, 42.0, 1061.0, 31.0, 42.0, 30.0, 54.0, 43.0, 31.0, 31.0, 25.0, 17.0, 23.0, 13.0, 20.0, 17.0, 13.0, 14.0, 9.0, 9.0, 12.0, 5.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.50115966796875, -3.3851318359375, -3.26910400390625, -3.153076171875, -3.03704833984375, -2.9210205078125, -2.80499267578125, -2.68896484375, -2.57293701171875, -2.4569091796875, -2.34088134765625, -2.224853515625, -2.10882568359375, -1.9927978515625, -1.87677001953125, -1.7607421875, -1.64471435546875, -1.5286865234375, -1.41265869140625, -1.296630859375, -1.18060302734375, -1.0645751953125, -0.94854736328125, -0.83251953125, -0.71649169921875, -0.6004638671875, -0.48443603515625, -0.368408203125, -0.25238037109375, -0.1363525390625, -0.02032470703125, 0.095703125, 0.21173095703125, 0.3277587890625, 0.44378662109375, 0.559814453125, 0.67584228515625, 0.7918701171875, 0.90789794921875, 1.02392578125, 1.13995361328125, 1.2559814453125, 1.37200927734375, 1.488037109375, 1.60406494140625, 1.7200927734375, 1.83612060546875, 1.9521484375, 2.06817626953125, 2.1842041015625, 2.30023193359375, 2.416259765625, 2.53228759765625, 2.6483154296875, 2.76434326171875, 2.88037109375, 2.99639892578125, 3.1124267578125, 3.22845458984375, 3.344482421875, 3.46051025390625, 3.5765380859375, 3.69256591796875, 3.80859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 9.0, 11.0, 23.0, 25.0, 33.0, 81.0, 94.0, 164.0, 300.0, 455.0, 707.0, 1186.0, 1922.0, 2920.0, 4900.0, 8128.0, 13890.0, 23675.0, 42735.0, 80268.0, 172447.0, 1424108.0, 152520.0, 73234.0, 38932.0, 21746.0, 12840.0, 7858.0, 4571.0, 2841.0, 1690.0, 1009.0, 606.0, 397.0, 271.0, 181.0, 117.0, 84.0, 46.0, 35.0, 19.0, 27.0, 12.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.58984375, -1.5422821044921875, -1.494720458984375, -1.4471588134765625, -1.39959716796875, -1.3520355224609375, -1.304473876953125, -1.2569122314453125, -1.2093505859375, -1.1617889404296875, -1.114227294921875, -1.0666656494140625, -1.01910400390625, -0.9715423583984375, -0.923980712890625, -0.8764190673828125, -0.828857421875, -0.7812957763671875, -0.733734130859375, -0.6861724853515625, -0.63861083984375, -0.5910491943359375, -0.543487548828125, -0.4959259033203125, -0.4483642578125, -0.4008026123046875, -0.353240966796875, -0.3056793212890625, -0.25811767578125, -0.2105560302734375, -0.162994384765625, -0.1154327392578125, -0.06787109375, -0.0203094482421875, 0.027252197265625, 0.0748138427734375, 0.12237548828125, 0.1699371337890625, 0.217498779296875, 0.2650604248046875, 0.3126220703125, 0.3601837158203125, 0.407745361328125, 0.4553070068359375, 0.50286865234375, 0.5504302978515625, 0.597991943359375, 0.6455535888671875, 0.693115234375, 0.7406768798828125, 0.788238525390625, 0.8358001708984375, 0.88336181640625, 0.9309234619140625, 0.978485107421875, 1.0260467529296875, 1.0736083984375, 1.1211700439453125, 1.168731689453125, 1.2162933349609375, 1.26385498046875, 1.3114166259765625, 1.358978271484375, 1.4065399169921875, 1.4541015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 11.0, 12.0, 20.0, 18.0, 26.0, 26.0, 45.0, 69.0, 99.0, 115.0, 133.0, 107.0, 76.0, 50.0, 38.0, 24.0, 20.0, 19.0, 16.0, 8.0, 7.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001506805419921875, -0.0014551132917404175, -0.00140342116355896, -0.0013517290353775024, -0.001300036907196045, -0.0012483447790145874, -0.0011966526508331299, -0.0011449605226516724, -0.0010932683944702148, -0.0010415762662887573, -0.0009898841381072998, -0.0009381920099258423, -0.0008864998817443848, -0.0008348077535629272, -0.0007831156253814697, -0.0007314234972000122, -0.0006797313690185547, -0.0006280392408370972, -0.0005763471126556396, -0.0005246549844741821, -0.0004729628562927246, -0.0004212707281112671, -0.00036957859992980957, -0.00031788647174835205, -0.00026619434356689453, -0.000214502215385437, -0.0001628100872039795, -0.00011111795902252197, -5.942583084106445e-05, -7.733702659606934e-06, 4.3958425521850586e-05, 9.56505537033081e-05, 0.00014734268188476562, 0.00019903481006622314, 0.00025072693824768066, 0.0003024190664291382, 0.0003541111946105957, 0.0004058033227920532, 0.00045749545097351074, 0.0005091875791549683, 0.0005608797073364258, 0.0006125718355178833, 0.0006642639636993408, 0.0007159560918807983, 0.0007676482200622559, 0.0008193403482437134, 0.0008710324764251709, 0.0009227246046066284, 0.0009744167327880859, 0.0010261088609695435, 0.001077800989151001, 0.0011294931173324585, 0.001181185245513916, 0.0012328773736953735, 0.001284569501876831, 0.0013362616300582886, 0.001387953758239746, 0.0014396458864212036, 0.0014913380146026611, 0.0015430301427841187, 0.0015947222709655762, 0.0016464143991470337, 0.0016981065273284912, 0.0017497986555099487, 0.0018014907836914062]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 3.0, 4.0, 7.0, 10.0, 11.0, 20.0, 24.0, 23.0, 34.0, 35.0, 76.0, 92.0, 144.0, 256.0, 502.0, 1432.0, 1024169.0, 19978.0, 784.0, 347.0, 201.0, 108.0, 72.0, 52.0, 34.0, 33.0, 25.0, 13.0, 16.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.035125732421875, -0.03411531448364258, -0.033104896545410156, -0.032094478607177734, -0.031084060668945312, -0.03007364273071289, -0.02906322479248047, -0.028052806854248047, -0.027042388916015625, -0.026031970977783203, -0.02502155303955078, -0.02401113510131836, -0.023000717163085938, -0.021990299224853516, -0.020979881286621094, -0.019969463348388672, -0.01895904541015625, -0.017948627471923828, -0.016938209533691406, -0.015927791595458984, -0.014917373657226562, -0.01390695571899414, -0.012896537780761719, -0.011886119842529297, -0.010875701904296875, -0.009865283966064453, -0.008854866027832031, -0.00784444808959961, -0.0068340301513671875, -0.005823612213134766, -0.004813194274902344, -0.003802776336669922, -0.0027923583984375, -0.0017819404602050781, -0.0007715225219726562, 0.00023889541625976562, 0.0012493133544921875, 0.0022597312927246094, 0.0032701492309570312, 0.004280567169189453, 0.005290985107421875, 0.006301403045654297, 0.007311820983886719, 0.00832223892211914, 0.009332656860351562, 0.010343074798583984, 0.011353492736816406, 0.012363910675048828, 0.01337432861328125, 0.014384746551513672, 0.015395164489746094, 0.016405582427978516, 0.017416000366210938, 0.01842641830444336, 0.01943683624267578, 0.020447254180908203, 0.021457672119140625, 0.022468090057373047, 0.02347850799560547, 0.02448892593383789, 0.025499343872070312, 0.026509761810302734, 0.027520179748535156, 0.028530597686767578, 0.029541015625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 12.0, 24.0, 94.0, 266.0, 334.0, 194.0, 59.0, 16.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007651117048226297, -0.0007182001136243343, -0.000671288522426039, -0.0006243769312277436, -0.0005774653982371092, -0.0005305537488311529, -0.0004836422158405185, -0.0004367306246422231, -0.00038981903344392776, -0.0003429074422456324, -0.00029599585104733706, -0.00024908428895287216, -0.0002021726977545768, -0.00015526110655628145, -0.00010834954446181655, -6.14379532635212e-05, -1.452636206522584e-05, 3.23852218571119e-05, 7.929680577944964e-05, 0.00012620838242582977, 0.00017311997362412512, 0.00022003156482242048, 0.0002669431269168854, 0.00031385471811518073, 0.0003607663093134761, 0.00040767790051177144, 0.0004545894917100668, 0.0005015010247007012, 0.0005484126741066575, 0.000595324207097292, 0.0006422357982955873, 0.0006891473894938827, 0.0007360589224845171, 0.0007829705136828125, 0.0008298821048811078, 0.0008767936378717422, 0.0009237052872776985, 0.000970616820268333, 0.0010175283532589674, 0.0010644400026649237, 0.00111135165207088, 0.0011582631850615144, 0.0012051748344674706, 0.001252086367458105, 0.0012989980168640614, 0.0013459095498546958, 0.0013928210828453302, 0.0014397327322512865, 0.001486644265241921, 0.0015335557982325554, 0.0015804674476385117, 0.001627378980629146, 0.0016742906300351024, 0.0017212021630257368, 0.001768113812431693, 0.0018150253454223275, 0.001861936878412962, 0.0019088484114035964, 0.001955759944394231, 0.002002671593800187, 0.0020495832432061434, 0.0020964948926120996, 0.0021434063091874123, 0.0021903179585933685, 0.002237229607999325]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 11.0, 9.0, 13.0, 20.0, 12.0, 24.0, 22.0, 41.0, 34.0, 43.0, 36.0, 43.0, 39.0, 48.0, 46.0, 56.0, 39.0, 45.0, 43.0, 42.0, 27.0, 45.0, 35.0, 35.0, 26.0, 27.0, 17.0, 21.0, 14.0, 14.0, 10.0, 11.0, 7.0, 6.0, 10.0, 5.0, 0.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006845593452453613, -0.0006617233157157898, -0.0006388872861862183, -0.0006160512566566467, -0.0005932152271270752, -0.0005703791975975037, -0.0005475431680679321, -0.0005247071385383606, -0.0005018711090087891, -0.00047903507947921753, -0.000456199049949646, -0.00043336302042007446, -0.00041052699089050293, -0.0003876909613609314, -0.00036485493183135986, -0.00034201890230178833, -0.0003191828727722168, -0.00029634684324264526, -0.00027351081371307373, -0.0002506747841835022, -0.00022783875465393066, -0.00020500272512435913, -0.0001821666955947876, -0.00015933066606521606, -0.00013649463653564453, -0.000113658607006073, -9.082257747650146e-05, -6.798654794692993e-05, -4.51505184173584e-05, -2.2314488887786865e-05, 5.21540641784668e-07, 2.33575701713562e-05, 4.6193599700927734e-05, 6.902962923049927e-05, 9.18656587600708e-05, 0.00011470168828964233, 0.00013753771781921387, 0.0001603737473487854, 0.00018320977687835693, 0.00020604580640792847, 0.0002288818359375, 0.00025171786546707153, 0.00027455389499664307, 0.0002973899245262146, 0.00032022595405578613, 0.00034306198358535767, 0.0003658980131149292, 0.00038873404264450073, 0.00041157007217407227, 0.0004344061017036438, 0.00045724213123321533, 0.00048007816076278687, 0.0005029141902923584, 0.0005257502198219299, 0.0005485862493515015, 0.000571422278881073, 0.0005942583084106445, 0.0006170943379402161, 0.0006399303674697876, 0.0006627663969993591, 0.0006856024265289307, 0.0007084384560585022, 0.0007312744855880737, 0.0007541105151176453, 0.0007769465446472168]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 11.0, 10.0, 12.0, 15.0, 17.0, 23.0, 22.0, 31.0, 30.0, 33.0, 44.0, 42.0, 45.0, 44.0, 44.0, 56.0, 49.0, 59.0, 48.0, 44.0, 46.0, 41.0, 34.0, 40.0, 26.0, 15.0, 18.0, 12.0, 13.0, 15.0, 10.0, 9.0, 7.0, 9.0, 5.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.22357177734375, -5.0213623046875, -4.81915283203125, -4.616943359375, -4.41473388671875, -4.2125244140625, -4.01031494140625, -3.80810546875, -3.60589599609375, -3.4036865234375, -3.20147705078125, -2.999267578125, -2.79705810546875, -2.5948486328125, -2.39263916015625, -2.1904296875, -1.98822021484375, -1.7860107421875, -1.58380126953125, -1.381591796875, -1.17938232421875, -0.9771728515625, -0.77496337890625, -0.57275390625, -0.37054443359375, -0.1683349609375, 0.03387451171875, 0.236083984375, 0.43829345703125, 0.6405029296875, 0.84271240234375, 1.044921875, 1.24713134765625, 1.4493408203125, 1.65155029296875, 1.853759765625, 2.05596923828125, 2.2581787109375, 2.46038818359375, 2.66259765625, 2.86480712890625, 3.0670166015625, 3.26922607421875, 3.471435546875, 3.67364501953125, 3.8758544921875, 4.07806396484375, 4.2802734375, 4.48248291015625, 4.6846923828125, 4.88690185546875, 5.089111328125, 5.29132080078125, 5.4935302734375, 5.69573974609375, 5.89794921875, 6.10015869140625, 6.3023681640625, 6.50457763671875, 6.706787109375, 6.90899658203125, 7.1112060546875, 7.31341552734375, 7.515625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 18.0, 30.0, 36.0, 42.0, 91.0, 110.0, 167.0, 212.0, 286.0, 438.0, 645.0, 947.0, 1326.0, 2097.0, 3723.0, 9908.0, 94846.0, 781044.0, 130173.0, 11534.0, 4095.0, 2259.0, 1398.0, 908.0, 679.0, 459.0, 310.0, 222.0, 163.0, 119.0, 74.0, 59.0, 37.0, 29.0, 14.0, 14.0, 13.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.2225341796875, -17.679443359375, -17.1363525390625, -16.59326171875, -16.0501708984375, -15.507080078125, -14.9639892578125, -14.4208984375, -13.8778076171875, -13.334716796875, -12.7916259765625, -12.24853515625, -11.7054443359375, -11.162353515625, -10.6192626953125, -10.076171875, -9.5330810546875, -8.989990234375, -8.4468994140625, -7.90380859375, -7.3607177734375, -6.817626953125, -6.2745361328125, -5.7314453125, -5.1883544921875, -4.645263671875, -4.1021728515625, -3.55908203125, -3.0159912109375, -2.472900390625, -1.9298095703125, -1.38671875, -0.8436279296875, -0.300537109375, 0.2425537109375, 0.78564453125, 1.3287353515625, 1.871826171875, 2.4149169921875, 2.9580078125, 3.5010986328125, 4.044189453125, 4.5872802734375, 5.13037109375, 5.6734619140625, 6.216552734375, 6.7596435546875, 7.302734375, 7.8458251953125, 8.388916015625, 8.9320068359375, 9.47509765625, 10.0181884765625, 10.561279296875, 11.1043701171875, 11.6474609375, 12.1905517578125, 12.733642578125, 13.2767333984375, 13.81982421875, 14.3629150390625, 14.906005859375, 15.4490966796875, 15.9921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 10.0, 5.0, 10.0, 10.0, 10.0, 22.0, 15.0, 19.0, 21.0, 30.0, 30.0, 32.0, 41.0, 44.0, 61.0, 79.0, 203.0, 1546.0, 340.0, 123.0, 81.0, 58.0, 39.0, 28.0, 41.0, 31.0, 21.0, 18.0, 10.0, 12.0, 15.0, 7.0, 7.0, 2.0, 6.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.948486328125, -15.41259765625, -14.876708984375, -14.3408203125, -13.804931640625, -13.26904296875, -12.733154296875, -12.197265625, -11.661376953125, -11.12548828125, -10.589599609375, -10.0537109375, -9.517822265625, -8.98193359375, -8.446044921875, -7.91015625, -7.374267578125, -6.83837890625, -6.302490234375, -5.7666015625, -5.230712890625, -4.69482421875, -4.158935546875, -3.623046875, -3.087158203125, -2.55126953125, -2.015380859375, -1.4794921875, -0.943603515625, -0.40771484375, 0.128173828125, 0.6640625, 1.199951171875, 1.73583984375, 2.271728515625, 2.8076171875, 3.343505859375, 3.87939453125, 4.415283203125, 4.951171875, 5.487060546875, 6.02294921875, 6.558837890625, 7.0947265625, 7.630615234375, 8.16650390625, 8.702392578125, 9.23828125, 9.774169921875, 10.31005859375, 10.845947265625, 11.3818359375, 11.917724609375, 12.45361328125, 12.989501953125, 13.525390625, 14.061279296875, 14.59716796875, 15.133056640625, 15.6689453125, 16.204833984375, 16.74072265625, 17.276611328125, 17.8125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 13.0, 13.0, 12.0, 16.0, 19.0, 27.0, 48.0, 57.0, 85.0, 103.0, 126.0, 197.0, 274.0, 552.0, 1076.0, 3537.0, 3045729.0, 89396.0, 2221.0, 767.0, 443.0, 287.0, 193.0, 128.0, 86.0, 64.0, 61.0, 31.0, 28.0, 22.0, 24.0, 8.0, 11.0, 5.0, 5.0, 5.0, 4.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-54.71875, -53.0517578125, -51.384765625, -49.7177734375, -48.05078125, -46.3837890625, -44.716796875, -43.0498046875, -41.3828125, -39.7158203125, -38.048828125, -36.3818359375, -34.71484375, -33.0478515625, -31.380859375, -29.7138671875, -28.046875, -26.3798828125, -24.712890625, -23.0458984375, -21.37890625, -19.7119140625, -18.044921875, -16.3779296875, -14.7109375, -13.0439453125, -11.376953125, -9.7099609375, -8.04296875, -6.3759765625, -4.708984375, -3.0419921875, -1.375, 0.2919921875, 1.958984375, 3.6259765625, 5.29296875, 6.9599609375, 8.626953125, 10.2939453125, 11.9609375, 13.6279296875, 15.294921875, 16.9619140625, 18.62890625, 20.2958984375, 21.962890625, 23.6298828125, 25.296875, 26.9638671875, 28.630859375, 30.2978515625, 31.96484375, 33.6318359375, 35.298828125, 36.9658203125, 38.6328125, 40.2998046875, 41.966796875, 43.6337890625, 45.30078125, 46.9677734375, 48.634765625, 50.3017578125, 51.96875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 20.0, 38.0, 88.0, 125.0, 244.0, 227.0, 148.0, 58.0, 36.0, 12.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.71249389648438, -83.04866790771484, -81.38484191894531, -79.72101593017578, -78.05718994140625, -76.39336395263672, -74.72953796386719, -73.06571197509766, -71.40188598632812, -69.7380599975586, -68.07423400878906, -66.41040802001953, -64.74658203125, -63.08275604248047, -61.41893005371094, -59.755104064941406, -58.09128189086914, -56.42745590209961, -54.76362991333008, -53.09980392456055, -51.435977935791016, -49.772151947021484, -48.10832977294922, -46.44450378417969, -44.780677795410156, -43.116851806640625, -41.453025817871094, -39.78919982910156, -38.12537384033203, -36.4615478515625, -34.79772186279297, -33.13389587402344, -31.470069885253906, -29.806243896484375, -28.142417907714844, -26.478591918945312, -24.81476593017578, -23.15093994140625, -21.48711585998535, -19.82328987121582, -18.15946388244629, -16.495637893676758, -14.831811904907227, -13.167986869812012, -11.50416088104248, -9.84033489227295, -8.176509857177734, -6.512683868408203, -4.848857879638672, -3.1850321292877197, -1.5212063789367676, 0.14261913299560547, 1.8064451217651367, 3.470271110534668, 5.134096145629883, 6.797922134399414, 8.461748123168945, 10.125574111938477, 11.789400100708008, 13.453225135803223, 15.117051124572754, 16.78087615966797, 18.4447021484375, 20.10852813720703, 21.772354125976562]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 12.0, 9.0, 7.0, 12.0, 17.0, 11.0, 16.0, 18.0, 26.0, 23.0, 36.0, 35.0, 37.0, 36.0, 45.0, 48.0, 30.0, 45.0, 46.0, 46.0, 50.0, 41.0, 43.0, 27.0, 36.0, 27.0, 30.0, 22.0, 25.0, 20.0, 11.0, 20.0, 18.0, 14.0, 11.0, 12.0, 5.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-43.41010665893555, -42.07524871826172, -40.740386962890625, -39.40552520751953, -38.0706672668457, -36.735809326171875, -35.40094757080078, -34.06608581542969, -32.73122787475586, -31.3963680267334, -30.061508178710938, -28.726648330688477, -27.391788482666016, -26.056928634643555, -24.722068786621094, -23.387208938598633, -22.052349090576172, -20.71748924255371, -19.38262939453125, -18.04776954650879, -16.712909698486328, -15.378049850463867, -14.043190002441406, -12.708330154418945, -11.373470306396484, -10.038610458374023, -8.703750610351562, -7.368890762329102, -6.034030914306641, -4.69917106628418, -3.3643112182617188, -2.029451370239258, -0.6945877075195312, 0.6402721405029297, 1.9751319885253906, 3.3099918365478516, 4.6448516845703125, 5.979711532592773, 7.314571380615234, 8.649431228637695, 9.984291076660156, 11.319150924682617, 12.654010772705078, 13.988870620727539, 15.32373046875, 16.65859031677246, 17.993450164794922, 19.328310012817383, 20.663169860839844, 21.998029708862305, 23.332889556884766, 24.667749404907227, 26.002609252929688, 27.33746910095215, 28.67232894897461, 30.00718879699707, 31.34204864501953, 32.676910400390625, 34.01176834106445, 35.34662628173828, 36.681488037109375, 38.01634979248047, 39.3512077331543, 40.686065673828125, 42.02092742919922]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 4.0, 6.0, 7.0, 8.0, 7.0, 6.0, 8.0, 17.0, 10.0, 16.0, 5.0, 32.0, 18.0, 26.0, 28.0, 30.0, 36.0, 35.0, 41.0, 56.0, 36.0, 31.0, 43.0, 41.0, 49.0, 39.0, 29.0, 36.0, 41.0, 31.0, 32.0, 27.0, 27.0, 26.0, 14.0, 17.0, 9.0, 9.0, 20.0, 14.0, 5.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.5546875, -5.37420654296875, -5.1937255859375, -5.01324462890625, -4.832763671875, -4.65228271484375, -4.4718017578125, -4.29132080078125, -4.11083984375, -3.93035888671875, -3.7498779296875, -3.56939697265625, -3.388916015625, -3.20843505859375, -3.0279541015625, -2.84747314453125, -2.6669921875, -2.48651123046875, -2.3060302734375, -2.12554931640625, -1.945068359375, -1.76458740234375, -1.5841064453125, -1.40362548828125, -1.22314453125, -1.04266357421875, -0.8621826171875, -0.68170166015625, -0.501220703125, -0.32073974609375, -0.1402587890625, 0.04022216796875, 0.220703125, 0.40118408203125, 0.5816650390625, 0.76214599609375, 0.942626953125, 1.12310791015625, 1.3035888671875, 1.48406982421875, 1.66455078125, 1.84503173828125, 2.0255126953125, 2.20599365234375, 2.386474609375, 2.56695556640625, 2.7474365234375, 2.92791748046875, 3.1083984375, 3.28887939453125, 3.4693603515625, 3.64984130859375, 3.830322265625, 4.01080322265625, 4.1912841796875, 4.37176513671875, 4.55224609375, 4.73272705078125, 4.9132080078125, 5.09368896484375, 5.274169921875, 5.45465087890625, 5.6351318359375, 5.81561279296875, 5.99609375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 15.0, 11.0, 22.0, 20.0, 17.0, 25.0, 33.0, 40.0, 61.0, 83.0, 173.0, 239.0, 444.0, 957.0, 2286.0, 6496.0, 29746.0, 301516.0, 2311742.0, 1391874.0, 125159.0, 15855.0, 4208.0, 1595.0, 716.0, 343.0, 178.0, 113.0, 65.0, 48.0, 36.0, 24.0, 27.0, 21.0, 14.0, 13.0, 8.0, 8.0, 10.0, 9.0, 3.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-12.3984375, -12.0089111328125, -11.619384765625, -11.2298583984375, -10.84033203125, -10.4508056640625, -10.061279296875, -9.6717529296875, -9.2822265625, -8.8927001953125, -8.503173828125, -8.1136474609375, -7.72412109375, -7.3345947265625, -6.945068359375, -6.5555419921875, -6.166015625, -5.7764892578125, -5.386962890625, -4.9974365234375, -4.60791015625, -4.2183837890625, -3.828857421875, -3.4393310546875, -3.0498046875, -2.6602783203125, -2.270751953125, -1.8812255859375, -1.49169921875, -1.1021728515625, -0.712646484375, -0.3231201171875, 0.06640625, 0.4559326171875, 0.845458984375, 1.2349853515625, 1.62451171875, 2.0140380859375, 2.403564453125, 2.7930908203125, 3.1826171875, 3.5721435546875, 3.961669921875, 4.3511962890625, 4.74072265625, 5.1302490234375, 5.519775390625, 5.9093017578125, 6.298828125, 6.6883544921875, 7.077880859375, 7.4674072265625, 7.85693359375, 8.2464599609375, 8.635986328125, 9.0255126953125, 9.4150390625, 9.8045654296875, 10.194091796875, 10.5836181640625, 10.97314453125, 11.3626708984375, 11.752197265625, 12.1417236328125, 12.53125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 10.0, 17.0, 43.0, 90.0, 187.0, 427.0, 750.0, 1106.0, 686.0, 385.0, 211.0, 91.0, 43.0, 16.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.5625, -21.797607421875, -21.03271484375, -20.267822265625, -19.5029296875, -18.738037109375, -17.97314453125, -17.208251953125, -16.443359375, -15.678466796875, -14.91357421875, -14.148681640625, -13.3837890625, -12.618896484375, -11.85400390625, -11.089111328125, -10.32421875, -9.559326171875, -8.79443359375, -8.029541015625, -7.2646484375, -6.499755859375, -5.73486328125, -4.969970703125, -4.205078125, -3.440185546875, -2.67529296875, -1.910400390625, -1.1455078125, -0.380615234375, 0.38427734375, 1.149169921875, 1.9140625, 2.678955078125, 3.44384765625, 4.208740234375, 4.9736328125, 5.738525390625, 6.50341796875, 7.268310546875, 8.033203125, 8.798095703125, 9.56298828125, 10.327880859375, 11.0927734375, 11.857666015625, 12.62255859375, 13.387451171875, 14.15234375, 14.917236328125, 15.68212890625, 16.447021484375, 17.2119140625, 17.976806640625, 18.74169921875, 19.506591796875, 20.271484375, 21.036376953125, 21.80126953125, 22.566162109375, 23.3310546875, 24.095947265625, 24.86083984375, 25.625732421875, 26.390625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 12.0, 9.0, 19.0, 31.0, 65.0, 135.0, 377.0, 1011.0, 3629.0, 497735.0, 3683045.0, 6097.0, 1308.0, 474.0, 174.0, 76.0, 39.0, 13.0, 10.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.90625, -52.37158203125, -50.8369140625, -49.30224609375, -47.767578125, -46.23291015625, -44.6982421875, -43.16357421875, -41.62890625, -40.09423828125, -38.5595703125, -37.02490234375, -35.490234375, -33.95556640625, -32.4208984375, -30.88623046875, -29.3515625, -27.81689453125, -26.2822265625, -24.74755859375, -23.212890625, -21.67822265625, -20.1435546875, -18.60888671875, -17.07421875, -15.53955078125, -14.0048828125, -12.47021484375, -10.935546875, -9.40087890625, -7.8662109375, -6.33154296875, -4.796875, -3.26220703125, -1.7275390625, -0.19287109375, 1.341796875, 2.87646484375, 4.4111328125, 5.94580078125, 7.48046875, 9.01513671875, 10.5498046875, 12.08447265625, 13.619140625, 15.15380859375, 16.6884765625, 18.22314453125, 19.7578125, 21.29248046875, 22.8271484375, 24.36181640625, 25.896484375, 27.43115234375, 28.9658203125, 30.50048828125, 32.03515625, 33.56982421875, 35.1044921875, 36.63916015625, 38.173828125, 39.70849609375, 41.2431640625, 42.77783203125, 44.3125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 132.0, 449.0, 348.0, 62.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.23599243164062, -200.54342651367188, -195.85084533691406, -191.1582794189453, -186.4656982421875, -181.77313232421875, -177.08056640625, -172.3879852294922, -167.69541931152344, -163.0028533935547, -158.31027221679688, -153.61770629882812, -148.9251251220703, -144.23255920410156, -139.53997802734375, -134.847412109375, -130.15484619140625, -125.46227264404297, -120.76969909667969, -116.07713317871094, -111.38455963134766, -106.69198608398438, -101.9994125366211, -97.30683898925781, -92.6142578125, -87.92168426513672, -83.22911071777344, -78.53654479980469, -73.8439712524414, -69.15139770507812, -64.45882415771484, -59.76625442504883, -55.07367706298828, -50.381103515625, -45.688533782958984, -40.9959602355957, -36.30339050292969, -31.610816955566406, -26.918243408203125, -22.22567367553711, -17.533100128173828, -12.84052848815918, -8.147955894470215, -3.45538330078125, 1.2371883392333984, 5.929759979248047, 10.622333526611328, 15.314903259277344, 20.007476806640625, 24.700048446655273, 29.392620086669922, 34.0851936340332, 38.77776336669922, 43.4703369140625, 48.16291046142578, 52.8554801940918, 57.54805374145508, 62.24062728881836, 66.93319702148438, 71.62577056884766, 76.31834411621094, 81.01091003417969, 85.7034912109375, 90.39605712890625, 95.08863067626953]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 5.0, 12.0, 8.0, 14.0, 11.0, 13.0, 16.0, 17.0, 24.0, 25.0, 28.0, 26.0, 23.0, 39.0, 22.0, 24.0, 39.0, 29.0, 45.0, 26.0, 42.0, 47.0, 38.0, 29.0, 39.0, 42.0, 32.0, 35.0, 29.0, 31.0, 31.0, 19.0, 20.0, 12.0, 18.0, 17.0, 6.0, 11.0, 11.0, 5.0, 3.0, 4.0, 5.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0], "bins": [-40.54632568359375, -39.32184600830078, -38.09736633300781, -36.872886657714844, -35.648406982421875, -34.423927307128906, -33.19944763183594, -31.974964141845703, -30.750484466552734, -29.526004791259766, -28.301525115966797, -27.077045440673828, -25.852563858032227, -24.628084182739258, -23.40360450744629, -22.179122924804688, -20.95464515686035, -19.730165481567383, -18.505685806274414, -17.281204223632812, -16.056724548339844, -14.832244873046875, -13.607765197753906, -12.383284568786621, -11.158804893493652, -9.934325218200684, -8.709844589233398, -7.48536491394043, -6.260884761810303, -5.036404609680176, -3.811924934387207, -2.587444305419922, -1.3629646301269531, -0.13848459720611572, 1.0859954357147217, 2.3104753494262695, 3.5349555015563965, 4.759435653686523, 5.983915328979492, 7.208395957946777, 8.432875633239746, 9.657355308532715, 10.8818359375, 12.106315612792969, 13.330795288085938, 14.555275917053223, 15.779755592346191, 17.004236221313477, 18.228715896606445, 19.453195571899414, 20.677675247192383, 21.902156829833984, 23.126636505126953, 24.351116180419922, 25.57559585571289, 26.80007553100586, 28.024555206298828, 29.249034881591797, 30.473514556884766, 31.697994232177734, 32.9224739074707, 34.14695739746094, 35.371437072753906, 36.595916748046875, 37.820396423339844]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 4.0, 10.0, 14.0, 11.0, 23.0, 21.0, 28.0, 28.0, 33.0, 35.0, 26.0, 43.0, 47.0, 54.0, 47.0, 61.0, 40.0, 64.0, 53.0, 42.0, 33.0, 30.0, 48.0, 28.0, 23.0, 25.0, 24.0, 20.0, 20.0, 13.0, 15.0, 8.0, 3.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8828125, -5.7059326171875, -5.529052734375, -5.3521728515625, -5.17529296875, -4.9984130859375, -4.821533203125, -4.6446533203125, -4.4677734375, -4.2908935546875, -4.114013671875, -3.9371337890625, -3.76025390625, -3.5833740234375, -3.406494140625, -3.2296142578125, -3.052734375, -2.8758544921875, -2.698974609375, -2.5220947265625, -2.34521484375, -2.1683349609375, -1.991455078125, -1.8145751953125, -1.6376953125, -1.4608154296875, -1.283935546875, -1.1070556640625, -0.93017578125, -0.7532958984375, -0.576416015625, -0.3995361328125, -0.22265625, -0.0457763671875, 0.131103515625, 0.3079833984375, 0.48486328125, 0.6617431640625, 0.838623046875, 1.0155029296875, 1.1923828125, 1.3692626953125, 1.546142578125, 1.7230224609375, 1.89990234375, 2.0767822265625, 2.253662109375, 2.4305419921875, 2.607421875, 2.7843017578125, 2.961181640625, 3.1380615234375, 3.31494140625, 3.4918212890625, 3.668701171875, 3.8455810546875, 4.0224609375, 4.1993408203125, 4.376220703125, 4.5531005859375, 4.72998046875, 4.9068603515625, 5.083740234375, 5.2606201171875, 5.4375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 18.0, 25.0, 36.0, 41.0, 70.0, 131.0, 152.0, 306.0, 474.0, 737.0, 1189.0, 2026.0, 3363.0, 5930.0, 9814.0, 17221.0, 29763.0, 52600.0, 100635.0, 295068.0, 302427.0, 101671.0, 52959.0, 29995.0, 17270.0, 10093.0, 5857.0, 3400.0, 2078.0, 1204.0, 724.0, 467.0, 285.0, 179.0, 110.0, 65.0, 55.0, 36.0, 20.0, 13.0, 12.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.37109375, -1.326873779296875, -1.28265380859375, -1.238433837890625, -1.1942138671875, -1.149993896484375, -1.10577392578125, -1.061553955078125, -1.017333984375, -0.973114013671875, -0.92889404296875, -0.884674072265625, -0.8404541015625, -0.796234130859375, -0.75201416015625, -0.707794189453125, -0.66357421875, -0.619354248046875, -0.57513427734375, -0.530914306640625, -0.4866943359375, -0.442474365234375, -0.39825439453125, -0.354034423828125, -0.309814453125, -0.265594482421875, -0.22137451171875, -0.177154541015625, -0.1329345703125, -0.088714599609375, -0.04449462890625, -0.000274658203125, 0.0439453125, 0.088165283203125, 0.13238525390625, 0.176605224609375, 0.2208251953125, 0.265045166015625, 0.30926513671875, 0.353485107421875, 0.397705078125, 0.441925048828125, 0.48614501953125, 0.530364990234375, 0.5745849609375, 0.618804931640625, 0.66302490234375, 0.707244873046875, 0.75146484375, 0.795684814453125, 0.83990478515625, 0.884124755859375, 0.9283447265625, 0.972564697265625, 1.01678466796875, 1.061004638671875, 1.105224609375, 1.149444580078125, 1.19366455078125, 1.237884521484375, 1.2821044921875, 1.326324462890625, 1.37054443359375, 1.414764404296875, 1.458984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 19.0, 19.0, 24.0, 21.0, 24.0, 24.0, 23.0, 25.0, 26.0, 39.0, 38.0, 38.0, 35.0, 42.0, 30.0, 31.0, 1057.0, 38.0, 29.0, 32.0, 51.0, 34.0, 35.0, 34.0, 26.0, 27.0, 24.0, 19.0, 29.0, 27.0, 16.0, 13.0, 11.0, 9.0, 10.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.724609375, -2.634552001953125, -2.54449462890625, -2.454437255859375, -2.3643798828125, -2.274322509765625, -2.18426513671875, -2.094207763671875, -2.004150390625, -1.914093017578125, -1.82403564453125, -1.733978271484375, -1.6439208984375, -1.553863525390625, -1.46380615234375, -1.373748779296875, -1.28369140625, -1.193634033203125, -1.10357666015625, -1.013519287109375, -0.9234619140625, -0.833404541015625, -0.74334716796875, -0.653289794921875, -0.563232421875, -0.473175048828125, -0.38311767578125, -0.293060302734375, -0.2030029296875, -0.112945556640625, -0.02288818359375, 0.067169189453125, 0.1572265625, 0.247283935546875, 0.33734130859375, 0.427398681640625, 0.5174560546875, 0.607513427734375, 0.69757080078125, 0.787628173828125, 0.877685546875, 0.967742919921875, 1.05780029296875, 1.147857666015625, 1.2379150390625, 1.327972412109375, 1.41802978515625, 1.508087158203125, 1.59814453125, 1.688201904296875, 1.77825927734375, 1.868316650390625, 1.9583740234375, 2.048431396484375, 2.13848876953125, 2.228546142578125, 2.318603515625, 2.408660888671875, 2.49871826171875, 2.588775634765625, 2.6788330078125, 2.768890380859375, 2.85894775390625, 2.949005126953125, 3.0390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 17.0, 13.0, 19.0, 31.0, 52.0, 70.0, 93.0, 150.0, 239.0, 345.0, 558.0, 778.0, 1212.0, 1990.0, 3228.0, 5474.0, 8968.0, 15079.0, 25405.0, 43650.0, 78100.0, 149334.0, 1393670.0, 167007.0, 85568.0, 47351.0, 27490.0, 16121.0, 9693.0, 5818.0, 3574.0, 2199.0, 1337.0, 892.0, 573.0, 344.0, 241.0, 135.0, 103.0, 70.0, 33.0, 36.0, 24.0, 13.0, 15.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.2294921875, -1.19287109375, -1.15625, -1.11962890625, -1.0830078125, -1.04638671875, -1.009765625, -0.97314453125, -0.9365234375, -0.89990234375, -0.86328125, -0.82666015625, -0.7900390625, -0.75341796875, -0.716796875, -0.68017578125, -0.6435546875, -0.60693359375, -0.5703125, -0.53369140625, -0.4970703125, -0.46044921875, -0.423828125, -0.38720703125, -0.3505859375, -0.31396484375, -0.27734375, -0.24072265625, -0.2041015625, -0.16748046875, -0.130859375, -0.09423828125, -0.0576171875, -0.02099609375, 0.015625, 0.05224609375, 0.0888671875, 0.12548828125, 0.162109375, 0.19873046875, 0.2353515625, 0.27197265625, 0.30859375, 0.34521484375, 0.3818359375, 0.41845703125, 0.455078125, 0.49169921875, 0.5283203125, 0.56494140625, 0.6015625, 0.63818359375, 0.6748046875, 0.71142578125, 0.748046875, 0.78466796875, 0.8212890625, 0.85791015625, 0.89453125, 0.93115234375, 0.9677734375, 1.00439453125, 1.041015625, 1.07763671875, 1.1142578125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 12.0, 9.0, 10.0, 16.0, 19.0, 23.0, 31.0, 37.0, 66.0, 87.0, 147.0, 146.0, 112.0, 78.0, 46.0, 31.0, 27.0, 26.0, 12.0, 9.0, 13.0, 4.0, 3.0, 5.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006079673767089844, -0.0005829855799674988, -0.0005580037832260132, -0.0005330219864845276, -0.000508040189743042, -0.0004830583930015564, -0.0004580765962600708, -0.0004330947995185852, -0.0004081130027770996, -0.000383131206035614, -0.0003581494092941284, -0.0003331676125526428, -0.0003081858158111572, -0.00028320401906967163, -0.00025822222232818604, -0.00023324042558670044, -0.00020825862884521484, -0.00018327683210372925, -0.00015829503536224365, -0.00013331323862075806, -0.00010833144187927246, -8.334964513778687e-05, -5.836784839630127e-05, -3.3386051654815674e-05, -8.404254913330078e-06, 1.6577541828155518e-05, 4.155933856964111e-05, 6.654113531112671e-05, 9.15229320526123e-05, 0.0001165047287940979, 0.0001414865255355835, 0.0001664683222770691, 0.0001914501190185547, 0.00021643191576004028, 0.00024141371250152588, 0.0002663955092430115, 0.00029137730598449707, 0.00031635910272598267, 0.00034134089946746826, 0.00036632269620895386, 0.00039130449295043945, 0.00041628628969192505, 0.00044126808643341064, 0.00046624988317489624, 0.0004912316799163818, 0.0005162134766578674, 0.000541195273399353, 0.0005661770701408386, 0.0005911588668823242, 0.0006161406636238098, 0.0006411224603652954, 0.000666104257106781, 0.0006910860538482666, 0.0007160678505897522, 0.0007410496473312378, 0.0007660314440727234, 0.000791013240814209, 0.0008159950375556946, 0.0008409768342971802, 0.0008659586310386658, 0.0008909404277801514, 0.000915922224521637, 0.0009409040212631226, 0.0009658858180046082, 0.0009908676147460938]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 7.0, 12.0, 16.0, 29.0, 26.0, 31.0, 50.0, 87.0, 104.0, 191.0, 295.0, 679.0, 2711.0, 1034795.0, 7598.0, 824.0, 376.0, 225.0, 150.0, 95.0, 45.0, 51.0, 36.0, 16.0, 18.0, 11.0, 8.0, 9.0, 11.0, 5.0, 8.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.018463134765625, -0.017984867095947266, -0.01750659942626953, -0.017028331756591797, -0.016550064086914062, -0.016071796417236328, -0.015593528747558594, -0.01511526107788086, -0.014636993408203125, -0.01415872573852539, -0.013680458068847656, -0.013202190399169922, -0.012723922729492188, -0.012245655059814453, -0.011767387390136719, -0.011289119720458984, -0.01081085205078125, -0.010332584381103516, -0.009854316711425781, -0.009376049041748047, -0.008897781372070312, -0.008419513702392578, -0.007941246032714844, -0.007462978363037109, -0.006984710693359375, -0.006506443023681641, -0.006028175354003906, -0.005549907684326172, -0.0050716400146484375, -0.004593372344970703, -0.004115104675292969, -0.0036368370056152344, -0.0031585693359375, -0.0026803016662597656, -0.0022020339965820312, -0.0017237663269042969, -0.0012454986572265625, -0.0007672309875488281, -0.00028896331787109375, 0.00018930435180664062, 0.000667572021484375, 0.0011458396911621094, 0.0016241073608398438, 0.002102375030517578, 0.0025806427001953125, 0.003058910369873047, 0.0035371780395507812, 0.004015445709228516, 0.00449371337890625, 0.004971981048583984, 0.005450248718261719, 0.005928516387939453, 0.0064067840576171875, 0.006885051727294922, 0.007363319396972656, 0.00784158706665039, 0.008319854736328125, 0.00879812240600586, 0.009276390075683594, 0.009754657745361328, 0.010232925415039062, 0.010711193084716797, 0.011189460754394531, 0.011667728424072266, 0.01214599609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 30.0, 129.0, 296.0, 368.0, 140.0, 37.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006605072994716465, -0.0006318026571534574, -0.0006030980148352683, -0.0005743933725170791, -0.0005456887884065509, -0.0005169841460883617, -0.0004882795037701726, -0.00045957486145198345, -0.0004308702191337943, -0.00040216557681560516, -0.000373460934497416, -0.00034475632128305733, -0.0003160516789648682, -0.00028734703664667904, -0.00025864242343232036, -0.0002299377811141312, -0.00020123313879594207, -0.00017252849647775292, -0.000143823868711479, -0.00011511923366924748, -8.641459862701595e-05, -5.7709956308826804e-05, -2.900532854255289e-05, -3.007007762789726e-07, 2.840394154191017e-05, 5.71085765841417e-05, 8.581321162637323e-05, 0.00011451784666860476, 0.0001432224817108363, 0.00017192712402902544, 0.00020063175179529935, 0.00022933637956157327, 0.0002580409636721015, 0.00028674560599029064, 0.0003154502483084798, 0.0003441548615228385, 0.0003728595038410276, 0.00040156414615921676, 0.00043026875937357545, 0.0004589734016917646, 0.00048767804400995374, 0.0005163826863281429, 0.000545087328646332, 0.0005737919709645212, 0.0006024965550750494, 0.0006312011973932385, 0.0006599058397114277, 0.0006886104820296168, 0.000717315124347806, 0.0007460197666659951, 0.0007747244089841843, 0.0008034290513023734, 0.0008321336936205626, 0.0008608383359387517, 0.0008895429200492799, 0.0009182475623674691, 0.0009469522046856582, 0.0009756568470038474, 0.0010043614311143756, 0.0010330660734325647, 0.0010617707157507539, 0.001090475358068943, 0.0011191800003871322, 0.0011478846427053213, 0.0011765892850235105]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 11.0, 14.0, 6.0, 11.0, 15.0, 20.0, 12.0, 9.0, 12.0, 24.0, 29.0, 36.0, 36.0, 27.0, 28.0, 27.0, 33.0, 45.0, 44.0, 36.0, 38.0, 41.0, 35.0, 28.0, 32.0, 31.0, 29.0, 33.0, 36.0, 19.0, 18.0, 27.0, 26.0, 17.0, 26.0, 10.0, 10.0, 13.0, 16.0, 4.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.00029647350311279297, -0.0002877218648791313, -0.00027897022664546967, -0.000270218588411808, -0.00026146695017814636, -0.0002527153119444847, -0.00024396367371082306, -0.0002352120354771614, -0.00022646039724349976, -0.0002177087590098381, -0.00020895712077617645, -0.0002002054825425148, -0.00019145384430885315, -0.0001827022060751915, -0.00017395056784152985, -0.0001651989296078682, -0.00015644729137420654, -0.0001476956531405449, -0.00013894401490688324, -0.0001301923766732216, -0.00012144073843955994, -0.00011268910020589828, -0.00010393746197223663, -9.518582373857498e-05, -8.643418550491333e-05, -7.768254727125168e-05, -6.893090903759003e-05, -6.0179270803928375e-05, -5.1427632570266724e-05, -4.267599433660507e-05, -3.392435610294342e-05, -2.517271786928177e-05, -1.6421079635620117e-05, -7.669441401958466e-06, 1.082196831703186e-06, 9.833835065364838e-06, 1.858547329902649e-05, 2.733711153268814e-05, 3.608874976634979e-05, 4.4840388000011444e-05, 5.3592026233673096e-05, 6.234366446733475e-05, 7.10953027009964e-05, 7.984694093465805e-05, 8.85985791683197e-05, 9.735021740198135e-05, 0.000106101855635643, 0.00011485349386930466, 0.0001236051321029663, 0.00013235677033662796, 0.0001411084085702896, 0.00014986004680395126, 0.00015861168503761292, 0.00016736332327127457, 0.00017611496150493622, 0.00018486659973859787, 0.00019361823797225952, 0.00020236987620592117, 0.00021112151443958282, 0.00021987315267324448, 0.00022862479090690613, 0.00023737642914056778, 0.00024612806737422943, 0.0002548797056078911, 0.00026363134384155273]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 4.0, 10.0, 14.0, 11.0, 23.0, 21.0, 28.0, 28.0, 33.0, 35.0, 26.0, 43.0, 47.0, 54.0, 47.0, 61.0, 40.0, 64.0, 53.0, 42.0, 33.0, 30.0, 48.0, 27.0, 24.0, 25.0, 24.0, 20.0, 20.0, 13.0, 15.0, 8.0, 3.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8828125, -5.7059326171875, -5.529052734375, -5.3521728515625, -5.17529296875, -4.9984130859375, -4.821533203125, -4.6446533203125, -4.4677734375, -4.2908935546875, -4.114013671875, -3.9371337890625, -3.76025390625, -3.5833740234375, -3.406494140625, -3.2296142578125, -3.052734375, -2.8758544921875, -2.698974609375, -2.5220947265625, -2.34521484375, -2.1683349609375, -1.991455078125, -1.8145751953125, -1.6376953125, -1.4608154296875, -1.283935546875, -1.1070556640625, -0.93017578125, -0.7532958984375, -0.576416015625, -0.3995361328125, -0.22265625, -0.0457763671875, 0.131103515625, 0.3079833984375, 0.48486328125, 0.6617431640625, 0.838623046875, 1.0155029296875, 1.1923828125, 1.3692626953125, 1.546142578125, 1.7230224609375, 1.89990234375, 2.0767822265625, 2.253662109375, 2.4305419921875, 2.607421875, 2.7843017578125, 2.961181640625, 3.1380615234375, 3.31494140625, 3.4918212890625, 3.668701171875, 3.8455810546875, 4.0224609375, 4.1993408203125, 4.376220703125, 4.5531005859375, 4.72998046875, 4.9068603515625, 5.083740234375, 5.2606201171875, 5.4375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 14.0, 16.0, 22.0, 41.0, 49.0, 64.0, 87.0, 119.0, 161.0, 219.0, 312.0, 429.0, 642.0, 1074.0, 2028.0, 4172.0, 10842.0, 41189.0, 276733.0, 586309.0, 92021.0, 19034.0, 6249.0, 2652.0, 1397.0, 832.0, 549.0, 360.0, 252.0, 169.0, 136.0, 95.0, 81.0, 52.0, 38.0, 33.0, 17.0, 18.0, 13.0, 8.0, 10.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.4530029296875, -8.163818359375, -7.8746337890625, -7.58544921875, -7.2962646484375, -7.007080078125, -6.7178955078125, -6.4287109375, -6.1395263671875, -5.850341796875, -5.5611572265625, -5.27197265625, -4.9827880859375, -4.693603515625, -4.4044189453125, -4.115234375, -3.8260498046875, -3.536865234375, -3.2476806640625, -2.95849609375, -2.6693115234375, -2.380126953125, -2.0909423828125, -1.8017578125, -1.5125732421875, -1.223388671875, -0.9342041015625, -0.64501953125, -0.3558349609375, -0.066650390625, 0.2225341796875, 0.51171875, 0.8009033203125, 1.090087890625, 1.3792724609375, 1.66845703125, 1.9576416015625, 2.246826171875, 2.5360107421875, 2.8251953125, 3.1143798828125, 3.403564453125, 3.6927490234375, 3.98193359375, 4.2711181640625, 4.560302734375, 4.8494873046875, 5.138671875, 5.4278564453125, 5.717041015625, 6.0062255859375, 6.29541015625, 6.5845947265625, 6.873779296875, 7.1629638671875, 7.4521484375, 7.7413330078125, 8.030517578125, 8.3197021484375, 8.60888671875, 8.8980712890625, 9.187255859375, 9.4764404296875, 9.765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 7.0, 20.0, 17.0, 16.0, 25.0, 36.0, 47.0, 51.0, 49.0, 69.0, 112.0, 404.0, 1651.0, 124.0, 83.0, 77.0, 53.0, 30.0, 34.0, 28.0, 28.0, 10.0, 4.0, 12.0, 11.0, 8.0, 7.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.953125, -19.351806640625, -18.75048828125, -18.149169921875, -17.5478515625, -16.946533203125, -16.34521484375, -15.743896484375, -15.142578125, -14.541259765625, -13.93994140625, -13.338623046875, -12.7373046875, -12.135986328125, -11.53466796875, -10.933349609375, -10.33203125, -9.730712890625, -9.12939453125, -8.528076171875, -7.9267578125, -7.325439453125, -6.72412109375, -6.122802734375, -5.521484375, -4.920166015625, -4.31884765625, -3.717529296875, -3.1162109375, -2.514892578125, -1.91357421875, -1.312255859375, -0.7109375, -0.109619140625, 0.49169921875, 1.093017578125, 1.6943359375, 2.295654296875, 2.89697265625, 3.498291015625, 4.099609375, 4.700927734375, 5.30224609375, 5.903564453125, 6.5048828125, 7.106201171875, 7.70751953125, 8.308837890625, 8.91015625, 9.511474609375, 10.11279296875, 10.714111328125, 11.3154296875, 11.916748046875, 12.51806640625, 13.119384765625, 13.720703125, 14.322021484375, 14.92333984375, 15.524658203125, 16.1259765625, 16.727294921875, 17.32861328125, 17.929931640625, 18.53125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 8.0, 4.0, 14.0, 6.0, 16.0, 25.0, 33.0, 55.0, 95.0, 113.0, 174.0, 339.0, 766.0, 5458.0, 3131864.0, 4998.0, 819.0, 336.0, 225.0, 115.0, 78.0, 51.0, 36.0, 28.0, 13.0, 15.0, 8.0, 5.0, 5.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.09814453125, -45.6025390625, -44.10693359375, -42.611328125, -41.11572265625, -39.6201171875, -38.12451171875, -36.62890625, -35.13330078125, -33.6376953125, -32.14208984375, -30.646484375, -29.15087890625, -27.6552734375, -26.15966796875, -24.6640625, -23.16845703125, -21.6728515625, -20.17724609375, -18.681640625, -17.18603515625, -15.6904296875, -14.19482421875, -12.69921875, -11.20361328125, -9.7080078125, -8.21240234375, -6.716796875, -5.22119140625, -3.7255859375, -2.22998046875, -0.734375, 0.76123046875, 2.2568359375, 3.75244140625, 5.248046875, 6.74365234375, 8.2392578125, 9.73486328125, 11.23046875, 12.72607421875, 14.2216796875, 15.71728515625, 17.212890625, 18.70849609375, 20.2041015625, 21.69970703125, 23.1953125, 24.69091796875, 26.1865234375, 27.68212890625, 29.177734375, 30.67333984375, 32.1689453125, 33.66455078125, 35.16015625, 36.65576171875, 38.1513671875, 39.64697265625, 41.142578125, 42.63818359375, 44.1337890625, 45.62939453125, 47.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 245.0, 734.0, 33.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.6597900390625, -97.63075256347656, -93.60172271728516, -89.57269287109375, -85.54365539550781, -81.51461791992188, -77.48558807373047, -73.45655822753906, -69.42752075195312, -65.39848327636719, -61.36945343017578, -57.34041976928711, -53.31138610839844, -49.282352447509766, -45.253318786621094, -41.22428512573242, -37.19525146484375, -33.16621780395508, -29.137184143066406, -25.108150482177734, -21.079116821289062, -17.05008316040039, -13.021049499511719, -8.992015838623047, -4.962982177734375, -0.9339485168457031, 3.0950851440429688, 7.124118804931641, 11.153152465820312, 15.182186126708984, 19.211219787597656, 23.240253448486328, 27.269302368164062, 31.298336029052734, 35.327369689941406, 39.35640335083008, 43.38543701171875, 47.41447067260742, 51.443504333496094, 55.472537994384766, 59.50157165527344, 63.53060531616211, 67.55963897705078, 71.58866882324219, 75.61770629882812, 79.64674377441406, 83.67577362060547, 87.70480346679688, 91.73384094238281, 95.76287841796875, 99.79190826416016, 103.82093811035156, 107.8499755859375, 111.87901306152344, 115.90804290771484, 119.93707275390625, 123.96611022949219, 127.99514770507812, 132.024169921875, 136.05320739746094, 140.08224487304688, 144.1112823486328, 148.14031982421875, 152.16934204101562, 156.19837951660156]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 3.0, 10.0, 16.0, 8.0, 15.0, 19.0, 19.0, 19.0, 18.0, 14.0, 26.0, 31.0, 36.0, 31.0, 27.0, 45.0, 37.0, 44.0, 56.0, 42.0, 54.0, 38.0, 35.0, 40.0, 40.0, 37.0, 20.0, 36.0, 22.0, 28.0, 19.0, 23.0, 19.0, 16.0, 16.0, 10.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-35.77206039428711, -34.684051513671875, -33.59604263305664, -32.508033752441406, -31.420026779174805, -30.33201789855957, -29.24401092529297, -28.156002044677734, -27.0679931640625, -25.979984283447266, -24.89197540283203, -23.80396842956543, -22.715959548950195, -21.62795066833496, -20.53994369506836, -19.451934814453125, -18.36392593383789, -17.275917053222656, -16.187908172607422, -15.09990119934082, -14.011892318725586, -12.923883438110352, -11.835875511169434, -10.747867584228516, -9.659858703613281, -8.571849822998047, -7.483841896057129, -6.395833492279053, -5.307825088500977, -4.2198166847229, -3.131808280944824, -2.043799877166748, -0.9557952880859375, 0.13221311569213867, 1.2202215194702148, 2.308229923248291, 3.396238327026367, 4.484246730804443, 5.5722551345825195, 6.660263538360596, 7.748271942138672, 8.836280822753906, 9.924288749694824, 11.012296676635742, 12.100305557250977, 13.188314437866211, 14.276322364807129, 15.364330291748047, 16.45233917236328, 17.540348052978516, 18.62835693359375, 19.71636390686035, 20.804372787475586, 21.89238166809082, 22.980388641357422, 24.068397521972656, 25.15640640258789, 26.244415283203125, 27.33242416381836, 28.42043113708496, 29.508440017700195, 30.59644889831543, 31.68445587158203, 32.772464752197266, 33.8604736328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 12.0, 8.0, 7.0, 10.0, 15.0, 12.0, 20.0, 27.0, 28.0, 38.0, 32.0, 41.0, 38.0, 32.0, 36.0, 33.0, 41.0, 31.0, 48.0, 29.0, 45.0, 45.0, 40.0, 33.0, 28.0, 43.0, 25.0, 31.0, 21.0, 23.0, 8.0, 20.0, 16.0, 15.0, 10.0, 12.0, 4.0, 12.0, 5.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.49609375, -5.31622314453125, -5.1363525390625, -4.95648193359375, -4.776611328125, -4.59674072265625, -4.4168701171875, -4.23699951171875, -4.05712890625, -3.87725830078125, -3.6973876953125, -3.51751708984375, -3.337646484375, -3.15777587890625, -2.9779052734375, -2.79803466796875, -2.6181640625, -2.43829345703125, -2.2584228515625, -2.07855224609375, -1.898681640625, -1.71881103515625, -1.5389404296875, -1.35906982421875, -1.17919921875, -0.99932861328125, -0.8194580078125, -0.63958740234375, -0.459716796875, -0.27984619140625, -0.0999755859375, 0.07989501953125, 0.259765625, 0.43963623046875, 0.6195068359375, 0.79937744140625, 0.979248046875, 1.15911865234375, 1.3389892578125, 1.51885986328125, 1.69873046875, 1.87860107421875, 2.0584716796875, 2.23834228515625, 2.418212890625, 2.59808349609375, 2.7779541015625, 2.95782470703125, 3.1376953125, 3.31756591796875, 3.4974365234375, 3.67730712890625, 3.857177734375, 4.03704833984375, 4.2169189453125, 4.39678955078125, 4.57666015625, 4.75653076171875, 4.9364013671875, 5.11627197265625, 5.296142578125, 5.47601318359375, 5.6558837890625, 5.83575439453125, 6.015625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 6.0, 12.0, 23.0, 25.0, 28.0, 47.0, 37.0, 56.0, 79.0, 98.0, 135.0, 157.0, 244.0, 321.0, 527.0, 803.0, 1399.0, 5190.0, 543685.0, 3604393.0, 31283.0, 2525.0, 1024.0, 626.0, 404.0, 263.0, 210.0, 178.0, 102.0, 86.0, 70.0, 47.0, 46.0, 29.0, 29.0, 21.0, 12.0, 11.0, 12.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.84375, -28.82421875, -27.8046875, -26.78515625, -25.765625, -24.74609375, -23.7265625, -22.70703125, -21.6875, -20.66796875, -19.6484375, -18.62890625, -17.609375, -16.58984375, -15.5703125, -14.55078125, -13.53125, -12.51171875, -11.4921875, -10.47265625, -9.453125, -8.43359375, -7.4140625, -6.39453125, -5.375, -4.35546875, -3.3359375, -2.31640625, -1.296875, -0.27734375, 0.7421875, 1.76171875, 2.78125, 3.80078125, 4.8203125, 5.83984375, 6.859375, 7.87890625, 8.8984375, 9.91796875, 10.9375, 11.95703125, 12.9765625, 13.99609375, 15.015625, 16.03515625, 17.0546875, 18.07421875, 19.09375, 20.11328125, 21.1328125, 22.15234375, 23.171875, 24.19140625, 25.2109375, 26.23046875, 27.25, 28.26953125, 29.2890625, 30.30859375, 31.328125, 32.34765625, 33.3671875, 34.38671875, 35.40625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 18.0, 19.0, 24.0, 40.0, 98.0, 160.0, 335.0, 590.0, 853.0, 806.0, 519.0, 290.0, 140.0, 66.0, 42.0, 23.0, 21.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.234375, -15.782958984375, -15.33154296875, -14.880126953125, -14.4287109375, -13.977294921875, -13.52587890625, -13.074462890625, -12.623046875, -12.171630859375, -11.72021484375, -11.268798828125, -10.8173828125, -10.365966796875, -9.91455078125, -9.463134765625, -9.01171875, -8.560302734375, -8.10888671875, -7.657470703125, -7.2060546875, -6.754638671875, -6.30322265625, -5.851806640625, -5.400390625, -4.948974609375, -4.49755859375, -4.046142578125, -3.5947265625, -3.143310546875, -2.69189453125, -2.240478515625, -1.7890625, -1.337646484375, -0.88623046875, -0.434814453125, 0.0166015625, 0.468017578125, 0.91943359375, 1.370849609375, 1.822265625, 2.273681640625, 2.72509765625, 3.176513671875, 3.6279296875, 4.079345703125, 4.53076171875, 4.982177734375, 5.43359375, 5.885009765625, 6.33642578125, 6.787841796875, 7.2392578125, 7.690673828125, 8.14208984375, 8.593505859375, 9.044921875, 9.496337890625, 9.94775390625, 10.399169921875, 10.8505859375, 11.302001953125, 11.75341796875, 12.204833984375, 12.65625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 8.0, 18.0, 27.0, 47.0, 101.0, 234.0, 522.0, 1296.0, 4476.0, 29440.0, 1028206.0, 3041436.0, 77940.0, 7320.0, 1904.0, 728.0, 299.0, 123.0, 49.0, 29.0, 20.0, 15.0, 10.0, 2.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.457763671875, -12.96240234375, -12.467041015625, -11.9716796875, -11.476318359375, -10.98095703125, -10.485595703125, -9.990234375, -9.494873046875, -8.99951171875, -8.504150390625, -8.0087890625, -7.513427734375, -7.01806640625, -6.522705078125, -6.02734375, -5.531982421875, -5.03662109375, -4.541259765625, -4.0458984375, -3.550537109375, -3.05517578125, -2.559814453125, -2.064453125, -1.569091796875, -1.07373046875, -0.578369140625, -0.0830078125, 0.412353515625, 0.90771484375, 1.403076171875, 1.8984375, 2.393798828125, 2.88916015625, 3.384521484375, 3.8798828125, 4.375244140625, 4.87060546875, 5.365966796875, 5.861328125, 6.356689453125, 6.85205078125, 7.347412109375, 7.8427734375, 8.338134765625, 8.83349609375, 9.328857421875, 9.82421875, 10.319580078125, 10.81494140625, 11.310302734375, 11.8056640625, 12.301025390625, 12.79638671875, 13.291748046875, 13.787109375, 14.282470703125, 14.77783203125, 15.273193359375, 15.7685546875, 16.263916015625, 16.75927734375, 17.254638671875, 17.75]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 14.0, 23.0, 49.0, 84.0, 106.0, 154.0, 145.0, 158.0, 97.0, 69.0, 42.0, 30.0, 12.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.885250091552734, -51.268924713134766, -48.65260314941406, -46.036277770996094, -43.419952392578125, -40.803627014160156, -38.18730545043945, -35.570980072021484, -32.95465850830078, -30.338335037231445, -27.722009658813477, -25.10568618774414, -22.489360809326172, -19.873037338256836, -17.2567138671875, -14.640388488769531, -12.024063110351562, -9.40773868560791, -6.791414737701416, -4.175090789794922, -1.5587663650512695, 1.0575580596923828, 3.6738815307617188, 6.2902069091796875, 8.906530380249023, 11.522854804992676, 14.139179229736328, 16.755502700805664, 19.371826171875, 21.98815155029297, 24.604475021362305, 27.220800399780273, 29.837127685546875, 32.453453063964844, 35.06977462768555, 37.686100006103516, 40.302425384521484, 42.91874694824219, 45.535072326660156, 48.151397705078125, 50.767723083496094, 53.38404846191406, 56.000370025634766, 58.616695404052734, 61.2330207824707, 63.849342346191406, 66.46566772460938, 69.08199310302734, 71.69831848144531, 74.31464385986328, 76.93096923828125, 79.54728698730469, 82.16361236572266, 84.77993774414062, 87.3962631225586, 90.01258850097656, 92.62890625, 95.24523162841797, 97.86155700683594, 100.47787475585938, 103.09420013427734, 105.71052551269531, 108.32685089111328, 110.94317626953125, 113.55950164794922]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 11.0, 15.0, 12.0, 10.0, 12.0, 20.0, 12.0, 25.0, 38.0, 31.0, 27.0, 40.0, 28.0, 38.0, 42.0, 39.0, 48.0, 41.0, 47.0, 27.0, 43.0, 43.0, 45.0, 53.0, 32.0, 29.0, 35.0, 20.0, 19.0, 18.0, 10.0, 23.0, 12.0, 8.0, 7.0, 8.0, 6.0, 4.0, 5.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.498497009277344, -31.512523651123047, -30.52655029296875, -29.540576934814453, -28.55460548400879, -27.568632125854492, -26.582658767700195, -25.5966854095459, -24.610713958740234, -23.624740600585938, -22.63876724243164, -21.652793884277344, -20.66682243347168, -19.680849075317383, -18.694875717163086, -17.70890235900879, -16.722929000854492, -15.736955642700195, -14.750983238220215, -13.765009880065918, -12.779037475585938, -11.79306411743164, -10.807090759277344, -9.821117401123047, -8.835144996643066, -7.849172115325928, -6.863199234008789, -5.877225875854492, -4.8912529945373535, -3.905280113220215, -2.919306755065918, -1.9333338737487793, -0.9473609924316406, 0.0386120080947876, 1.0245850086212158, 2.0105581283569336, 2.9965310096740723, 3.982503890991211, 4.968477249145508, 5.9544501304626465, 6.940423011779785, 7.926395893096924, 8.912368774414062, 9.89834213256836, 10.884315490722656, 11.870287895202637, 12.856261253356934, 13.842233657836914, 14.828207015991211, 15.814180374145508, 16.800153732299805, 17.78612518310547, 18.772098541259766, 19.758071899414062, 20.74404525756836, 21.730018615722656, 22.715991973876953, 23.70196533203125, 24.687938690185547, 25.673912048339844, 26.659883499145508, 27.645856857299805, 28.6318302154541, 29.6178035736084, 30.603775024414062]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 8.0, 9.0, 12.0, 13.0, 16.0, 15.0, 21.0, 22.0, 25.0, 35.0, 30.0, 46.0, 31.0, 41.0, 34.0, 42.0, 50.0, 49.0, 27.0, 45.0, 53.0, 51.0, 38.0, 26.0, 37.0, 41.0, 23.0, 24.0, 25.0, 13.0, 20.0, 9.0, 9.0, 11.0, 5.0, 8.0, 4.0, 2.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-58.78125, -57.125, -55.46875, -53.8125, -52.15625, -50.5, -48.84375, -47.1875, -45.53125, -43.875, -42.21875, -40.5625, -38.90625, -37.25, -35.59375, -33.9375, -32.28125, -30.625, -28.96875, -27.3125, -25.65625, -24.0, -22.34375, -20.6875, -19.03125, -17.375, -15.71875, -14.0625, -12.40625, -10.75, -9.09375, -7.4375, -5.78125, -4.125, -2.46875, -0.8125, 0.84375, 2.5, 4.15625, 5.8125, 7.46875, 9.125, 10.78125, 12.4375, 14.09375, 15.75, 17.40625, 19.0625, 20.71875, 22.375, 24.03125, 25.6875, 27.34375, 29.0, 30.65625, 32.3125, 33.96875, 35.625, 37.28125, 38.9375, 40.59375, 42.25, 43.90625, 45.5625, 47.21875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 19.0, 23.0, 30.0, 57.0, 88.0, 105.0, 160.0, 277.0, 429.0, 631.0, 981.0, 1503.0, 2290.0, 3632.0, 5645.0, 9074.0, 14748.0, 24521.0, 41020.0, 71545.0, 138227.0, 359680.0, 170974.0, 83221.0, 46981.0, 27783.0, 16878.0, 10342.0, 6330.0, 3998.0, 2521.0, 1677.0, 1083.0, 692.0, 470.0, 311.0, 202.0, 134.0, 83.0, 69.0, 34.0, 27.0, 16.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.1817626953125, -10.816650390625, -10.4515380859375, -10.08642578125, -9.7213134765625, -9.356201171875, -8.9910888671875, -8.6259765625, -8.2608642578125, -7.895751953125, -7.5306396484375, -7.16552734375, -6.8004150390625, -6.435302734375, -6.0701904296875, -5.705078125, -5.3399658203125, -4.974853515625, -4.6097412109375, -4.24462890625, -3.8795166015625, -3.514404296875, -3.1492919921875, -2.7841796875, -2.4190673828125, -2.053955078125, -1.6888427734375, -1.32373046875, -0.9586181640625, -0.593505859375, -0.2283935546875, 0.13671875, 0.5018310546875, 0.866943359375, 1.2320556640625, 1.59716796875, 1.9622802734375, 2.327392578125, 2.6925048828125, 3.0576171875, 3.4227294921875, 3.787841796875, 4.1529541015625, 4.51806640625, 4.8831787109375, 5.248291015625, 5.6134033203125, 5.978515625, 6.3436279296875, 6.708740234375, 7.0738525390625, 7.43896484375, 7.8040771484375, 8.169189453125, 8.5343017578125, 8.8994140625, 9.2645263671875, 9.629638671875, 9.9947509765625, 10.35986328125, 10.7249755859375, 11.090087890625, 11.4552001953125, 11.8203125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 4.0, 7.0, 8.0, 8.0, 12.0, 11.0, 11.0, 16.0, 20.0, 15.0, 21.0, 22.0, 30.0, 24.0, 35.0, 28.0, 36.0, 40.0, 36.0, 44.0, 31.0, 33.0, 1053.0, 30.0, 41.0, 51.0, 32.0, 36.0, 31.0, 26.0, 36.0, 22.0, 31.0, 24.0, 22.0, 25.0, 13.0, 12.0, 9.0, 5.0, 8.0, 3.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.109375, -27.172607421875, -26.23583984375, -25.299072265625, -24.3623046875, -23.425537109375, -22.48876953125, -21.552001953125, -20.615234375, -19.678466796875, -18.74169921875, -17.804931640625, -16.8681640625, -15.931396484375, -14.99462890625, -14.057861328125, -13.12109375, -12.184326171875, -11.24755859375, -10.310791015625, -9.3740234375, -8.437255859375, -7.50048828125, -6.563720703125, -5.626953125, -4.690185546875, -3.75341796875, -2.816650390625, -1.8798828125, -0.943115234375, -0.00634765625, 0.930419921875, 1.8671875, 2.803955078125, 3.74072265625, 4.677490234375, 5.6142578125, 6.551025390625, 7.48779296875, 8.424560546875, 9.361328125, 10.298095703125, 11.23486328125, 12.171630859375, 13.1083984375, 14.045166015625, 14.98193359375, 15.918701171875, 16.85546875, 17.792236328125, 18.72900390625, 19.665771484375, 20.6025390625, 21.539306640625, 22.47607421875, 23.412841796875, 24.349609375, 25.286376953125, 26.22314453125, 27.159912109375, 28.0966796875, 29.033447265625, 29.97021484375, 30.906982421875, 31.84375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 9.0, 4.0, 7.0, 20.0, 21.0, 29.0, 28.0, 46.0, 84.0, 92.0, 137.0, 223.0, 325.0, 486.0, 747.0, 1266.0, 1913.0, 3156.0, 4824.0, 7897.0, 12776.0, 21550.0, 36454.0, 64890.0, 122692.0, 1365933.0, 220241.0, 98654.0, 54378.0, 30995.0, 18198.0, 10855.0, 6677.0, 4074.0, 2488.0, 1651.0, 1156.0, 703.0, 494.0, 313.0, 236.0, 140.0, 87.0, 69.0, 38.0, 29.0, 16.0, 17.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-13.0625, -12.676513671875, -12.29052734375, -11.904541015625, -11.5185546875, -11.132568359375, -10.74658203125, -10.360595703125, -9.974609375, -9.588623046875, -9.20263671875, -8.816650390625, -8.4306640625, -8.044677734375, -7.65869140625, -7.272705078125, -6.88671875, -6.500732421875, -6.11474609375, -5.728759765625, -5.3427734375, -4.956787109375, -4.57080078125, -4.184814453125, -3.798828125, -3.412841796875, -3.02685546875, -2.640869140625, -2.2548828125, -1.868896484375, -1.48291015625, -1.096923828125, -0.7109375, -0.324951171875, 0.06103515625, 0.447021484375, 0.8330078125, 1.218994140625, 1.60498046875, 1.990966796875, 2.376953125, 2.762939453125, 3.14892578125, 3.534912109375, 3.9208984375, 4.306884765625, 4.69287109375, 5.078857421875, 5.46484375, 5.850830078125, 6.23681640625, 6.622802734375, 7.0087890625, 7.394775390625, 7.78076171875, 8.166748046875, 8.552734375, 8.938720703125, 9.32470703125, 9.710693359375, 10.0966796875, 10.482666015625, 10.86865234375, 11.254638671875, 11.640625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 11.0, 15.0, 13.0, 19.0, 24.0, 17.0, 35.0, 44.0, 53.0, 73.0, 141.0, 133.0, 119.0, 87.0, 31.0, 28.0, 26.0, 25.0, 17.0, 13.0, 10.0, 11.0, 6.0, 9.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01409912109375, -0.013649225234985352, -0.013199329376220703, -0.012749433517456055, -0.012299537658691406, -0.011849641799926758, -0.01139974594116211, -0.010949850082397461, -0.010499954223632812, -0.010050058364868164, -0.009600162506103516, -0.009150266647338867, -0.008700370788574219, -0.00825047492980957, -0.007800579071044922, -0.0073506832122802734, -0.006900787353515625, -0.0064508914947509766, -0.006000995635986328, -0.00555109977722168, -0.005101203918457031, -0.004651308059692383, -0.004201412200927734, -0.003751516342163086, -0.0033016204833984375, -0.002851724624633789, -0.0024018287658691406, -0.0019519329071044922, -0.0015020370483398438, -0.0010521411895751953, -0.0006022453308105469, -0.00015234947204589844, 0.00029754638671875, 0.0007474422454833984, 0.0011973381042480469, 0.0016472339630126953, 0.0020971298217773438, 0.002547025680541992, 0.0029969215393066406, 0.003446817398071289, 0.0038967132568359375, 0.004346609115600586, 0.004796504974365234, 0.005246400833129883, 0.005696296691894531, 0.00614619255065918, 0.006596088409423828, 0.0070459842681884766, 0.007495880126953125, 0.007945775985717773, 0.008395671844482422, 0.00884556770324707, 0.009295463562011719, 0.009745359420776367, 0.010195255279541016, 0.010645151138305664, 0.011095046997070312, 0.011544942855834961, 0.01199483871459961, 0.012444734573364258, 0.012894630432128906, 0.013344526290893555, 0.013794422149658203, 0.014244318008422852, 0.0146942138671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 6.0, 14.0, 12.0, 20.0, 36.0, 34.0, 64.0, 60.0, 96.0, 157.0, 225.0, 358.0, 648.0, 1281.0, 3201.0, 10472.0, 45642.0, 390281.0, 521284.0, 55642.0, 12110.0, 3631.0, 1389.0, 701.0, 374.0, 219.0, 168.0, 103.0, 98.0, 40.0, 41.0, 38.0, 22.0, 15.0, 16.0, 13.0, 4.0, 5.0, 9.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0838623046875, -0.08132553100585938, -0.07878875732421875, -0.07625198364257812, -0.0737152099609375, -0.07117843627929688, -0.06864166259765625, -0.06610488891601562, -0.063568115234375, -0.061031341552734375, -0.05849456787109375, -0.055957794189453125, -0.0534210205078125, -0.050884246826171875, -0.04834747314453125, -0.045810699462890625, -0.04327392578125, -0.040737152099609375, -0.03820037841796875, -0.035663604736328125, -0.0331268310546875, -0.030590057373046875, -0.02805328369140625, -0.025516510009765625, -0.022979736328125, -0.020442962646484375, -0.01790618896484375, -0.015369415283203125, -0.0128326416015625, -0.010295867919921875, -0.00775909423828125, -0.005222320556640625, -0.002685546875, -0.000148773193359375, 0.00238800048828125, 0.004924774169921875, 0.0074615478515625, 0.009998321533203125, 0.01253509521484375, 0.015071868896484375, 0.017608642578125, 0.020145416259765625, 0.02268218994140625, 0.025218963623046875, 0.0277557373046875, 0.030292510986328125, 0.03282928466796875, 0.035366058349609375, 0.03790283203125, 0.040439605712890625, 0.04297637939453125, 0.045513153076171875, 0.0480499267578125, 0.050586700439453125, 0.05312347412109375, 0.055660247802734375, 0.058197021484375, 0.060733795166015625, 0.06327056884765625, 0.06580734252929688, 0.0683441162109375, 0.07088088989257812, 0.07341766357421875, 0.07595443725585938, 0.0784912109375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 14.0, 41.0, 58.0, 103.0, 146.0, 193.0, 170.0, 107.0, 67.0, 49.0, 23.0, 5.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01397439930588007, -0.013517401181161404, -0.013060402125120163, -0.012603404000401497, -0.012146404944360256, -0.01168940681964159, -0.01123240776360035, -0.010775409638881683, -0.010318411514163017, -0.009861413389444351, -0.00940441433340311, -0.008947416208684444, -0.008490417152643204, -0.008033419027924538, -0.007576420437544584, -0.007119421847164631, -0.0066624232567846775, -0.006205424666404724, -0.005748426076024771, -0.005291427485644817, -0.004834429360926151, -0.004377430770546198, -0.0039204321801662445, -0.0034634338226169348, -0.0030064352322369814, -0.002549436641857028, -0.0020924382843077183, -0.001635439693927765, -0.0011784412199631333, -0.0007214427459985018, -0.0002644441556185484, 0.00019255420193076134, 0.0006495527923107147, 0.0011065512662753463, 0.0015635497402399778, 0.0020205483306199312, 0.002477546688169241, 0.0029345452785491943, 0.0033915438689291477, 0.0038485422264784575, 0.004305540584027767, 0.0047625391744077206, 0.005219537764787674, 0.00567653588950634, 0.006133534479886293, 0.006590533070266247, 0.0070475316606462, 0.0075045302510261536, 0.00796152837574482, 0.008418526500463486, 0.008875525556504726, 0.009332523681223392, 0.009789522737264633, 0.0102465208619833, 0.010703518986701965, 0.011160518042743206, 0.011617517098784447, 0.012074515223503113, 0.012531514279544353, 0.01298851240426302, 0.01344551146030426, 0.013902509585022926, 0.014359507709741592, 0.014816506765782833, 0.0152735048905015]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 3.0, 4.0, 7.0, 4.0, 10.0, 3.0, 5.0, 7.0, 12.0, 18.0, 22.0, 13.0, 22.0, 29.0, 25.0, 31.0, 35.0, 24.0, 28.0, 32.0, 39.0, 53.0, 50.0, 38.0, 39.0, 44.0, 40.0, 29.0, 42.0, 43.0, 30.0, 22.0, 21.0, 16.0, 27.0, 24.0, 25.0, 16.0, 11.0, 10.0, 15.0, 9.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005554914474487305, -0.00538150779902935, -0.005208101123571396, -0.0050346944481134415, -0.004861287772655487, -0.004687881097197533, -0.004514474421739578, -0.004341067746281624, -0.004167661070823669, -0.003994254395365715, -0.0038208477199077606, -0.003647441044449806, -0.003474034368991852, -0.0033006276935338974, -0.003127221018075943, -0.0029538143426179886, -0.002780407667160034, -0.0026070009917020798, -0.0024335943162441254, -0.002260187640786171, -0.0020867809653282166, -0.0019133742898702621, -0.0017399676144123077, -0.0015665609389543533, -0.001393154263496399, -0.0012197475880384445, -0.0010463409125804901, -0.0008729342371225357, -0.0006995275616645813, -0.0005261208862066269, -0.0003527142107486725, -0.00017930753529071808, -5.900859832763672e-06, 0.00016750581562519073, 0.00034091249108314514, 0.0005143191665410995, 0.000687725841999054, 0.0008611325174570084, 0.0010345391929149628, 0.0012079458683729172, 0.0013813525438308716, 0.001554759219288826, 0.0017281658947467804, 0.0019015725702047348, 0.002074979245662689, 0.0022483859211206436, 0.002421792596578598, 0.0025951992720365524, 0.002768605947494507, 0.0029420126229524612, 0.0031154192984104156, 0.00328882597386837, 0.0034622326493263245, 0.003635639324784279, 0.0038090460002422333, 0.003982452675700188, 0.004155859351158142, 0.0043292660266160965, 0.004502672702074051, 0.004676079377532005, 0.00484948605298996, 0.005022892728447914, 0.0051962994039058685, 0.005369706079363823, 0.005543112754821777]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 8.0, 9.0, 12.0, 13.0, 16.0, 16.0, 20.0, 22.0, 25.0, 35.0, 31.0, 45.0, 31.0, 40.0, 35.0, 42.0, 50.0, 49.0, 26.0, 46.0, 53.0, 51.0, 38.0, 25.0, 38.0, 41.0, 24.0, 23.0, 26.0, 12.0, 19.0, 10.0, 9.0, 12.0, 4.0, 8.0, 4.0, 2.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-58.78125, -57.125, -55.46875, -53.8125, -52.15625, -50.5, -48.84375, -47.1875, -45.53125, -43.875, -42.21875, -40.5625, -38.90625, -37.25, -35.59375, -33.9375, -32.28125, -30.625, -28.96875, -27.3125, -25.65625, -24.0, -22.34375, -20.6875, -19.03125, -17.375, -15.71875, -14.0625, -12.40625, -10.75, -9.09375, -7.4375, -5.78125, -4.125, -2.46875, -0.8125, 0.84375, 2.5, 4.15625, 5.8125, 7.46875, 9.125, 10.78125, 12.4375, 14.09375, 15.75, 17.40625, 19.0625, 20.71875, 22.375, 24.03125, 25.6875, 27.34375, 29.0, 30.65625, 32.3125, 33.96875, 35.625, 37.28125, 38.9375, 40.59375, 42.25, 43.90625, 45.5625, 47.21875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 0.0, 0.0, 11.0, 4.0, 7.0, 10.0, 19.0, 21.0, 32.0, 48.0, 62.0, 86.0, 139.0, 210.0, 365.0, 724.0, 1256.0, 2651.0, 6187.0, 18908.0, 84961.0, 463472.0, 377346.0, 66016.0, 15549.0, 5377.0, 2373.0, 1098.0, 625.0, 357.0, 220.0, 126.0, 97.0, 51.0, 40.0, 26.0, 25.0, 15.0, 13.0, 8.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.375, -11.9991455078125, -11.623291015625, -11.2474365234375, -10.87158203125, -10.4957275390625, -10.119873046875, -9.7440185546875, -9.3681640625, -8.9923095703125, -8.616455078125, -8.2406005859375, -7.86474609375, -7.4888916015625, -7.113037109375, -6.7371826171875, -6.361328125, -5.9854736328125, -5.609619140625, -5.2337646484375, -4.85791015625, -4.4820556640625, -4.106201171875, -3.7303466796875, -3.3544921875, -2.9786376953125, -2.602783203125, -2.2269287109375, -1.85107421875, -1.4752197265625, -1.099365234375, -0.7235107421875, -0.34765625, 0.0281982421875, 0.404052734375, 0.7799072265625, 1.15576171875, 1.5316162109375, 1.907470703125, 2.2833251953125, 2.6591796875, 3.0350341796875, 3.410888671875, 3.7867431640625, 4.16259765625, 4.5384521484375, 4.914306640625, 5.2901611328125, 5.666015625, 6.0418701171875, 6.417724609375, 6.7935791015625, 7.16943359375, 7.5452880859375, 7.921142578125, 8.2969970703125, 8.6728515625, 9.0487060546875, 9.424560546875, 9.8004150390625, 10.17626953125, 10.5521240234375, 10.927978515625, 11.3038330078125, 11.6796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 6.0, 15.0, 29.0, 33.0, 36.0, 58.0, 57.0, 70.0, 69.0, 1781.0, 445.0, 93.0, 69.0, 66.0, 53.0, 49.0, 42.0, 21.0, 14.0, 9.0, 10.0, 6.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.9375, -123.5205078125, -119.103515625, -114.6865234375, -110.26953125, -105.8525390625, -101.435546875, -97.0185546875, -92.6015625, -88.1845703125, -83.767578125, -79.3505859375, -74.93359375, -70.5166015625, -66.099609375, -61.6826171875, -57.265625, -52.8486328125, -48.431640625, -44.0146484375, -39.59765625, -35.1806640625, -30.763671875, -26.3466796875, -21.9296875, -17.5126953125, -13.095703125, -8.6787109375, -4.26171875, 0.1552734375, 4.572265625, 8.9892578125, 13.40625, 17.8232421875, 22.240234375, 26.6572265625, 31.07421875, 35.4912109375, 39.908203125, 44.3251953125, 48.7421875, 53.1591796875, 57.576171875, 61.9931640625, 66.41015625, 70.8271484375, 75.244140625, 79.6611328125, 84.078125, 88.4951171875, 92.912109375, 97.3291015625, 101.74609375, 106.1630859375, 110.580078125, 114.9970703125, 119.4140625, 123.8310546875, 128.248046875, 132.6650390625, 137.08203125, 141.4990234375, 145.916015625, 150.3330078125, 154.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 9.0, 10.0, 18.0, 19.0, 26.0, 42.0, 64.0, 80.0, 111.0, 200.0, 332.0, 498.0, 929.0, 1871.0, 7691.0, 103064.0, 2915671.0, 103053.0, 7723.0, 2004.0, 867.0, 490.0, 328.0, 191.0, 147.0, 77.0, 52.0, 40.0, 26.0, 21.0, 13.0, 4.0, 7.0, 2.0, 5.0, 0.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.78125, -23.111328125, -22.44140625, -21.771484375, -21.1015625, -20.431640625, -19.76171875, -19.091796875, -18.421875, -17.751953125, -17.08203125, -16.412109375, -15.7421875, -15.072265625, -14.40234375, -13.732421875, -13.0625, -12.392578125, -11.72265625, -11.052734375, -10.3828125, -9.712890625, -9.04296875, -8.373046875, -7.703125, -7.033203125, -6.36328125, -5.693359375, -5.0234375, -4.353515625, -3.68359375, -3.013671875, -2.34375, -1.673828125, -1.00390625, -0.333984375, 0.3359375, 1.005859375, 1.67578125, 2.345703125, 3.015625, 3.685546875, 4.35546875, 5.025390625, 5.6953125, 6.365234375, 7.03515625, 7.705078125, 8.375, 9.044921875, 9.71484375, 10.384765625, 11.0546875, 11.724609375, 12.39453125, 13.064453125, 13.734375, 14.404296875, 15.07421875, 15.744140625, 16.4140625, 17.083984375, 17.75390625, 18.423828125, 19.09375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 31.0, 56.0, 177.0, 320.0, 234.0, 107.0, 34.0, 16.0, 9.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.5985107421875, -236.3458251953125, -228.09315490722656, -219.84046936035156, -211.58779907226562, -203.33511352539062, -195.08242797851562, -186.82974243164062, -178.5770721435547, -170.3243865966797, -162.07171630859375, -153.81903076171875, -145.56634521484375, -137.3136749267578, -129.0609893798828, -120.80831146240234, -112.55563354492188, -104.3029556274414, -96.05027770996094, -87.79759216308594, -79.54491424560547, -71.292236328125, -63.039554595947266, -54.78687286376953, -46.53419494628906, -38.281517028808594, -30.02883529663086, -21.776155471801758, -13.523475646972656, -5.2707977294921875, 2.981884002685547, 11.234565734863281, 19.487213134765625, 27.739892959594727, 35.99257278442383, 44.24525451660156, 52.49793243408203, 60.7506103515625, 69.0032958984375, 77.25597381591797, 85.50865173339844, 93.7613296508789, 102.01400756835938, 110.26669311523438, 118.51937103271484, 126.77204895019531, 135.0247344970703, 143.27740478515625, 151.53009033203125, 159.78277587890625, 168.0354461669922, 176.2881317138672, 184.54080200195312, 192.79348754882812, 201.04617309570312, 209.29885864257812, 217.55152893066406, 225.80421447753906, 234.056884765625, 242.3095703125, 250.562255859375, 258.81494140625, 267.0675964355469, 275.3202819824219, 283.5729675292969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 13.0, 16.0, 18.0, 27.0, 41.0, 37.0, 38.0, 38.0, 46.0, 51.0, 59.0, 60.0, 51.0, 56.0, 66.0, 46.0, 48.0, 44.0, 30.0, 35.0, 23.0, 23.0, 19.0, 15.0, 13.0, 16.0, 11.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.2759780883789, -110.3872299194336, -106.49848937988281, -102.6097412109375, -98.72099304199219, -94.83224487304688, -90.94349670410156, -87.05475616455078, -83.16600799560547, -79.27725982666016, -75.38851928710938, -71.49977111816406, -67.61102294921875, -63.72227478027344, -59.83353042602539, -55.944786071777344, -52.05603790283203, -48.16728973388672, -44.27854537963867, -40.389801025390625, -36.50105285644531, -32.6123046875, -28.723560333251953, -24.834814071655273, -20.946067810058594, -17.057321548461914, -13.168575286865234, -9.279829025268555, -5.391082763671875, -1.5023365020751953, 2.3864097595214844, 6.275156021118164, 10.163894653320312, 14.052640914916992, 17.941387176513672, 21.83013343811035, 25.71887969970703, 29.60762596130371, 33.49637222290039, 37.38511657714844, 41.27386474609375, 45.16261291503906, 49.05135726928711, 52.940101623535156, 56.82884979248047, 60.71759796142578, 64.60633850097656, 68.49508666992188, 72.38383483886719, 76.2725830078125, 80.16133117675781, 84.0500717163086, 87.9388198852539, 91.82756805419922, 95.71630859375, 99.60505676269531, 103.49380493164062, 107.38255310058594, 111.27130126953125, 115.16004180908203, 119.04878997802734, 122.93753814697266, 126.82627868652344, 130.71502685546875, 134.60377502441406]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 11.0, 12.0, 18.0, 22.0, 26.0, 42.0, 57.0, 88.0, 116.0, 195.0, 303.0, 452.0, 635.0, 1072.0, 1629.0, 2534.0, 3845.0, 5803.0, 1020115.0, 4063.0, 2544.0, 1664.0, 1132.0, 761.0, 450.0, 284.0, 210.0, 144.0, 86.0, 63.0, 36.0, 36.0, 25.0, 17.0, 9.0, 10.0, 7.0, 10.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-26.637210845947266, -25.898723602294922, -25.160236358642578, -24.421749114990234, -23.68326187133789, -22.944774627685547, -22.206287384033203, -21.46780014038086, -20.729312896728516, -19.990825653076172, -19.252338409423828, -18.513851165771484, -17.77536392211914, -17.036876678466797, -16.298389434814453, -15.55990219116211, -14.821415901184082, -14.082928657531738, -13.344441413879395, -12.60595417022705, -11.867466926574707, -11.128979682922363, -10.390493392944336, -9.652006149291992, -8.913518905639648, -8.175031661987305, -7.436544418334961, -6.698057174682617, -5.959569931030273, -5.22108268737793, -4.482595920562744, -3.7441086769104004, -3.0056209564208984, -2.2671337127685547, -1.5286465883255005, -0.7901594638824463, -0.05167222023010254, 0.6868150234222412, 1.4253020286560059, 2.1637892723083496, 2.9022765159606934, 3.640763759613037, 4.379251003265381, 5.117737770080566, 5.85622501373291, 6.594712257385254, 7.333199501037598, 8.071686744689941, 8.810173988342285, 9.548661231994629, 10.287148475646973, 11.025635719299316, 11.76412296295166, 12.502610206604004, 13.241096496582031, 13.979583740234375, 14.718070983886719, 15.456558227539062, 16.195045471191406, 16.93353271484375, 17.672019958496094, 18.410507202148438, 19.14899444580078, 19.887481689453125, 20.62596893310547]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 10.0, 5.0, 16.0, 44.0, 48.0, 78.0, 355.0, 51462120.0, 231.0, 89.0, 24.0, 21.0, 16.0, 22.0, 20.0, 17.0, 21.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8247.9609375, -7994.0458984375, -7740.13037109375, -7486.21533203125, -7232.2998046875, -6978.384765625, -6724.4697265625, -6470.5546875, -6216.63916015625, -5962.72412109375, -5708.80859375, -5454.8935546875, -5200.978515625, -4947.06298828125, -4693.14794921875, -4439.232421875, -4185.3173828125, -3931.402099609375, -3677.48681640625, -3423.57177734375, -3169.656494140625, -2915.7412109375, -2661.826171875, -2407.910888671875, -2153.99560546875, -1900.080322265625, -1646.1651611328125, -1392.25, -1138.334716796875, -884.41943359375, -630.5042724609375, -376.589111328125, -122.67333984375, 131.24188232421875, 385.1571044921875, 639.0723266601562, 892.987548828125, 1146.90283203125, 1400.8179931640625, 1654.733154296875, 1908.6484375, 2162.563720703125, 2416.47900390625, 2670.39404296875, 2924.309326171875, 3178.224609375, 3432.1396484375, 3686.054931640625, 3939.97021484375, 4193.88525390625, 4447.80078125, 4701.7158203125, 4955.630859375, 5209.54638671875, 5463.46142578125, 5717.376953125, 5971.2919921875, 6225.20703125, 6479.12255859375, 6733.03759765625, 6986.953125, 7240.8681640625, 7494.783203125, 7748.6982421875, 8002.61376953125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 3.0, 12.0, 22.0, 28.0, 34.0, 46.0, 79.0, 117.0, 175.0, 261.0, 344.0, 485.0, 734.0, 1064.0, 1455.0, 2309.0, 3058.0, 4636.0, 6736.0, 9847.0, 14510.0, 22155.0, 32900.0, 50738.0, 78129.0, 127197.0, 215189.0, 440147.0, 3874563.0, 714150.0, 267705.0, 152500.0, 93010.0, 59932.0, 38481.0, 25382.0, 16725.0, 11482.0, 7755.0, 5409.0, 3608.0, 2622.0, 1739.0, 1273.0, 836.0, 598.0, 365.0, 253.0, 251.0, 137.0, 75.0, 65.0, 34.0, 31.0, 25.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0], "bins": [-4.69140625, -4.5433349609375, -4.395263671875, -4.2471923828125, -4.09912109375, -3.9510498046875, -3.802978515625, -3.6549072265625, -3.5068359375, -3.3587646484375, -3.210693359375, -3.0626220703125, -2.91455078125, -2.7664794921875, -2.618408203125, -2.4703369140625, -2.322265625, -2.1741943359375, -2.026123046875, -1.8780517578125, -1.72998046875, -1.5819091796875, -1.433837890625, -1.2857666015625, -1.1376953125, -0.9896240234375, -0.841552734375, -0.6934814453125, -0.54541015625, -0.3973388671875, -0.249267578125, -0.1011962890625, 0.046875, 0.1949462890625, 0.343017578125, 0.4910888671875, 0.63916015625, 0.7872314453125, 0.935302734375, 1.0833740234375, 1.2314453125, 1.3795166015625, 1.527587890625, 1.6756591796875, 1.82373046875, 1.9718017578125, 2.119873046875, 2.2679443359375, 2.416015625, 2.5640869140625, 2.712158203125, 2.8602294921875, 3.00830078125, 3.1563720703125, 3.304443359375, 3.4525146484375, 3.6005859375, 3.7486572265625, 3.896728515625, 4.0447998046875, 4.19287109375, 4.3409423828125, 4.489013671875, 4.6370849609375, 4.78515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 9.0, 7.0, 12.0, 14.0, 8.0, 22.0, 12.0, 17.0, 29.0, 38.0, 25.0, 32.0, 30.0, 39.0, 38.0, 38.0, 51.0, 112.0, 489.0, 420.0, 119.0, 78.0, 50.0, 27.0, 37.0, 28.0, 33.0, 32.0, 34.0, 34.0, 15.0, 21.0, 14.0, 6.0, 13.0, 7.0, 9.0, 5.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4140625, -11.0677490234375, -10.721435546875, -10.3751220703125, -10.02880859375, -9.6824951171875, -9.336181640625, -8.9898681640625, -8.6435546875, -8.2972412109375, -7.950927734375, -7.6046142578125, -7.25830078125, -6.9119873046875, -6.565673828125, -6.2193603515625, -5.873046875, -5.5267333984375, -5.180419921875, -4.8341064453125, -4.48779296875, -4.1414794921875, -3.795166015625, -3.4488525390625, -3.1025390625, -2.7562255859375, -2.409912109375, -2.0635986328125, -1.71728515625, -1.3709716796875, -1.024658203125, -0.6783447265625, -0.33203125, 0.0142822265625, 0.360595703125, 0.7069091796875, 1.05322265625, 1.3995361328125, 1.745849609375, 2.0921630859375, 2.4384765625, 2.7847900390625, 3.131103515625, 3.4774169921875, 3.82373046875, 4.1700439453125, 4.516357421875, 4.8626708984375, 5.208984375, 5.5552978515625, 5.901611328125, 6.2479248046875, 6.59423828125, 6.9405517578125, 7.286865234375, 7.6331787109375, 7.9794921875, 8.3258056640625, 8.672119140625, 9.0184326171875, 9.36474609375, 9.7110595703125, 10.057373046875, 10.4036865234375, 10.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 13.0, 16.0, 5.0, 25.0, 35.0, 55.0, 71.0, 118.0, 220.0, 308.0, 479.0, 666.0, 971.0, 1348.0, 1795.0, 2952.0, 4595.0, 6967.0, 10305.0, 14677.0, 22015.0, 33608.0, 54609.0, 86491.0, 148523.0, 283714.0, 805877.0, 3790786.0, 482128.0, 215769.0, 120129.0, 72001.0, 43642.0, 29207.0, 19466.0, 12282.0, 8026.0, 5714.0, 3957.0, 2626.0, 1869.0, 1104.0, 764.0, 513.0, 346.0, 214.0, 120.0, 78.0, 85.0, 41.0, 29.0, 37.0, 11.0, 18.0, 6.0, 2.0, 3.0, 11.0], "bins": [-5.37109375, -5.2098388671875, -5.048583984375, -4.8873291015625, -4.72607421875, -4.5648193359375, -4.403564453125, -4.2423095703125, -4.0810546875, -3.9197998046875, -3.758544921875, -3.5972900390625, -3.43603515625, -3.2747802734375, -3.113525390625, -2.9522705078125, -2.791015625, -2.6297607421875, -2.468505859375, -2.3072509765625, -2.14599609375, -1.9847412109375, -1.823486328125, -1.6622314453125, -1.5009765625, -1.3397216796875, -1.178466796875, -1.0172119140625, -0.85595703125, -0.6947021484375, -0.533447265625, -0.3721923828125, -0.2109375, -0.0496826171875, 0.111572265625, 0.2728271484375, 0.43408203125, 0.5953369140625, 0.756591796875, 0.9178466796875, 1.0791015625, 1.2403564453125, 1.401611328125, 1.5628662109375, 1.72412109375, 1.8853759765625, 2.046630859375, 2.2078857421875, 2.369140625, 2.5303955078125, 2.691650390625, 2.8529052734375, 3.01416015625, 3.1754150390625, 3.336669921875, 3.4979248046875, 3.6591796875, 3.8204345703125, 3.981689453125, 4.1429443359375, 4.30419921875, 4.4654541015625, 4.626708984375, 4.7879638671875, 4.94921875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 6.0, 8.0, 8.0, 8.0, 12.0, 13.0, 8.0, 8.0, 14.0, 22.0, 26.0, 27.0, 20.0, 37.0, 31.0, 31.0, 43.0, 48.0, 58.0, 89.0, 199.0, 579.0, 195.0, 94.0, 63.0, 39.0, 50.0, 36.0, 42.0, 29.0, 22.0, 21.0, 17.0, 18.0, 19.0, 17.0, 18.0, 9.0, 11.0, 6.0, 7.0, 5.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.0390625, -7.7984619140625, -7.557861328125, -7.3172607421875, -7.07666015625, -6.8360595703125, -6.595458984375, -6.3548583984375, -6.1142578125, -5.8736572265625, -5.633056640625, -5.3924560546875, -5.15185546875, -4.9112548828125, -4.670654296875, -4.4300537109375, -4.189453125, -3.9488525390625, -3.708251953125, -3.4676513671875, -3.22705078125, -2.9864501953125, -2.745849609375, -2.5052490234375, -2.2646484375, -2.0240478515625, -1.783447265625, -1.5428466796875, -1.30224609375, -1.0616455078125, -0.821044921875, -0.5804443359375, -0.33984375, -0.0992431640625, 0.141357421875, 0.3819580078125, 0.62255859375, 0.8631591796875, 1.103759765625, 1.3443603515625, 1.5849609375, 1.8255615234375, 2.066162109375, 2.3067626953125, 2.54736328125, 2.7879638671875, 3.028564453125, 3.2691650390625, 3.509765625, 3.7503662109375, 3.990966796875, 4.2315673828125, 4.47216796875, 4.7127685546875, 4.953369140625, 5.1939697265625, 5.4345703125, 5.6751708984375, 5.915771484375, 6.1563720703125, 6.39697265625, 6.6375732421875, 6.878173828125, 7.1187744140625, 7.359375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 6.0, 3.0, 0.0, 13.0, 21.0, 20.0, 44.0, 35.0, 39.0, 75.0, 62.0, 98.0, 152.0, 206.0, 303.0, 348.0, 416.0, 719.0, 1019.0, 1409.0, 2710.0, 4214.0, 8607.0, 18882.0, 60060.0, 5808777.0, 304903.0, 44994.0, 15539.0, 6999.0, 3710.0, 2218.0, 1505.0, 949.0, 638.0, 474.0, 275.0, 302.0, 202.0, 103.0, 94.0, 74.0, 30.0, 41.0, 36.0, 31.0, 14.0, 16.0, 23.0, 11.0, 6.0, 13.0, 0.0, 0.0, 0.0, 6.0], "bins": [-20.1875, -19.591796875, -18.99609375, -18.400390625, -17.8046875, -17.208984375, -16.61328125, -16.017578125, -15.421875, -14.826171875, -14.23046875, -13.634765625, -13.0390625, -12.443359375, -11.84765625, -11.251953125, -10.65625, -10.060546875, -9.46484375, -8.869140625, -8.2734375, -7.677734375, -7.08203125, -6.486328125, -5.890625, -5.294921875, -4.69921875, -4.103515625, -3.5078125, -2.912109375, -2.31640625, -1.720703125, -1.125, -0.529296875, 0.06640625, 0.662109375, 1.2578125, 1.853515625, 2.44921875, 3.044921875, 3.640625, 4.236328125, 4.83203125, 5.427734375, 6.0234375, 6.619140625, 7.21484375, 7.810546875, 8.40625, 9.001953125, 9.59765625, 10.193359375, 10.7890625, 11.384765625, 11.98046875, 12.576171875, 13.171875, 13.767578125, 14.36328125, 14.958984375, 15.5546875, 16.150390625, 16.74609375, 17.341796875, 17.9375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 13.0, 16.0, 16.0, 20.0, 27.0, 21.0, 36.0, 27.0, 41.0, 46.0, 37.0, 53.0, 75.0, 141.0, 345.0, 397.0, 163.0, 97.0, 66.0, 66.0, 48.0, 40.0, 23.0, 29.0, 14.0, 27.0, 12.0, 17.0, 14.0, 15.0, 11.0, 7.0, 4.0, 7.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-6.97265625, -6.77923583984375, -6.5858154296875, -6.39239501953125, -6.198974609375, -6.00555419921875, -5.8121337890625, -5.61871337890625, -5.42529296875, -5.23187255859375, -5.0384521484375, -4.84503173828125, -4.651611328125, -4.45819091796875, -4.2647705078125, -4.07135009765625, -3.8779296875, -3.68450927734375, -3.4910888671875, -3.29766845703125, -3.104248046875, -2.91082763671875, -2.7174072265625, -2.52398681640625, -2.33056640625, -2.13714599609375, -1.9437255859375, -1.75030517578125, -1.556884765625, -1.36346435546875, -1.1700439453125, -0.97662353515625, -0.783203125, -0.58978271484375, -0.3963623046875, -0.20294189453125, -0.009521484375, 0.18389892578125, 0.3773193359375, 0.57073974609375, 0.76416015625, 0.95758056640625, 1.1510009765625, 1.34442138671875, 1.537841796875, 1.73126220703125, 1.9246826171875, 2.11810302734375, 2.3115234375, 2.50494384765625, 2.6983642578125, 2.89178466796875, 3.085205078125, 3.27862548828125, 3.4720458984375, 3.66546630859375, 3.85888671875, 4.05230712890625, 4.2457275390625, 4.43914794921875, 4.632568359375, 4.82598876953125, 5.0194091796875, 5.21282958984375, 5.40625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 25.0, 57.0, 465.0, 372.0, 55.0, 23.0, 7.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.42376136779785, -16.574420928955078, -14.725079536437988, -12.875739097595215, -11.026397705078125, -9.177057266235352, -7.327716827392578, -5.478375434875488, -3.629034996032715, -1.7796941995620728, 0.06964659690856934, 1.9189872741699219, 3.7683281898498535, 5.617669105529785, 7.467009544372559, 9.316350936889648, 11.165691375732422, 13.015031814575195, 14.864373207092285, 16.713714599609375, 18.56305503845215, 20.412395477294922, 22.261735916137695, 24.11107635498047, 25.960418701171875, 27.80975914001465, 29.659099578857422, 31.508441925048828, 33.35778045654297, 35.207122802734375, 37.05646514892578, 38.90580368041992, 40.75514602661133, 42.604488372802734, 44.453826904296875, 46.30316925048828, 48.15250778198242, 50.00185012817383, 51.85118865966797, 53.700531005859375, 55.54987335205078, 57.39921569824219, 59.24855422973633, 61.097896575927734, 62.947235107421875, 64.79657745361328, 66.64591979980469, 68.4952621459961, 70.34459686279297, 72.19393920898438, 74.04328155517578, 75.89261627197266, 77.74195861816406, 79.59130096435547, 81.44064331054688, 83.28998565673828, 85.13932800292969, 86.9886703491211, 88.8380126953125, 90.68734741210938, 92.53668975830078, 94.38603210449219, 96.2353744506836, 98.084716796875, 99.93405151367188]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 15.0, 3.0, 11.0, 10.0, 11.0, 25.0, 24.0, 19.0, 25.0, 36.0, 27.0, 32.0, 26.0, 46.0, 33.0, 33.0, 50.0, 36.0, 47.0, 36.0, 39.0, 49.0, 39.0, 50.0, 38.0, 25.0, 26.0, 24.0, 25.0, 25.0, 18.0, 12.0, 18.0, 11.0, 3.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-9.475214004516602, -9.20776653289795, -8.940320014953613, -8.672872543334961, -8.405425071716309, -8.137977600097656, -7.87053108215332, -7.603083610534668, -7.335636615753174, -7.06818962097168, -6.800742149353027, -6.533295154571533, -6.265848159790039, -5.998400688171387, -5.730953693389893, -5.463506698608398, -5.196059226989746, -4.928612232208252, -4.6611647605896, -4.3937177658081055, -4.126270294189453, -3.858823299407959, -3.591376304626465, -3.3239290714263916, -3.0564818382263184, -2.789034605026245, -2.521587371826172, -2.2541403770446777, -1.9866931438446045, -1.7192459106445312, -1.4517987966537476, -1.1843516826629639, -0.9169044494628906, -0.6494572758674622, -0.3820101022720337, -0.11456292867660522, 0.15288424491882324, 0.4203314781188965, 0.6877785921096802, 0.9552257061004639, 1.222672939300537, 1.4901201725006104, 1.757567286491394, 2.0250144004821777, 2.292461633682251, 2.559908866882324, 2.8273558616638184, 3.0948030948638916, 3.362250328063965, 3.629697561264038, 3.8971447944641113, 4.1645917892456055, 4.432039260864258, 4.699486255645752, 4.966933250427246, 5.234380722045898, 5.501827716827393, 5.769274711608887, 6.036722183227539, 6.304169178009033, 6.571616172790527, 6.83906364440918, 7.106510639190674, 7.373957633972168, 7.64140510559082]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 10.0, 13.0, 13.0, 11.0, 27.0, 36.0, 44.0, 57.0, 102.0, 170.0, 307.0, 521.0, 1041.0, 2218.0, 5508.0, 19240.0, 4009994.0, 135246.0, 12026.0, 4043.0, 1732.0, 831.0, 445.0, 220.0, 139.0, 78.0, 62.0, 27.0, 25.0, 15.0, 15.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.039398193359375, -0.0381627082824707, -0.036927223205566406, -0.03569173812866211, -0.03445625305175781, -0.033220767974853516, -0.03198528289794922, -0.030749797821044922, -0.029514312744140625, -0.028278827667236328, -0.02704334259033203, -0.025807857513427734, -0.024572372436523438, -0.02333688735961914, -0.022101402282714844, -0.020865917205810547, -0.01963043212890625, -0.018394947052001953, -0.017159461975097656, -0.01592397689819336, -0.014688491821289062, -0.013453006744384766, -0.012217521667480469, -0.010982036590576172, -0.009746551513671875, -0.008511066436767578, -0.007275581359863281, -0.006040096282958984, -0.0048046112060546875, -0.0035691261291503906, -0.0023336410522460938, -0.0010981559753417969, 0.0001373291015625, 0.0013728141784667969, 0.0026082992553710938, 0.0038437843322753906, 0.0050792694091796875, 0.006314754486083984, 0.007550239562988281, 0.008785724639892578, 0.010021209716796875, 0.011256694793701172, 0.012492179870605469, 0.013727664947509766, 0.014963150024414062, 0.01619863510131836, 0.017434120178222656, 0.018669605255126953, 0.01990509033203125, 0.021140575408935547, 0.022376060485839844, 0.02361154556274414, 0.024847030639648438, 0.026082515716552734, 0.02731800079345703, 0.028553485870361328, 0.029788970947265625, 0.031024456024169922, 0.03225994110107422, 0.033495426177978516, 0.03473091125488281, 0.03596639633178711, 0.037201881408691406, 0.0384373664855957, 0.0396728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 6.0, 7.0, 21.0, 14.0, 11.0, 11.0, 20.0, 762.0, 23.0, 14.0, 21.0, 10.0, 12.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004222869873046875, -0.004107028245925903, -0.003991186618804932, -0.00387534499168396, -0.0037595033645629883, -0.0036436617374420166, -0.003527820110321045, -0.0034119784832000732, -0.0032961368560791016, -0.00318029522895813, -0.003064453601837158, -0.0029486119747161865, -0.002832770347595215, -0.002716928720474243, -0.0026010870933532715, -0.0024852454662323, -0.002369403839111328, -0.0022535622119903564, -0.0021377205848693848, -0.002021878957748413, -0.0019060373306274414, -0.0017901957035064697, -0.001674354076385498, -0.0015585124492645264, -0.0014426708221435547, -0.001326829195022583, -0.0012109875679016113, -0.0010951459407806396, -0.000979304313659668, -0.0008634626865386963, -0.0007476210594177246, -0.0006317794322967529, -0.0005159378051757812, -0.00040009617805480957, -0.0002842545509338379, -0.0001684129238128662, -5.257129669189453e-05, 6.327033042907715e-05, 0.00017911195755004883, 0.0002949535846710205, 0.0004107952117919922, 0.0005266368389129639, 0.0006424784660339355, 0.0007583200931549072, 0.0008741617202758789, 0.0009900033473968506, 0.0011058449745178223, 0.001221686601638794, 0.0013375282287597656, 0.0014533698558807373, 0.001569211483001709, 0.0016850531101226807, 0.0018008947372436523, 0.001916736364364624, 0.0020325779914855957, 0.0021484196186065674, 0.002264261245727539, 0.0023801028728485107, 0.0024959444999694824, 0.002611786127090454, 0.0027276277542114258, 0.0028434693813323975, 0.002959311008453369, 0.003075152635574341, 0.0031909942626953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 9.0, 11.0, 15.0, 14.0, 22.0, 37.0, 56.0, 89.0, 137.0, 185.0, 347.0, 556.0, 1114.0, 2370.0, 5879.0, 17850.0, 80682.0, 3492036.0, 524193.0, 47802.0, 12362.0, 4397.0, 1839.0, 946.0, 517.0, 291.0, 170.0, 117.0, 79.0, 52.0, 32.0, 21.0, 16.0, 13.0, 11.0, 10.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031890869140625, -0.03092026710510254, -0.029949665069580078, -0.028979063034057617, -0.028008460998535156, -0.027037858963012695, -0.026067256927490234, -0.025096654891967773, -0.024126052856445312, -0.02315545082092285, -0.02218484878540039, -0.02121424674987793, -0.02024364471435547, -0.019273042678833008, -0.018302440643310547, -0.017331838607788086, -0.016361236572265625, -0.015390634536743164, -0.014420032501220703, -0.013449430465698242, -0.012478828430175781, -0.01150822639465332, -0.01053762435913086, -0.009567022323608398, -0.008596420288085938, -0.0076258182525634766, -0.006655216217041016, -0.005684614181518555, -0.004714012145996094, -0.003743410110473633, -0.002772808074951172, -0.001802206039428711, -0.00083160400390625, 0.00013899803161621094, 0.0011096000671386719, 0.002080202102661133, 0.0030508041381835938, 0.004021406173706055, 0.004992008209228516, 0.0059626102447509766, 0.0069332122802734375, 0.007903814315795898, 0.00887441635131836, 0.00984501838684082, 0.010815620422363281, 0.011786222457885742, 0.012756824493408203, 0.013727426528930664, 0.014698028564453125, 0.015668630599975586, 0.016639232635498047, 0.017609834671020508, 0.01858043670654297, 0.01955103874206543, 0.02052164077758789, 0.02149224281311035, 0.022462844848632812, 0.023433446884155273, 0.024404048919677734, 0.025374650955200195, 0.026345252990722656, 0.027315855026245117, 0.028286457061767578, 0.02925705909729004, 0.0302276611328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 11.0, 10.0, 21.0, 19.0, 31.0, 39.0, 59.0, 65.0, 90.0, 143.0, 203.0, 704.0, 1880.0, 307.0, 140.0, 104.0, 64.0, 46.0, 23.0, 26.0, 24.0, 14.0, 9.0, 11.0, 5.0, 5.0, 1.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00608062744140625, -0.0058858394622802734, -0.005691051483154297, -0.00549626350402832, -0.005301475524902344, -0.005106687545776367, -0.004911899566650391, -0.004717111587524414, -0.0045223236083984375, -0.004327535629272461, -0.004132747650146484, -0.003937959671020508, -0.0037431716918945312, -0.0035483837127685547, -0.003353595733642578, -0.0031588077545166016, -0.002964019775390625, -0.0027692317962646484, -0.002574443817138672, -0.0023796558380126953, -0.0021848678588867188, -0.001990079879760742, -0.0017952919006347656, -0.001600503921508789, -0.0014057159423828125, -0.001210927963256836, -0.0010161399841308594, -0.0008213520050048828, -0.0006265640258789062, -0.0004317760467529297, -0.00023698806762695312, -4.220008850097656e-05, 0.000152587890625, 0.00034737586975097656, 0.0005421638488769531, 0.0007369518280029297, 0.0009317398071289062, 0.0011265277862548828, 0.0013213157653808594, 0.001516103744506836, 0.0017108917236328125, 0.001905679702758789, 0.0021004676818847656, 0.002295255661010742, 0.0024900436401367188, 0.0026848316192626953, 0.002879619598388672, 0.0030744075775146484, 0.003269195556640625, 0.0034639835357666016, 0.003658771514892578, 0.0038535594940185547, 0.004048347473144531, 0.004243135452270508, 0.004437923431396484, 0.004632711410522461, 0.0048274993896484375, 0.005022287368774414, 0.005217075347900391, 0.005411863327026367, 0.005606651306152344, 0.00580143928527832, 0.005996227264404297, 0.0061910152435302734, 0.00638580322265625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 2.0, 9.0, 27.0, 78.0, 303.0, 422.0, 123.0, 26.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1435861587524414, -0.14048056304454803, -0.13737498223781586, -0.13426938652992249, -0.1311637908220291, -0.12805821001529694, -0.12495261430740356, -0.12184701859951019, -0.11874143034219742, -0.11563584208488464, -0.11253024637699127, -0.1094246581196785, -0.10631906986236572, -0.10321347415447235, -0.10010788589715958, -0.0970022976398468, -0.09389670193195343, -0.09079111367464066, -0.08768551796674728, -0.08457992970943451, -0.08147434145212173, -0.07836874574422836, -0.07526315748691559, -0.07215756177902222, -0.06905198097229004, -0.06594639271497726, -0.06284079700708389, -0.05973520874977112, -0.056629616767168045, -0.05352402478456497, -0.0504184365272522, -0.047312844544649124, -0.04420725256204605, -0.04110166057944298, -0.0379960723221302, -0.03489048033952713, -0.03178488835692406, -0.028679298236966133, -0.02557370811700821, -0.022468116134405136, -0.019362526014447212, -0.01625693589448929, -0.013151343911886215, -0.010045753791928291, -0.006940162740647793, -0.0038345716893672943, -0.0007289815694093704, 0.0023766104131937027, 0.005482200533151627, 0.008587791584432125, 0.011693382635712624, 0.014798972755670547, 0.01790456473827362, 0.021010154858231544, 0.02411574497818947, 0.02722133696079254, 0.030326927080750465, 0.03343251720070839, 0.03653810918331146, 0.03964369744062424, 0.04274928942322731, 0.04585488140583038, 0.04896046966314316, 0.05206606537103653, 0.055171653628349304]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 17.0, 14.0, 18.0, 19.0, 24.0, 34.0, 26.0, 40.0, 38.0, 48.0, 44.0, 52.0, 54.0, 63.0, 58.0, 56.0, 53.0, 60.0, 47.0, 37.0, 35.0, 33.0, 35.0, 23.0, 9.0, 13.0, 16.0, 11.0, 4.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017418265342712402, -0.016780920326709747, -0.01614357717335224, -0.015506233088672161, -0.01486888900399208, -0.014231544919312, -0.01359420083463192, -0.01295685674995184, -0.012319512665271759, -0.011682168580591679, -0.011044824495911598, -0.010407480411231518, -0.009770136326551437, -0.009132792241871357, -0.008495448157191277, -0.007858104072511196, -0.007220759987831116, -0.006583415903151035, -0.005946071818470955, -0.0053087277337908745, -0.004671383649110794, -0.004034039564430714, -0.0033966954797506332, -0.002759351395070553, -0.0021220073103904724, -0.001484663225710392, -0.0008473191410303116, -0.00020997505635023117, 0.00042736902832984924, 0.0010647131130099297, 0.00170205719769001, 0.0023394012823700905, 0.002976745367050171, 0.0036140894517302513, 0.004251433536410332, 0.004888777621090412, 0.0055261217057704926, 0.006163465790450573, 0.006800809875130653, 0.007438153959810734, 0.008075498044490814, 0.008712842129170895, 0.009350186213850975, 0.009987530298531055, 0.010624874383211136, 0.011262218467891216, 0.011899562552571297, 0.012536906637251377, 0.013174250721931458, 0.013811594806611538, 0.014448938891291618, 0.015086282975971699, 0.01572362706065178, 0.016360972076654434, 0.01699831523001194, 0.017635658383369446, 0.0182730033993721, 0.018910348415374756, 0.01954769156873226, 0.020185034722089767, 0.020822379738092422, 0.021459724754095078, 0.022097067907452583, 0.02273441106081009, 0.023371756076812744]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 1.0, 4.0, 4.0, 12.0, 7.0, 11.0, 20.0, 19.0, 45.0, 48.0, 75.0, 102.0, 133.0, 215.0, 309.0, 495.0, 717.0, 1243.0, 2069.0, 3611.0, 6892.0, 14739.0, 41398.0, 888360.0, 54608.0, 16114.0, 7499.0, 3946.0, 2176.0, 1317.0, 792.0, 530.0, 334.0, 209.0, 155.0, 104.0, 56.0, 54.0, 33.0, 30.0, 19.0, 17.0, 12.0, 8.0, 1.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0382080078125, -0.03706979751586914, -0.03593158721923828, -0.03479337692260742, -0.03365516662597656, -0.0325169563293457, -0.031378746032714844, -0.030240535736083984, -0.029102325439453125, -0.027964115142822266, -0.026825904846191406, -0.025687694549560547, -0.024549484252929688, -0.023411273956298828, -0.02227306365966797, -0.02113485336303711, -0.01999664306640625, -0.01885843276977539, -0.01772022247314453, -0.016582012176513672, -0.015443801879882812, -0.014305591583251953, -0.013167381286621094, -0.012029170989990234, -0.010890960693359375, -0.009752750396728516, -0.008614540100097656, -0.007476329803466797, -0.0063381195068359375, -0.005199909210205078, -0.004061698913574219, -0.0029234886169433594, -0.0017852783203125, -0.0006470680236816406, 0.0004911422729492188, 0.0016293525695800781, 0.0027675628662109375, 0.003905773162841797, 0.005043983459472656, 0.006182193756103516, 0.007320404052734375, 0.008458614349365234, 0.009596824645996094, 0.010735034942626953, 0.011873245239257812, 0.013011455535888672, 0.014149665832519531, 0.01528787612915039, 0.01642608642578125, 0.01756429672241211, 0.01870250701904297, 0.019840717315673828, 0.020978927612304688, 0.022117137908935547, 0.023255348205566406, 0.024393558502197266, 0.025531768798828125, 0.026669979095458984, 0.027808189392089844, 0.028946399688720703, 0.030084609985351562, 0.031222820281982422, 0.03236103057861328, 0.03349924087524414, 0.034637451171875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 11.0, 16.0, 12.0, 19.0, 46.0, 332.0, 368.0, 69.0, 18.0, 8.0, 16.0, 8.0, 2.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004180908203125, -0.004064470529556274, -0.003948032855987549, -0.0038315951824188232, -0.0037151575088500977, -0.003598719835281372, -0.0034822821617126465, -0.003365844488143921, -0.0032494068145751953, -0.0031329691410064697, -0.003016531467437744, -0.0029000937938690186, -0.002783656120300293, -0.0026672184467315674, -0.002550780773162842, -0.002434343099594116, -0.0023179054260253906, -0.002201467752456665, -0.0020850300788879395, -0.001968592405319214, -0.0018521547317504883, -0.0017357170581817627, -0.0016192793846130371, -0.0015028417110443115, -0.001386404037475586, -0.0012699663639068604, -0.0011535286903381348, -0.0010370910167694092, -0.0009206533432006836, -0.000804215669631958, -0.0006877779960632324, -0.0005713403224945068, -0.00045490264892578125, -0.00033846497535705566, -0.00022202730178833008, -0.00010558962821960449, 1.0848045349121094e-05, 0.00012728571891784668, 0.00024372339248657227, 0.00036016106605529785, 0.00047659873962402344, 0.000593036413192749, 0.0007094740867614746, 0.0008259117603302002, 0.0009423494338989258, 0.0010587871074676514, 0.001175224781036377, 0.0012916624546051025, 0.0014081001281738281, 0.0015245378017425537, 0.0016409754753112793, 0.0017574131488800049, 0.0018738508224487305, 0.001990288496017456, 0.0021067261695861816, 0.0022231638431549072, 0.002339601516723633, 0.0024560391902923584, 0.002572476863861084, 0.0026889145374298096, 0.002805352210998535, 0.0029217898845672607, 0.0030382275581359863, 0.003154665231704712, 0.0032711029052734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 9.0, 29.0, 28.0, 36.0, 43.0, 54.0, 80.0, 140.0, 196.0, 250.0, 360.0, 645.0, 1107.0, 1850.0, 3812.0, 9320.0, 41818.0, 761933.0, 194365.0, 19795.0, 6023.0, 2825.0, 1386.0, 825.0, 512.0, 330.0, 249.0, 153.0, 105.0, 65.0, 46.0, 39.0, 27.0, 21.0, 23.0, 7.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.057708740234375, -0.05613994598388672, -0.05457115173339844, -0.053002357482910156, -0.051433563232421875, -0.049864768981933594, -0.04829597473144531, -0.04672718048095703, -0.04515838623046875, -0.04358959197998047, -0.04202079772949219, -0.040452003479003906, -0.038883209228515625, -0.037314414978027344, -0.03574562072753906, -0.03417682647705078, -0.0326080322265625, -0.03103923797607422, -0.029470443725585938, -0.027901649475097656, -0.026332855224609375, -0.024764060974121094, -0.023195266723632812, -0.02162647247314453, -0.02005767822265625, -0.01848888397216797, -0.016920089721679688, -0.015351295471191406, -0.013782501220703125, -0.012213706970214844, -0.010644912719726562, -0.009076118469238281, -0.00750732421875, -0.005938529968261719, -0.0043697357177734375, -0.0028009414672851562, -0.001232147216796875, 0.00033664703369140625, 0.0019054412841796875, 0.0034742355346679688, 0.00504302978515625, 0.006611824035644531, 0.008180618286132812, 0.009749412536621094, 0.011318206787109375, 0.012887001037597656, 0.014455795288085938, 0.01602458953857422, 0.0175933837890625, 0.01916217803955078, 0.020730972290039062, 0.022299766540527344, 0.023868560791015625, 0.025437355041503906, 0.027006149291992188, 0.02857494354248047, 0.03014373779296875, 0.03171253204345703, 0.03328132629394531, 0.034850120544433594, 0.036418914794921875, 0.037987709045410156, 0.03955650329589844, 0.04112529754638672, 0.042694091796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 16.0, 8.0, 19.0, 21.0, 21.0, 16.0, 29.0, 32.0, 23.0, 33.0, 45.0, 26.0, 41.0, 42.0, 31.0, 47.0, 35.0, 37.0, 32.0, 33.0, 33.0, 39.0, 30.0, 39.0, 31.0, 28.0, 27.0, 19.0, 22.0, 18.0, 15.0, 12.0, 15.0, 11.0, 11.0, 4.0, 9.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0128021240234375, -0.012413501739501953, -0.012024879455566406, -0.01163625717163086, -0.011247634887695312, -0.010859012603759766, -0.010470390319824219, -0.010081768035888672, -0.009693145751953125, -0.009304523468017578, -0.008915901184082031, -0.008527278900146484, -0.008138656616210938, -0.007750034332275391, -0.007361412048339844, -0.006972789764404297, -0.00658416748046875, -0.006195545196533203, -0.005806922912597656, -0.005418300628662109, -0.0050296783447265625, -0.004641056060791016, -0.004252433776855469, -0.003863811492919922, -0.003475189208984375, -0.003086566925048828, -0.0026979446411132812, -0.0023093223571777344, -0.0019207000732421875, -0.0015320777893066406, -0.0011434555053710938, -0.0007548332214355469, -0.0003662109375, 2.2411346435546875e-05, 0.00041103363037109375, 0.0007996559143066406, 0.0011882781982421875, 0.0015769004821777344, 0.0019655227661132812, 0.002354145050048828, 0.002742767333984375, 0.003131389617919922, 0.0035200119018554688, 0.003908634185791016, 0.0042972564697265625, 0.004685878753662109, 0.005074501037597656, 0.005463123321533203, 0.00585174560546875, 0.006240367889404297, 0.006628990173339844, 0.007017612457275391, 0.0074062347412109375, 0.007794857025146484, 0.008183479309082031, 0.008572101593017578, 0.008960723876953125, 0.009349346160888672, 0.009737968444824219, 0.010126590728759766, 0.010515213012695312, 0.01090383529663086, 0.011292457580566406, 0.011681079864501953, 0.0120697021484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 14.0, 15.0, 22.0, 38.0, 55.0, 73.0, 110.0, 206.0, 282.0, 504.0, 1043.0, 2443.0, 8236.0, 82512.0, 920127.0, 24687.0, 4671.0, 1623.0, 725.0, 452.0, 241.0, 149.0, 87.0, 61.0, 47.0, 33.0, 16.0, 23.0, 14.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.07333564758300781, -0.07074356079101562, -0.06815147399902344, -0.06555938720703125, -0.06296730041503906, -0.060375213623046875, -0.05778312683105469, -0.0551910400390625, -0.05259895324707031, -0.050006866455078125, -0.04741477966308594, -0.04482269287109375, -0.04223060607910156, -0.039638519287109375, -0.03704643249511719, -0.034454345703125, -0.03186225891113281, -0.029270172119140625, -0.026678085327148438, -0.02408599853515625, -0.021493911743164062, -0.018901824951171875, -0.016309738159179688, -0.0137176513671875, -0.011125564575195312, -0.008533477783203125, -0.0059413909912109375, -0.00334930419921875, -0.0007572174072265625, 0.001834869384765625, 0.0044269561767578125, 0.00701904296875, 0.009611129760742188, 0.012203216552734375, 0.014795303344726562, 0.01738739013671875, 0.019979476928710938, 0.022571563720703125, 0.025163650512695312, 0.0277557373046875, 0.030347824096679688, 0.032939910888671875, 0.03553199768066406, 0.03812408447265625, 0.04071617126464844, 0.043308258056640625, 0.04590034484863281, 0.048492431640625, 0.05108451843261719, 0.053676605224609375, 0.05626869201660156, 0.05886077880859375, 0.06145286560058594, 0.06404495239257812, 0.06663703918457031, 0.0692291259765625, 0.07182121276855469, 0.07441329956054688, 0.07700538635253906, 0.07959747314453125, 0.08218955993652344, 0.08478164672851562, 0.08737373352050781, 0.0899658203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 12.0, 14.0, 12.0, 22.0, 18.0, 25.0, 47.0, 101.0, 210.0, 192.0, 92.0, 46.0, 35.0, 29.0, 28.0, 12.0, 7.0, 10.0, 15.0, 7.0, 7.0, 7.0, 2.0, 2.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014486312866210938, -0.0014046579599380493, -0.0013606846332550049, -0.0013167113065719604, -0.001272737979888916, -0.0012287646532058716, -0.0011847913265228271, -0.0011408179998397827, -0.0010968446731567383, -0.0010528713464736938, -0.0010088980197906494, -0.000964924693107605, -0.0009209513664245605, -0.0008769780397415161, -0.0008330047130584717, -0.0007890313863754272, -0.0007450580596923828, -0.0007010847330093384, -0.0006571114063262939, -0.0006131380796432495, -0.0005691647529602051, -0.0005251914262771606, -0.0004812180995941162, -0.0004372447729110718, -0.00039327144622802734, -0.0003492981195449829, -0.0003053247928619385, -0.00026135146617889404, -0.0002173781394958496, -0.00017340481281280518, -0.00012943148612976074, -8.545815944671631e-05, -4.1484832763671875e-05, 2.4884939193725586e-06, 4.646182060241699e-05, 9.043514728546143e-05, 0.00013440847396850586, 0.0001783818006515503, 0.00022235512733459473, 0.00026632845401763916, 0.0003103017807006836, 0.00035427510738372803, 0.00039824843406677246, 0.0004422217607498169, 0.00048619508743286133, 0.0005301684141159058, 0.0005741417407989502, 0.0006181150674819946, 0.0006620883941650391, 0.0007060617208480835, 0.0007500350475311279, 0.0007940083742141724, 0.0008379817008972168, 0.0008819550275802612, 0.0009259283542633057, 0.0009699016809463501, 0.0010138750076293945, 0.001057848334312439, 0.0011018216609954834, 0.0011457949876785278, 0.0011897683143615723, 0.0012337416410446167, 0.0012777149677276611, 0.0013216882944107056, 0.00136566162109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 18.0, 13.0, 23.0, 34.0, 42.0, 84.0, 112.0, 186.0, 321.0, 607.0, 1112.0, 2374.0, 5740.0, 17261.0, 80469.0, 839659.0, 73760.0, 16323.0, 5578.0, 2316.0, 1107.0, 579.0, 319.0, 182.0, 108.0, 57.0, 54.0, 38.0, 17.0, 15.0, 6.0, 9.0, 8.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.06418418884277344, -0.062145233154296875, -0.06010627746582031, -0.05806732177734375, -0.05602836608886719, -0.053989410400390625, -0.05195045471191406, -0.0499114990234375, -0.04787254333496094, -0.045833587646484375, -0.04379463195800781, -0.04175567626953125, -0.03971672058105469, -0.037677764892578125, -0.03563880920410156, -0.033599853515625, -0.03156089782714844, -0.029521942138671875, -0.027482986450195312, -0.02544403076171875, -0.023405075073242188, -0.021366119384765625, -0.019327163696289062, -0.0172882080078125, -0.015249252319335938, -0.013210296630859375, -0.011171340942382812, -0.00913238525390625, -0.0070934295654296875, -0.005054473876953125, -0.0030155181884765625, -0.0009765625, 0.0010623931884765625, 0.003101348876953125, 0.0051403045654296875, 0.00717926025390625, 0.009218215942382812, 0.011257171630859375, 0.013296127319335938, 0.0153350830078125, 0.017374038696289062, 0.019412994384765625, 0.021451950073242188, 0.02349090576171875, 0.025529861450195312, 0.027568817138671875, 0.029607772827148438, 0.031646728515625, 0.03368568420410156, 0.035724639892578125, 0.03776359558105469, 0.03980255126953125, 0.04184150695800781, 0.043880462646484375, 0.04591941833496094, 0.0479583740234375, 0.04999732971191406, 0.052036285400390625, 0.05407524108886719, 0.05611419677734375, 0.05815315246582031, 0.060192108154296875, 0.06223106384277344, 0.06427001953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 14.0, 13.0, 10.0, 15.0, 13.0, 28.0, 29.0, 47.0, 69.0, 104.0, 274.0, 107.0, 67.0, 57.0, 27.0, 16.0, 27.0, 13.0, 8.0, 11.0, 8.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041656494140625, -0.040377140045166016, -0.03909778594970703, -0.03781843185424805, -0.03653907775878906, -0.03525972366333008, -0.033980369567871094, -0.03270101547241211, -0.031421661376953125, -0.03014230728149414, -0.028862953186035156, -0.027583599090576172, -0.026304244995117188, -0.025024890899658203, -0.02374553680419922, -0.022466182708740234, -0.02118682861328125, -0.019907474517822266, -0.01862812042236328, -0.017348766326904297, -0.016069412231445312, -0.014790058135986328, -0.013510704040527344, -0.01223134994506836, -0.010951995849609375, -0.00967264175415039, -0.008393287658691406, -0.007113933563232422, -0.0058345794677734375, -0.004555225372314453, -0.0032758712768554688, -0.0019965171813964844, -0.0007171630859375, 0.0005621910095214844, 0.0018415451049804688, 0.003120899200439453, 0.0044002532958984375, 0.005679607391357422, 0.006958961486816406, 0.00823831558227539, 0.009517669677734375, 0.01079702377319336, 0.012076377868652344, 0.013355731964111328, 0.014635086059570312, 0.015914440155029297, 0.01719379425048828, 0.018473148345947266, 0.01975250244140625, 0.021031856536865234, 0.02231121063232422, 0.023590564727783203, 0.024869918823242188, 0.026149272918701172, 0.027428627014160156, 0.02870798110961914, 0.029987335205078125, 0.03126668930053711, 0.032546043395996094, 0.03382539749145508, 0.03510475158691406, 0.03638410568237305, 0.03766345977783203, 0.038942813873291016, 0.04022216796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 29.0, 141.0, 557.0, 169.0, 53.0, 12.0, 10.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0424519777297974, -1.0166871547698975, -0.9909223914146423, -0.9651575684547424, -0.9393928050994873, -0.9136279821395874, -0.8878631591796875, -0.8620983362197876, -0.8363335728645325, -0.8105687499046326, -0.7848039865493774, -0.7590391635894775, -0.7332743406295776, -0.7075095772743225, -0.6817447543144226, -0.6559799909591675, -0.6302151679992676, -0.6044503450393677, -0.5786855816841125, -0.5529207587242126, -0.5271559953689575, -0.5013911724090576, -0.4756263494491577, -0.4498615562915802, -0.4240967631340027, -0.39833196997642517, -0.37256717681884766, -0.34680235385894775, -0.32103756070137024, -0.2952727675437927, -0.2695079445838928, -0.2437431514263153, -0.21797829866409302, -0.1922135055065155, -0.1664486974477768, -0.14068388938903809, -0.11491909623146057, -0.08915430307388306, -0.06338949501514435, -0.03762468695640564, -0.011859893798828125, 0.013904906809329987, 0.0396697074174881, 0.06543450802564621, 0.09119930863380432, 0.11696410179138184, 0.14272890985012054, 0.16849371790885925, 0.19425851106643677, 0.22002330422401428, 0.245788112282753, 0.2715529203414917, 0.2973177134990692, 0.32308250665664673, 0.34884732961654663, 0.37461212277412415, 0.40037691593170166, 0.4261417090892792, 0.4519065022468567, 0.4776713252067566, 0.5034360885620117, 0.5292009115219116, 0.5549657344818115, 0.5807305574417114, 0.6064953207969666]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 7.0, 9.0, 13.0, 8.0, 23.0, 32.0, 54.0, 100.0, 105.0, 128.0, 132.0, 116.0, 77.0, 64.0, 30.0, 21.0, 13.0, 14.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3502047061920166, -0.34066644310951233, -0.33112815022468567, -0.3215898871421814, -0.3120516240596771, -0.30251336097717285, -0.2929750680923462, -0.2834368050098419, -0.27389854192733765, -0.2643602788448334, -0.2548219859600067, -0.24528372287750244, -0.23574545979499817, -0.2262071818113327, -0.21666890382766724, -0.20713064074516296, -0.1975923478603363, -0.18805406987667084, -0.17851580679416656, -0.1689775288105011, -0.15943926572799683, -0.14990098774433136, -0.1403627097606659, -0.13082444667816162, -0.12128616869449615, -0.11174789816141129, -0.10220962762832642, -0.09267134964466095, -0.08313307911157608, -0.07359480857849121, -0.06405653059482574, -0.054518260061740875, -0.044979989528656006, -0.035441718995571136, -0.02590344473719597, -0.01636517234146595, -0.006826899945735931, 0.002711370587348938, 0.012249644845724106, 0.021787919104099274, 0.03132618963718414, 0.04086446017026901, 0.05040273442864418, 0.05994100868701935, 0.06947927922010422, 0.07901754975318909, 0.08855582773685455, 0.09809409826993942, 0.10763236880302429, 0.11717063933610916, 0.12670890986919403, 0.1362471878528595, 0.14578545093536377, 0.15532372891902924, 0.1648620069026947, 0.17440026998519897, 0.18393854796886444, 0.1934768259525299, 0.20301508903503418, 0.21255336701869965, 0.2220916450023651, 0.23162990808486938, 0.24116818606853485, 0.2507064640522003, 0.2602447271347046]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 8.0, 17.0, 18.0, 25.0, 29.0, 58.0, 133.0, 949.0, 27346.0, 4160409.0, 4832.0, 215.0, 63.0, 32.0, 15.0, 24.0, 14.0, 12.0, 5.0, 9.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.49761962890625, -2.4268798828125, -2.35614013671875, -2.285400390625, -2.21466064453125, -2.1439208984375, -2.07318115234375, -2.00244140625, -1.93170166015625, -1.8609619140625, -1.79022216796875, -1.719482421875, -1.64874267578125, -1.5780029296875, -1.50726318359375, -1.4365234375, -1.36578369140625, -1.2950439453125, -1.22430419921875, -1.153564453125, -1.08282470703125, -1.0120849609375, -0.94134521484375, -0.87060546875, -0.79986572265625, -0.7291259765625, -0.65838623046875, -0.587646484375, -0.51690673828125, -0.4461669921875, -0.37542724609375, -0.3046875, -0.23394775390625, -0.1632080078125, -0.09246826171875, -0.021728515625, 0.04901123046875, 0.1197509765625, 0.19049072265625, 0.26123046875, 0.33197021484375, 0.4027099609375, 0.47344970703125, 0.544189453125, 0.61492919921875, 0.6856689453125, 0.75640869140625, 0.8271484375, 0.89788818359375, 0.9686279296875, 1.03936767578125, 1.110107421875, 1.18084716796875, 1.2515869140625, 1.32232666015625, 1.39306640625, 1.46380615234375, 1.5345458984375, 1.60528564453125, 1.676025390625, 1.74676513671875, 1.8175048828125, 1.88824462890625, 1.958984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 11.0, 9.0, 12.0, 12.0, 13.0, 29.0, 58.0, 121.0, 252.0, 198.0, 144.0, 53.0, 27.0, 14.0, 14.0, 6.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.005809783935546875, -0.005685657262802124, -0.005561530590057373, -0.005437403917312622, -0.005313277244567871, -0.00518915057182312, -0.005065023899078369, -0.004940897226333618, -0.004816770553588867, -0.004692643880844116, -0.004568517208099365, -0.004444390535354614, -0.004320263862609863, -0.004196137189865112, -0.004072010517120361, -0.00394788384437561, -0.0038237571716308594, -0.0036996304988861084, -0.0035755038261413574, -0.0034513771533966064, -0.0033272504806518555, -0.0032031238079071045, -0.0030789971351623535, -0.0029548704624176025, -0.0028307437896728516, -0.0027066171169281006, -0.0025824904441833496, -0.0024583637714385986, -0.0023342370986938477, -0.0022101104259490967, -0.0020859837532043457, -0.0019618570804595947, -0.0018377304077148438, -0.0017136037349700928, -0.0015894770622253418, -0.0014653503894805908, -0.0013412237167358398, -0.0012170970439910889, -0.0010929703712463379, -0.0009688436985015869, -0.0008447170257568359, -0.000720590353012085, -0.000596463680267334, -0.000472337007522583, -0.00034821033477783203, -0.00022408366203308105, -9.995698928833008e-05, 2.41696834564209e-05, 0.00014829635620117188, 0.00027242302894592285, 0.00039654970169067383, 0.0005206763744354248, 0.0006448030471801758, 0.0007689297199249268, 0.0008930563926696777, 0.0010171830654144287, 0.0011413097381591797, 0.0012654364109039307, 0.0013895630836486816, 0.0015136897563934326, 0.0016378164291381836, 0.0017619431018829346, 0.0018860697746276855, 0.0020101964473724365, 0.0021343231201171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 5.0, 5.0, 5.0, 9.0, 21.0, 17.0, 20.0, 29.0, 39.0, 42.0, 57.0, 84.0, 89.0, 142.0, 243.0, 1657.0, 4059588.0, 130466.0, 893.0, 210.0, 118.0, 95.0, 91.0, 84.0, 67.0, 46.0, 42.0, 25.0, 24.0, 11.0, 12.0, 11.0, 7.0, 7.0, 7.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.4951896667480469, -0.48012542724609375, -0.4650611877441406, -0.4499969482421875, -0.4349327087402344, -0.41986846923828125, -0.4048042297363281, -0.389739990234375, -0.3746757507324219, -0.35961151123046875, -0.3445472717285156, -0.3294830322265625, -0.3144187927246094, -0.29935455322265625, -0.2842903137207031, -0.26922607421875, -0.2541618347167969, -0.23909759521484375, -0.22403335571289062, -0.2089691162109375, -0.19390487670898438, -0.17884063720703125, -0.16377639770507812, -0.148712158203125, -0.13364791870117188, -0.11858367919921875, -0.10351943969726562, -0.0884552001953125, -0.07339096069335938, -0.05832672119140625, -0.043262481689453125, -0.0281982421875, -0.013134002685546875, 0.00193023681640625, 0.016994476318359375, 0.0320587158203125, 0.047122955322265625, 0.06218719482421875, 0.07725143432617188, 0.092315673828125, 0.10737991333007812, 0.12244415283203125, 0.13750839233398438, 0.1525726318359375, 0.16763687133789062, 0.18270111083984375, 0.19776535034179688, 0.21282958984375, 0.22789382934570312, 0.24295806884765625, 0.2580223083496094, 0.2730865478515625, 0.2881507873535156, 0.30321502685546875, 0.3182792663574219, 0.333343505859375, 0.3484077453613281, 0.36347198486328125, 0.3785362243652344, 0.3936004638671875, 0.4086647033691406, 0.42372894287109375, 0.4387931823730469, 0.453857421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 12.0, 6.0, 7.0, 13.0, 10.0, 14.0, 25.0, 33.0, 43.0, 54.0, 79.0, 76.0, 138.0, 173.0, 289.0, 520.0, 1288.0, 347.0, 205.0, 163.0, 127.0, 114.0, 68.0, 66.0, 44.0, 29.0, 21.0, 19.0, 18.0, 17.0, 5.0, 12.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0051727294921875, -0.005016624927520752, -0.004860520362854004, -0.004704415798187256, -0.004548311233520508, -0.00439220666885376, -0.004236102104187012, -0.004079997539520264, -0.003923892974853516, -0.0037677884101867676, -0.0036116838455200195, -0.0034555792808532715, -0.0032994747161865234, -0.0031433701515197754, -0.0029872655868530273, -0.0028311610221862793, -0.0026750564575195312, -0.002518951892852783, -0.002362847328186035, -0.002206742763519287, -0.002050638198852539, -0.001894533634185791, -0.001738429069519043, -0.001582324504852295, -0.0014262199401855469, -0.0012701153755187988, -0.0011140108108520508, -0.0009579062461853027, -0.0008018016815185547, -0.0006456971168518066, -0.0004895925521850586, -0.00033348798751831055, -0.0001773834228515625, -2.1278858184814453e-05, 0.0001348257064819336, 0.00029093027114868164, 0.0004470348358154297, 0.0006031394004821777, 0.0007592439651489258, 0.0009153485298156738, 0.0010714530944824219, 0.00122755765914917, 0.001383662223815918, 0.001539766788482666, 0.001695871353149414, 0.0018519759178161621, 0.00200808048248291, 0.002164185047149658, 0.0023202896118164062, 0.0024763941764831543, 0.0026324987411499023, 0.0027886033058166504, 0.0029447078704833984, 0.0031008124351501465, 0.0032569169998168945, 0.0034130215644836426, 0.0035691261291503906, 0.0037252306938171387, 0.0038813352584838867, 0.004037439823150635, 0.004193544387817383, 0.004349648952484131, 0.004505753517150879, 0.004661858081817627, 0.004817962646484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 8.0, 130.0, 810.0, 58.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10178752988576889, -0.08207255601882935, -0.0623575821518898, -0.042642608284950256, -0.02292763441801071, -0.003212660551071167, 0.016502313315868378, 0.036217279732227325, 0.05593226104974747, 0.07564723491668701, 0.09536220878362656, 0.1150771826505661, 0.13479214906692505, 0.1545071303844452, 0.17422211170196533, 0.19393706321716309, 0.21365204453468323, 0.23336702585220337, 0.2530819773674011, 0.27279695868492126, 0.2925119400024414, 0.31222692131996155, 0.3319419026374817, 0.35165685415267944, 0.3713718354701996, 0.3910868167877197, 0.4108017683029175, 0.4305167496204376, 0.45023173093795776, 0.4699467122554779, 0.48966169357299805, 0.5093766450881958, 0.5290915966033936, 0.5488065481185913, 0.5685215592384338, 0.5882365107536316, 0.6079515218734741, 0.6276664733886719, 0.6473814249038696, 0.6670963764190674, 0.6868113875389099, 0.7065263390541077, 0.7262413501739502, 0.745956301689148, 0.7656712532043457, 0.7853862643241882, 0.805101215839386, 0.8248162269592285, 0.8445311784744263, 0.864246129989624, 0.8839611411094666, 0.9036760926246643, 0.9233911037445068, 0.9431060552597046, 0.9628210067749023, 0.9825359582901001, 1.0022509098052979, 1.0219658613204956, 1.0416808128356934, 1.0613958835601807, 1.0811108350753784, 1.1008257865905762, 1.120540738105774, 1.1402556896209717, 1.159970760345459]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 14.0, 20.0, 32.0, 50.0, 51.0, 78.0, 101.0, 112.0, 89.0, 104.0, 96.0, 85.0, 55.0, 41.0, 24.0, 15.0, 13.0, 6.0, 4.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04989194869995117, -0.04710703343153, -0.04432211443781853, -0.041537195444107056, -0.03875228017568588, -0.03596736490726471, -0.03318244591355324, -0.030397528782486916, -0.027612611651420593, -0.02482769452035427, -0.02204277738928795, -0.019257860258221626, -0.016472943127155304, -0.013688025996088982, -0.01090310886502266, -0.008118191733956337, -0.005333274602890015, -0.0025483574718236923, 0.00023655965924263, 0.0030214767903089523, 0.005806393921375275, 0.008591311052441597, 0.01137622818350792, 0.014161145314574242, 0.016946062445640564, 0.019730979576706886, 0.02251589670777321, 0.02530081383883953, 0.028085730969905853, 0.030870648100972176, 0.0336555652320385, 0.03644048422574997, 0.03922539949417114, 0.042010314762592316, 0.04479523375630379, 0.04758015275001526, 0.05036506801843643, 0.053149983286857605, 0.05593490228056908, 0.05871982127428055, 0.06150473654270172, 0.0642896518111229, 0.06707456707954407, 0.06985948979854584, 0.07264440506696701, 0.07542932033538818, 0.07821424305438995, 0.08099915832281113, 0.0837840735912323, 0.08656898885965347, 0.08935390412807465, 0.09213882684707642, 0.09492374211549759, 0.09770865738391876, 0.10049358010292053, 0.1032784953713417, 0.10606341063976288, 0.10884832590818405, 0.11163324117660522, 0.114418163895607, 0.11720307916402817, 0.11998799443244934, 0.12277291715145111, 0.1255578249692917, 0.12834274768829346]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 7.0, 8.0, 8.0, 1.0, 7.0, 10.0, 16.0, 20.0, 19.0, 17.0, 40.0, 54.0, 90.0, 159.0, 324.0, 619.0, 1258.0, 2751.0, 6437.0, 20102.0, 154438.0, 787852.0, 53820.0, 12113.0, 4324.0, 1978.0, 949.0, 472.0, 219.0, 135.0, 69.0, 49.0, 47.0, 26.0, 23.0, 18.0, 16.0, 8.0, 11.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.051788330078125, -0.05018472671508789, -0.04858112335205078, -0.04697751998901367, -0.04537391662597656, -0.04377031326293945, -0.042166709899902344, -0.040563106536865234, -0.038959503173828125, -0.037355899810791016, -0.035752296447753906, -0.0341486930847168, -0.03254508972167969, -0.030941486358642578, -0.02933788299560547, -0.02773427963256836, -0.02613067626953125, -0.02452707290649414, -0.02292346954345703, -0.021319866180419922, -0.019716262817382812, -0.018112659454345703, -0.016509056091308594, -0.014905452728271484, -0.013301849365234375, -0.011698246002197266, -0.010094642639160156, -0.008491039276123047, -0.0068874359130859375, -0.005283832550048828, -0.0036802291870117188, -0.0020766258239746094, -0.0004730224609375, 0.0011305809020996094, 0.0027341842651367188, 0.004337787628173828, 0.0059413909912109375, 0.007544994354248047, 0.009148597717285156, 0.010752201080322266, 0.012355804443359375, 0.013959407806396484, 0.015563011169433594, 0.017166614532470703, 0.018770217895507812, 0.020373821258544922, 0.02197742462158203, 0.02358102798461914, 0.02518463134765625, 0.02678823471069336, 0.02839183807373047, 0.029995441436767578, 0.03159904479980469, 0.0332026481628418, 0.034806251525878906, 0.036409854888916016, 0.038013458251953125, 0.039617061614990234, 0.041220664978027344, 0.04282426834106445, 0.04442787170410156, 0.04603147506713867, 0.04763507843017578, 0.04923868179321289, 0.05084228515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 10.0, 13.0, 15.0, 37.0, 66.0, 185.0, 233.0, 219.0, 115.0, 50.0, 27.0, 14.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00316619873046875, -0.0029876232147216797, -0.0028090476989746094, -0.002630472183227539, -0.0024518966674804688, -0.0022733211517333984, -0.002094745635986328, -0.0019161701202392578, -0.0017375946044921875, -0.0015590190887451172, -0.0013804435729980469, -0.0012018680572509766, -0.0010232925415039062, -0.0008447170257568359, -0.0006661415100097656, -0.0004875659942626953, -0.000308990478515625, -0.0001304149627685547, 4.8160552978515625e-05, 0.00022673606872558594, 0.00040531158447265625, 0.0005838871002197266, 0.0007624626159667969, 0.0009410381317138672, 0.0011196136474609375, 0.0012981891632080078, 0.0014767646789550781, 0.0016553401947021484, 0.0018339157104492188, 0.002012491226196289, 0.0021910667419433594, 0.0023696422576904297, 0.0025482177734375, 0.0027267932891845703, 0.0029053688049316406, 0.003083944320678711, 0.0032625198364257812, 0.0034410953521728516, 0.003619670867919922, 0.003798246383666992, 0.0039768218994140625, 0.004155397415161133, 0.004333972930908203, 0.0045125484466552734, 0.004691123962402344, 0.004869699478149414, 0.005048274993896484, 0.005226850509643555, 0.005405426025390625, 0.005584001541137695, 0.005762577056884766, 0.005941152572631836, 0.006119728088378906, 0.0062983036041259766, 0.006476879119873047, 0.006655454635620117, 0.0068340301513671875, 0.007012605667114258, 0.007191181182861328, 0.0073697566986083984, 0.007548332214355469, 0.007726907730102539, 0.00790548324584961, 0.00808405876159668, 0.00826263427734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 11.0, 13.0, 16.0, 11.0, 17.0, 24.0, 31.0, 27.0, 44.0, 61.0, 142.0, 375.0, 2037.0, 21600.0, 834700.0, 180876.0, 7059.0, 889.0, 237.0, 80.0, 55.0, 33.0, 38.0, 21.0, 13.0, 17.0, 21.0, 11.0, 12.0, 7.0, 11.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0], "bins": [-0.08465576171875, -0.0824732780456543, -0.0802907943725586, -0.07810831069946289, -0.07592582702636719, -0.07374334335327148, -0.07156085968017578, -0.06937837600708008, -0.06719589233398438, -0.06501340866088867, -0.06283092498779297, -0.060648441314697266, -0.05846595764160156, -0.05628347396850586, -0.054100990295410156, -0.05191850662231445, -0.04973602294921875, -0.04755353927612305, -0.045371055603027344, -0.04318857192993164, -0.04100608825683594, -0.038823604583740234, -0.03664112091064453, -0.03445863723754883, -0.032276153564453125, -0.030093669891357422, -0.02791118621826172, -0.025728702545166016, -0.023546218872070312, -0.02136373519897461, -0.019181251525878906, -0.016998767852783203, -0.0148162841796875, -0.012633800506591797, -0.010451316833496094, -0.00826883316040039, -0.0060863494873046875, -0.0039038658142089844, -0.0017213821411132812, 0.0004611015319824219, 0.002643585205078125, 0.004826068878173828, 0.007008552551269531, 0.009191036224365234, 0.011373519897460938, 0.01355600357055664, 0.015738487243652344, 0.017920970916748047, 0.02010345458984375, 0.022285938262939453, 0.024468421936035156, 0.02665090560913086, 0.028833389282226562, 0.031015872955322266, 0.03319835662841797, 0.03538084030151367, 0.037563323974609375, 0.03974580764770508, 0.04192829132080078, 0.044110774993896484, 0.04629325866699219, 0.04847574234008789, 0.050658226013183594, 0.0528407096862793, 0.055023193359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 12.0, 10.0, 9.0, 14.0, 6.0, 12.0, 15.0, 19.0, 28.0, 22.0, 26.0, 28.0, 39.0, 52.0, 32.0, 42.0, 40.0, 49.0, 44.0, 52.0, 43.0, 45.0, 46.0, 45.0, 37.0, 28.0, 26.0, 24.0, 24.0, 21.0, 23.0, 18.0, 9.0, 9.0, 12.0, 7.0, 10.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0099945068359375, -0.00970447063446045, -0.009414434432983398, -0.009124398231506348, -0.008834362030029297, -0.008544325828552246, -0.008254289627075195, -0.007964253425598145, -0.007674217224121094, -0.007384181022644043, -0.007094144821166992, -0.006804108619689941, -0.006514072418212891, -0.00622403621673584, -0.005934000015258789, -0.005643963813781738, -0.0053539276123046875, -0.005063891410827637, -0.004773855209350586, -0.004483819007873535, -0.004193782806396484, -0.0039037466049194336, -0.003613710403442383, -0.003323674201965332, -0.0030336380004882812, -0.0027436017990112305, -0.0024535655975341797, -0.002163529396057129, -0.0018734931945800781, -0.0015834569931030273, -0.0012934207916259766, -0.0010033845901489258, -0.000713348388671875, -0.0004233121871948242, -0.00013327598571777344, 0.00015676021575927734, 0.0004467964172363281, 0.0007368326187133789, 0.0010268688201904297, 0.0013169050216674805, 0.0016069412231445312, 0.001896977424621582, 0.002187013626098633, 0.0024770498275756836, 0.0027670860290527344, 0.003057122230529785, 0.003347158432006836, 0.0036371946334838867, 0.0039272308349609375, 0.004217267036437988, 0.004507303237915039, 0.00479733943939209, 0.005087375640869141, 0.005377411842346191, 0.005667448043823242, 0.005957484245300293, 0.006247520446777344, 0.0065375566482543945, 0.006827592849731445, 0.007117629051208496, 0.007407665252685547, 0.007697701454162598, 0.007987737655639648, 0.0082777738571167, 0.00856781005859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 8.0, 7.0, 6.0, 7.0, 9.0, 13.0, 16.0, 17.0, 37.0, 132.0, 753.0, 17768.0, 1024926.0, 4220.0, 405.0, 100.0, 27.0, 14.0, 16.0, 10.0, 8.0, 6.0, 13.0, 6.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.240966796875, -0.2337360382080078, -0.22650527954101562, -0.21927452087402344, -0.21204376220703125, -0.20481300354003906, -0.19758224487304688, -0.1903514862060547, -0.1831207275390625, -0.1758899688720703, -0.16865921020507812, -0.16142845153808594, -0.15419769287109375, -0.14696693420410156, -0.13973617553710938, -0.1325054168701172, -0.125274658203125, -0.11804389953613281, -0.11081314086914062, -0.10358238220214844, -0.09635162353515625, -0.08912086486816406, -0.08189010620117188, -0.07465934753417969, -0.0674285888671875, -0.06019783020019531, -0.052967071533203125, -0.04573631286621094, -0.03850555419921875, -0.03127479553222656, -0.024044036865234375, -0.016813278198242188, -0.00958251953125, -0.0023517608642578125, 0.004878997802734375, 0.012109756469726562, 0.01934051513671875, 0.026571273803710938, 0.033802032470703125, 0.04103279113769531, 0.0482635498046875, 0.05549430847167969, 0.06272506713867188, 0.06995582580566406, 0.07718658447265625, 0.08441734313964844, 0.09164810180664062, 0.09887886047363281, 0.106109619140625, 0.11334037780761719, 0.12057113647460938, 0.12780189514160156, 0.13503265380859375, 0.14226341247558594, 0.14949417114257812, 0.1567249298095703, 0.1639556884765625, 0.1711864471435547, 0.17841720581054688, 0.18564796447753906, 0.19287872314453125, 0.20010948181152344, 0.20734024047851562, 0.2145709991455078, 0.2218017578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 11.0, 12.0, 8.0, 9.0, 14.0, 25.0, 16.0, 22.0, 25.0, 375.0, 370.0, 22.0, 15.0, 17.0, 7.0, 7.0, 3.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014333724975585938, -0.0013839006423950195, -0.0013344287872314453, -0.001284956932067871, -0.0012354850769042969, -0.0011860132217407227, -0.0011365413665771484, -0.0010870695114135742, -0.00103759765625, -0.0009881258010864258, -0.0009386539459228516, -0.0008891820907592773, -0.0008397102355957031, -0.0007902383804321289, -0.0007407665252685547, -0.0006912946701049805, -0.0006418228149414062, -0.000592350959777832, -0.0005428791046142578, -0.0004934072494506836, -0.0004439353942871094, -0.00039446353912353516, -0.00034499168395996094, -0.0002955198287963867, -0.0002460479736328125, -0.00019657611846923828, -0.00014710426330566406, -9.763240814208984e-05, -4.8160552978515625e-05, 1.3113021850585938e-06, 5.078315734863281e-05, 0.00010025501251220703, 0.00014972686767578125, 0.00019919872283935547, 0.0002486705780029297, 0.0002981424331665039, 0.0003476142883300781, 0.00039708614349365234, 0.00044655799865722656, 0.0004960298538208008, 0.000545501708984375, 0.0005949735641479492, 0.0006444454193115234, 0.0006939172744750977, 0.0007433891296386719, 0.0007928609848022461, 0.0008423328399658203, 0.0008918046951293945, 0.0009412765502929688, 0.000990748405456543, 0.0010402202606201172, 0.0010896921157836914, 0.0011391639709472656, 0.0011886358261108398, 0.001238107681274414, 0.0012875795364379883, 0.0013370513916015625, 0.0013865232467651367, 0.001435995101928711, 0.0014854669570922852, 0.0015349388122558594, 0.0015844106674194336, 0.0016338825225830078, 0.001683354377746582, 0.0017328262329101562]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 11.0, 10.0, 25.0, 52.0, 139.0, 389.0, 1713.0, 40684.0, 995399.0, 8742.0, 916.0, 247.0, 112.0, 45.0, 23.0, 11.0, 12.0, 6.0, 3.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1424560546875, -0.1379070281982422, -0.13335800170898438, -0.12880897521972656, -0.12425994873046875, -0.11971092224121094, -0.11516189575195312, -0.11061286926269531, -0.1060638427734375, -0.10151481628417969, -0.09696578979492188, -0.09241676330566406, -0.08786773681640625, -0.08331871032714844, -0.07876968383789062, -0.07422065734863281, -0.069671630859375, -0.06512260437011719, -0.060573577880859375, -0.05602455139160156, -0.05147552490234375, -0.04692649841308594, -0.042377471923828125, -0.03782844543457031, -0.0332794189453125, -0.028730392456054688, -0.024181365966796875, -0.019632339477539062, -0.01508331298828125, -0.010534286499023438, -0.005985260009765625, -0.0014362335205078125, 0.00311279296875, 0.0076618194580078125, 0.012210845947265625, 0.016759872436523438, 0.02130889892578125, 0.025857925415039062, 0.030406951904296875, 0.03495597839355469, 0.0395050048828125, 0.04405403137207031, 0.048603057861328125, 0.05315208435058594, 0.05770111083984375, 0.06225013732910156, 0.06679916381835938, 0.07134819030761719, 0.075897216796875, 0.08044624328613281, 0.08499526977539062, 0.08954429626464844, 0.09409332275390625, 0.09864234924316406, 0.10319137573242188, 0.10774040222167969, 0.1122894287109375, 0.11683845520019531, 0.12138748168945312, 0.12593650817871094, 0.13048553466796875, 0.13503456115722656, 0.13958358764648438, 0.1441326141357422, 0.148681640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 7.0, 18.0, 22.0, 20.0, 43.0, 53.0, 90.0, 277.0, 197.0, 79.0, 62.0, 41.0, 26.0, 18.0, 13.0, 10.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024139404296875, -0.023126602172851562, -0.022113800048828125, -0.021100997924804688, -0.02008819580078125, -0.019075393676757812, -0.018062591552734375, -0.017049789428710938, -0.0160369873046875, -0.015024185180664062, -0.014011383056640625, -0.012998580932617188, -0.01198577880859375, -0.010972976684570312, -0.009960174560546875, -0.008947372436523438, -0.0079345703125, -0.0069217681884765625, -0.005908966064453125, -0.0048961639404296875, -0.00388336181640625, -0.0028705596923828125, -0.001857757568359375, -0.0008449554443359375, 0.0001678466796875, 0.0011806488037109375, 0.002193450927734375, 0.0032062530517578125, 0.00421905517578125, 0.0052318572998046875, 0.006244659423828125, 0.0072574615478515625, 0.008270263671875, 0.009283065795898438, 0.010295867919921875, 0.011308670043945312, 0.01232147216796875, 0.013334274291992188, 0.014347076416015625, 0.015359878540039062, 0.0163726806640625, 0.017385482788085938, 0.018398284912109375, 0.019411087036132812, 0.02042388916015625, 0.021436691284179688, 0.022449493408203125, 0.023462295532226562, 0.02447509765625, 0.025487899780273438, 0.026500701904296875, 0.027513504028320312, 0.02852630615234375, 0.029539108276367188, 0.030551910400390625, 0.03156471252441406, 0.0325775146484375, 0.03359031677246094, 0.034603118896484375, 0.03561592102050781, 0.03662872314453125, 0.03764152526855469, 0.038654327392578125, 0.03966712951660156, 0.040679931640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 34.0, 401.0, 507.0, 47.0, 12.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6720820069313049, -0.6529055833816528, -0.633729100227356, -0.6145526766777039, -0.595376193523407, -0.5761997699737549, -0.557023286819458, -0.5378468632698059, -0.5186704397201538, -0.4994939863681793, -0.48031753301620483, -0.46114107966423035, -0.44196462631225586, -0.42278820276260376, -0.4036117494106293, -0.3844352960586548, -0.3652588129043579, -0.3460823595523834, -0.32690590620040894, -0.30772945284843445, -0.28855299949645996, -0.26937657594680786, -0.2502001225948334, -0.2310236692428589, -0.2118472158908844, -0.1926707625389099, -0.17349430918693542, -0.15431787073612213, -0.13514141738414764, -0.11596496403217316, -0.09678851813077927, -0.07761207222938538, -0.05843555927276611, -0.039259109646081924, -0.020082660019397736, -0.0009062103927135468, 0.018270239233970642, 0.03744669258594513, 0.05662313848733902, 0.07579958438873291, 0.0949760377407074, 0.11415249109268188, 0.13332894444465637, 0.15250538289546967, 0.17168183624744415, 0.19085828959941864, 0.21003472805023193, 0.22921118140220642, 0.2483876347541809, 0.2675640881061554, 0.2867405414581299, 0.30591699481010437, 0.32509344816207886, 0.34426987171173096, 0.36344632506370544, 0.38262277841567993, 0.4017992317676544, 0.4209756851196289, 0.4401521384716034, 0.4593285918235779, 0.47850501537323, 0.49768149852752686, 0.516857922077179, 0.536034345626831, 0.5552108287811279]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 10.0, 13.0, 15.0, 32.0, 34.0, 51.0, 53.0, 63.0, 82.0, 97.0, 68.0, 89.0, 73.0, 56.0, 53.0, 50.0, 42.0, 22.0, 21.0, 17.0, 13.0, 9.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09995931386947632, -0.09662645310163498, -0.09329359233379364, -0.0899607315659523, -0.08662787079811096, -0.08329501003026962, -0.07996214926242828, -0.07662928849458694, -0.0732964277267456, -0.06996356695890427, -0.06663070619106293, -0.06329784542322159, -0.05996498465538025, -0.05663212388753891, -0.05329926311969757, -0.04996640235185623, -0.04663354158401489, -0.04330068081617355, -0.039967820048332214, -0.036634959280490875, -0.033302098512649536, -0.029969237744808197, -0.026636376976966858, -0.02330351620912552, -0.01997065544128418, -0.01663779467344284, -0.013304933905601501, -0.009972073137760162, -0.006639212369918823, -0.003306351602077484, 2.650916576385498e-05, 0.003359369933605194, 0.006692230701446533, 0.010025091469287872, 0.013357952237129211, 0.01669081300497055, 0.02002367377281189, 0.02335653454065323, 0.026689395308494568, 0.030022256076335907, 0.033355116844177246, 0.036687977612018585, 0.040020838379859924, 0.04335369914770126, 0.0466865599155426, 0.05001942068338394, 0.05335228145122528, 0.05668514221906662, 0.06001800298690796, 0.0633508637547493, 0.06668372452259064, 0.07001658529043198, 0.07334944605827332, 0.07668230682611465, 0.080015167593956, 0.08334802836179733, 0.08668088912963867, 0.09001374989748001, 0.09334661066532135, 0.09667947143316269, 0.10001233220100403, 0.10334519296884537, 0.1066780537366867, 0.11001091450452805, 0.11334377527236938]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 2.0, 4.0, 2.0, 8.0, 10.0, 8.0, 16.0, 8.0, 16.0, 20.0, 12.0, 22.0, 32.0, 39.0, 193.0, 4191515.0, 2010.0, 160.0, 28.0, 28.0, 25.0, 18.0, 20.0, 6.0, 6.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 6.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.6142578125, -1.570343017578125, -1.52642822265625, -1.482513427734375, -1.4385986328125, -1.394683837890625, -1.35076904296875, -1.306854248046875, -1.262939453125, -1.219024658203125, -1.17510986328125, -1.131195068359375, -1.0872802734375, -1.043365478515625, -0.99945068359375, -0.955535888671875, -0.91162109375, -0.867706298828125, -0.82379150390625, -0.779876708984375, -0.7359619140625, -0.692047119140625, -0.64813232421875, -0.604217529296875, -0.560302734375, -0.516387939453125, -0.47247314453125, -0.428558349609375, -0.3846435546875, -0.340728759765625, -0.29681396484375, -0.252899169921875, -0.208984375, -0.165069580078125, -0.12115478515625, -0.077239990234375, -0.0333251953125, 0.010589599609375, 0.05450439453125, 0.098419189453125, 0.142333984375, 0.186248779296875, 0.23016357421875, 0.274078369140625, 0.3179931640625, 0.361907958984375, 0.40582275390625, 0.449737548828125, 0.49365234375, 0.537567138671875, 0.58148193359375, 0.625396728515625, 0.6693115234375, 0.713226318359375, 0.75714111328125, 0.801055908203125, 0.844970703125, 0.888885498046875, 0.93280029296875, 0.976715087890625, 1.0206298828125, 1.064544677734375, 1.10845947265625, 1.152374267578125, 1.1962890625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 13.0, 18.0, 30.0, 62.0, 112.0, 163.0, 176.0, 158.0, 96.0, 79.0, 30.0, 17.0, 17.0, 11.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003265380859375, -0.003126859664916992, -0.0029883384704589844, -0.0028498172760009766, -0.0027112960815429688, -0.002572774887084961, -0.002434253692626953, -0.0022957324981689453, -0.0021572113037109375, -0.0020186901092529297, -0.0018801689147949219, -0.001741647720336914, -0.0016031265258789062, -0.0014646053314208984, -0.0013260841369628906, -0.0011875629425048828, -0.001049041748046875, -0.0009105205535888672, -0.0007719993591308594, -0.0006334781646728516, -0.0004949569702148438, -0.00035643577575683594, -0.00021791458129882812, -7.939338684082031e-05, 5.91278076171875e-05, 0.0001976490020751953, 0.0003361701965332031, 0.00047469139099121094, 0.0006132125854492188, 0.0007517337799072266, 0.0008902549743652344, 0.0010287761688232422, 0.00116729736328125, 0.0013058185577392578, 0.0014443397521972656, 0.0015828609466552734, 0.0017213821411132812, 0.001859903335571289, 0.001998424530029297, 0.0021369457244873047, 0.0022754669189453125, 0.0024139881134033203, 0.002552509307861328, 0.002691030502319336, 0.0028295516967773438, 0.0029680728912353516, 0.0031065940856933594, 0.003245115280151367, 0.003383636474609375, 0.003522157669067383, 0.0036606788635253906, 0.0037992000579833984, 0.003937721252441406, 0.004076242446899414, 0.004214763641357422, 0.00435328483581543, 0.0044918060302734375, 0.004630327224731445, 0.004768848419189453, 0.004907369613647461, 0.005045890808105469, 0.0051844120025634766, 0.005322933197021484, 0.005461454391479492, 0.0055999755859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 9.0, 9.0, 12.0, 21.0, 23.0, 45.0, 81.0, 180.0, 1503.0, 4186945.0, 4973.0, 245.0, 87.0, 68.0, 25.0, 22.0, 9.0, 9.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6930961608886719, -0.6772079467773438, -0.6613197326660156, -0.6454315185546875, -0.6295433044433594, -0.6136550903320312, -0.5977668762207031, -0.581878662109375, -0.5659904479980469, -0.5501022338867188, -0.5342140197753906, -0.5183258056640625, -0.5024375915527344, -0.48654937744140625, -0.4706611633300781, -0.45477294921875, -0.4388847351074219, -0.42299652099609375, -0.4071083068847656, -0.3912200927734375, -0.3753318786621094, -0.35944366455078125, -0.3435554504394531, -0.327667236328125, -0.3117790222167969, -0.29589080810546875, -0.2800025939941406, -0.2641143798828125, -0.24822616577148438, -0.23233795166015625, -0.21644973754882812, -0.2005615234375, -0.18467330932617188, -0.16878509521484375, -0.15289688110351562, -0.1370086669921875, -0.12112045288085938, -0.10523223876953125, -0.08934402465820312, -0.073455810546875, -0.057567596435546875, -0.04167938232421875, -0.025791168212890625, -0.0099029541015625, 0.005985260009765625, 0.02187347412109375, 0.037761688232421875, 0.05364990234375, 0.06953811645507812, 0.08542633056640625, 0.10131454467773438, 0.1172027587890625, 0.13309097290039062, 0.14897918701171875, 0.16486740112304688, 0.180755615234375, 0.19664382934570312, 0.21253204345703125, 0.22842025756835938, 0.2443084716796875, 0.2601966857910156, 0.27608489990234375, 0.2919731140136719, 0.307861328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 12.0, 14.0, 14.0, 30.0, 38.0, 57.0, 139.0, 357.0, 2333.0, 648.0, 189.0, 94.0, 42.0, 27.0, 15.0, 23.0, 7.0, 10.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00911712646484375, -0.008854448795318604, -0.008591771125793457, -0.00832909345626831, -0.008066415786743164, -0.007803738117218018, -0.007541060447692871, -0.007278382778167725, -0.007015705108642578, -0.006753027439117432, -0.006490349769592285, -0.006227672100067139, -0.005964994430541992, -0.005702316761016846, -0.005439639091491699, -0.005176961421966553, -0.004914283752441406, -0.00465160608291626, -0.004388928413391113, -0.004126250743865967, -0.0038635730743408203, -0.003600895404815674, -0.0033382177352905273, -0.003075540065765381, -0.0028128623962402344, -0.002550184726715088, -0.0022875070571899414, -0.002024829387664795, -0.0017621517181396484, -0.001499474048614502, -0.0012367963790893555, -0.000974118709564209, -0.0007114410400390625, -0.000448763370513916, -0.00018608570098876953, 7.659196853637695e-05, 0.00033926963806152344, 0.0006019473075866699, 0.0008646249771118164, 0.0011273026466369629, 0.0013899803161621094, 0.0016526579856872559, 0.0019153356552124023, 0.002178013324737549, 0.0024406909942626953, 0.002703368663787842, 0.0029660463333129883, 0.0032287240028381348, 0.0034914016723632812, 0.0037540793418884277, 0.004016757011413574, 0.004279434680938721, 0.004542112350463867, 0.004804790019989014, 0.00506746768951416, 0.005330145359039307, 0.005592823028564453, 0.0058555006980896, 0.006118178367614746, 0.006380856037139893, 0.006643533706665039, 0.0069062113761901855, 0.007168889045715332, 0.0074315667152404785, 0.007694244384765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1008.0, 7.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7073004245758057, -1.6781212091445923, -1.648941993713379, -1.619762659072876, -1.5905834436416626, -1.5614042282104492, -1.5322248935699463, -1.503045678138733, -1.4738664627075195, -1.4446872472763062, -1.4155080318450928, -1.3863286972045898, -1.3571494817733765, -1.327970266342163, -1.2987909317016602, -1.2696117162704468, -1.2404325008392334, -1.21125328540802, -1.1820740699768066, -1.1528947353363037, -1.1237155199050903, -1.094536304473877, -1.065356969833374, -1.0361777544021606, -1.0069985389709473, -0.9778193235397339, -0.9486400485038757, -0.9194607734680176, -0.8902815580368042, -0.8611023426055908, -0.8319230675697327, -0.8027437925338745, -0.7735645174980164, -0.7443852424621582, -0.7152060270309448, -0.6860268115997314, -0.6568475365638733, -0.6276682615280151, -0.5984890460968018, -0.5693098306655884, -0.5401305556297302, -0.5109512805938721, -0.4817720651626587, -0.4525928199291229, -0.42341357469558716, -0.3942343294620514, -0.3650550842285156, -0.33587583899497986, -0.3066965937614441, -0.2775173485279083, -0.24833810329437256, -0.2191588580608368, -0.18997961282730103, -0.16080036759376526, -0.1316211223602295, -0.10244187712669373, -0.07326263189315796, -0.04408338665962219, -0.014904141426086426, 0.01427510380744934, 0.04345434904098511, 0.07263359427452087, 0.10181283950805664, 0.1309920847415924, 0.16017132997512817]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 11.0, 24.0, 28.0, 48.0, 77.0, 86.0, 122.0, 116.0, 118.0, 121.0, 83.0, 60.0, 37.0, 29.0, 13.0, 9.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0659530758857727, -0.06450649350881577, -0.06305990368127823, -0.06161332130432129, -0.06016673520207405, -0.05872014909982681, -0.05727356672286987, -0.055826980620622635, -0.0543803945183754, -0.05293380841612816, -0.05148722231388092, -0.05004063993692398, -0.04859405383467674, -0.047147467732429504, -0.045700885355472565, -0.04425429925322533, -0.04280771315097809, -0.04136112704873085, -0.03991454094648361, -0.03846795856952667, -0.037021372467279434, -0.035574786365032196, -0.034128203988075256, -0.03268161788582802, -0.03123503178358078, -0.029788445681333542, -0.028341861441731453, -0.026895277202129364, -0.025448691099882126, -0.024002104997634888, -0.0225555207580328, -0.02110893651843071, -0.01966235041618347, -0.018215764313936234, -0.016769180074334145, -0.015322594903409481, -0.013876009732484818, -0.012429424561560154, -0.01098283939063549, -0.009536254219710827, -0.008089669048786163, -0.0066430838778615, -0.005196498706936836, -0.0037499135360121727, -0.002303328365087509, -0.0008567431941628456, 0.0005898419767618179, 0.0020364271476864815, 0.003483012318611145, 0.0049295974895358086, 0.006376182660460472, 0.007822767831385136, 0.0092693530023098, 0.010715938173234463, 0.012162523344159126, 0.01360910851508379, 0.015055693686008453, 0.01650227978825569, 0.01794886402785778, 0.01939544826745987, 0.020842034369707108, 0.022288620471954346, 0.023735204711556435, 0.025181788951158524, 0.02662837505340576]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 7.0, 13.0, 5.0, 11.0, 8.0, 16.0, 21.0, 36.0, 33.0, 49.0, 55.0, 94.0, 308.0, 4936.0, 877870.0, 162880.0, 1689.0, 183.0, 67.0, 57.0, 44.0, 41.0, 24.0, 16.0, 17.0, 12.0, 10.0, 5.0, 6.0, 4.0, 11.0, 2.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11590576171875, -0.112579345703125, -0.1092529296875, -0.105926513671875, -0.10260009765625, -0.099273681640625, -0.095947265625, -0.092620849609375, -0.08929443359375, -0.085968017578125, -0.0826416015625, -0.079315185546875, -0.07598876953125, -0.072662353515625, -0.0693359375, -0.066009521484375, -0.06268310546875, -0.059356689453125, -0.0560302734375, -0.052703857421875, -0.04937744140625, -0.046051025390625, -0.042724609375, -0.039398193359375, -0.03607177734375, -0.032745361328125, -0.0294189453125, -0.026092529296875, -0.02276611328125, -0.019439697265625, -0.01611328125, -0.012786865234375, -0.00946044921875, -0.006134033203125, -0.0028076171875, 0.000518798828125, 0.00384521484375, 0.007171630859375, 0.010498046875, 0.013824462890625, 0.01715087890625, 0.020477294921875, 0.0238037109375, 0.027130126953125, 0.03045654296875, 0.033782958984375, 0.037109375, 0.040435791015625, 0.04376220703125, 0.047088623046875, 0.0504150390625, 0.053741455078125, 0.05706787109375, 0.060394287109375, 0.063720703125, 0.067047119140625, 0.07037353515625, 0.073699951171875, 0.0770263671875, 0.080352783203125, 0.08367919921875, 0.087005615234375, 0.09033203125, 0.093658447265625, 0.09698486328125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 4.0, 6.0, 20.0, 42.0, 58.0, 108.0, 163.0, 168.0, 134.0, 119.0, 83.0, 61.0, 21.0, 11.0, 9.0, 2.0, 1.0, 1.0], "bins": [-0.0087890625, -0.008625015616416931, -0.008460968732833862, -0.008296921849250793, -0.008132874965667725, -0.007968828082084656, -0.007804781198501587, -0.007640734314918518, -0.007476687431335449, -0.00731264054775238, -0.0071485936641693115, -0.006984546780586243, -0.006820499897003174, -0.006656453013420105, -0.006492406129837036, -0.006328359246253967, -0.0061643123626708984, -0.00600026547908783, -0.005836218595504761, -0.005672171711921692, -0.005508124828338623, -0.005344077944755554, -0.005180031061172485, -0.0050159841775894165, -0.004851937294006348, -0.004687890410423279, -0.00452384352684021, -0.004359796643257141, -0.004195749759674072, -0.004031702876091003, -0.0038676559925079346, -0.0037036091089248657, -0.003539562225341797, -0.003375515341758728, -0.003211468458175659, -0.0030474215745925903, -0.0028833746910095215, -0.0027193278074264526, -0.002555280923843384, -0.002391234040260315, -0.002227187156677246, -0.0020631402730941772, -0.0018990933895111084, -0.0017350465059280396, -0.0015709996223449707, -0.0014069527387619019, -0.001242905855178833, -0.0010788589715957642, -0.0009148120880126953, -0.0007507652044296265, -0.0005867183208465576, -0.00042267143726348877, -0.0002586245536804199, -9.457767009735107e-05, 6.946921348571777e-05, 0.00023351609706878662, 0.00039756298065185547, 0.0005616098642349243, 0.0007256567478179932, 0.000889703631401062, 0.0010537505149841309, 0.0012177973985671997, 0.0013818442821502686, 0.0015458911657333374, 0.0017099380493164062]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 14.0, 19.0, 25.0, 37.0, 43.0, 68.0, 109.0, 170.0, 354.0, 865.0, 3749.0, 32256.0, 622783.0, 364585.0, 19291.0, 2639.0, 739.0, 326.0, 159.0, 100.0, 60.0, 47.0, 41.0, 20.0, 11.0, 9.0, 5.0, 12.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05609130859375, -0.054483890533447266, -0.05287647247314453, -0.0512690544128418, -0.04966163635253906, -0.04805421829223633, -0.046446800231933594, -0.04483938217163086, -0.043231964111328125, -0.04162454605102539, -0.040017127990722656, -0.03840970993041992, -0.03680229187011719, -0.03519487380981445, -0.03358745574951172, -0.031980037689208984, -0.03037261962890625, -0.028765201568603516, -0.02715778350830078, -0.025550365447998047, -0.023942947387695312, -0.022335529327392578, -0.020728111267089844, -0.01912069320678711, -0.017513275146484375, -0.01590585708618164, -0.014298439025878906, -0.012691020965576172, -0.011083602905273438, -0.009476184844970703, -0.007868766784667969, -0.006261348724365234, -0.0046539306640625, -0.0030465126037597656, -0.0014390945434570312, 0.00016832351684570312, 0.0017757415771484375, 0.003383159637451172, 0.004990577697753906, 0.006597995758056641, 0.008205413818359375, 0.00981283187866211, 0.011420249938964844, 0.013027667999267578, 0.014635086059570312, 0.016242504119873047, 0.01784992218017578, 0.019457340240478516, 0.02106475830078125, 0.022672176361083984, 0.02427959442138672, 0.025887012481689453, 0.027494430541992188, 0.029101848602294922, 0.030709266662597656, 0.03231668472290039, 0.033924102783203125, 0.03553152084350586, 0.037138938903808594, 0.03874635696411133, 0.04035377502441406, 0.0419611930847168, 0.04356861114501953, 0.045176029205322266, 0.046783447265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 12.0, 10.0, 15.0, 12.0, 23.0, 18.0, 22.0, 29.0, 45.0, 44.0, 51.0, 42.0, 61.0, 60.0, 49.0, 49.0, 54.0, 53.0, 60.0, 41.0, 38.0, 42.0, 37.0, 23.0, 20.0, 18.0, 16.0, 10.0, 12.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01183319091796875, -0.011432647705078125, -0.0110321044921875, -0.010631561279296875, -0.01023101806640625, -0.009830474853515625, -0.009429931640625, -0.009029388427734375, -0.00862884521484375, -0.008228302001953125, -0.0078277587890625, -0.007427215576171875, -0.00702667236328125, -0.006626129150390625, -0.0062255859375, -0.005825042724609375, -0.00542449951171875, -0.005023956298828125, -0.0046234130859375, -0.004222869873046875, -0.00382232666015625, -0.003421783447265625, -0.003021240234375, -0.002620697021484375, -0.00222015380859375, -0.001819610595703125, -0.0014190673828125, -0.001018524169921875, -0.00061798095703125, -0.000217437744140625, 0.00018310546875, 0.000583648681640625, 0.00098419189453125, 0.001384735107421875, 0.0017852783203125, 0.002185821533203125, 0.00258636474609375, 0.002986907958984375, 0.003387451171875, 0.003787994384765625, 0.00418853759765625, 0.004589080810546875, 0.0049896240234375, 0.005390167236328125, 0.00579071044921875, 0.006191253662109375, 0.006591796875, 0.006992340087890625, 0.00739288330078125, 0.007793426513671875, 0.0081939697265625, 0.008594512939453125, 0.00899505615234375, 0.009395599365234375, 0.009796142578125, 0.010196685791015625, 0.01059722900390625, 0.010997772216796875, 0.0113983154296875, 0.011798858642578125, 0.01219940185546875, 0.012599945068359375, 0.01300048828125, 0.013401031494140625, 0.01380157470703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 6.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 2.0, 10.0, 3.0, 14.0, 12.0, 15.0, 32.0, 22.0, 56.0, 49.0, 98.0, 169.0, 422.0, 1398.0, 6717.0, 155580.0, 864845.0, 15430.0, 2303.0, 707.0, 264.0, 118.0, 73.0, 53.0, 34.0, 29.0, 14.0, 11.0, 13.0, 6.0, 6.0, 2.0, 9.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0], "bins": [-0.08447265625, -0.08207225799560547, -0.07967185974121094, -0.0772714614868164, -0.07487106323242188, -0.07247066497802734, -0.07007026672363281, -0.06766986846923828, -0.06526947021484375, -0.06286907196044922, -0.06046867370605469, -0.058068275451660156, -0.055667877197265625, -0.053267478942871094, -0.05086708068847656, -0.04846668243408203, -0.0460662841796875, -0.04366588592529297, -0.04126548767089844, -0.038865089416503906, -0.036464691162109375, -0.034064292907714844, -0.03166389465332031, -0.02926349639892578, -0.02686309814453125, -0.02446269989013672, -0.022062301635742188, -0.019661903381347656, -0.017261505126953125, -0.014861106872558594, -0.012460708618164062, -0.010060310363769531, -0.007659912109375, -0.005259513854980469, -0.0028591156005859375, -0.00045871734619140625, 0.001941680908203125, 0.004342079162597656, 0.0067424774169921875, 0.009142875671386719, 0.01154327392578125, 0.013943672180175781, 0.016344070434570312, 0.018744468688964844, 0.021144866943359375, 0.023545265197753906, 0.025945663452148438, 0.02834606170654297, 0.0307464599609375, 0.03314685821533203, 0.03554725646972656, 0.037947654724121094, 0.040348052978515625, 0.042748451232910156, 0.04514884948730469, 0.04754924774169922, 0.04994964599609375, 0.05235004425048828, 0.05475044250488281, 0.057150840759277344, 0.059551239013671875, 0.061951637268066406, 0.06435203552246094, 0.06675243377685547, 0.06915283203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 7.0, 18.0, 23.0, 46.0, 102.0, 169.0, 261.0, 157.0, 90.0, 40.0, 22.0, 20.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.0002363733947277069, -0.00022860616445541382, -0.00022083893418312073, -0.00021307170391082764, -0.00020530447363853455, -0.00019753724336624146, -0.00018977001309394836, -0.00018200278282165527, -0.00017423555254936218, -0.0001664683222770691, -0.000158701092004776, -0.0001509338617324829, -0.00014316663146018982, -0.00013539940118789673, -0.00012763217091560364, -0.00011986494064331055, -0.00011209771037101746, -0.00010433048009872437, -9.656324982643127e-05, -8.879601955413818e-05, -8.102878928184509e-05, -7.3261559009552e-05, -6.549432873725891e-05, -5.772709846496582e-05, -4.995986819267273e-05, -4.219263792037964e-05, -3.442540764808655e-05, -2.6658177375793457e-05, -1.8890947103500366e-05, -1.1123716831207275e-05, -3.3564865589141846e-06, 4.410743713378906e-06, 1.2177973985671997e-05, 1.9945204257965088e-05, 2.771243453025818e-05, 3.547966480255127e-05, 4.324689507484436e-05, 5.101412534713745e-05, 5.878135561943054e-05, 6.654858589172363e-05, 7.431581616401672e-05, 8.208304643630981e-05, 8.98502767086029e-05, 9.7617506980896e-05, 0.00010538473725318909, 0.00011315196752548218, 0.00012091919779777527, 0.00012868642807006836, 0.00013645365834236145, 0.00014422088861465454, 0.00015198811888694763, 0.00015975534915924072, 0.0001675225794315338, 0.0001752898097038269, 0.00018305703997612, 0.00019082427024841309, 0.00019859150052070618, 0.00020635873079299927, 0.00021412596106529236, 0.00022189319133758545, 0.00022966042160987854, 0.00023742765188217163, 0.0002451948821544647, 0.0002529621124267578]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 15.0, 16.0, 36.0, 86.0, 132.0, 362.0, 1471.0, 17505.0, 1020543.0, 6981.0, 910.0, 245.0, 112.0, 56.0, 23.0, 15.0, 12.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.30277252197265625, -0.2928009033203125, -0.28282928466796875, -0.272857666015625, -0.26288604736328125, -0.2529144287109375, -0.24294281005859375, -0.23297119140625, -0.22299957275390625, -0.2130279541015625, -0.20305633544921875, -0.193084716796875, -0.18311309814453125, -0.1731414794921875, -0.16316986083984375, -0.1531982421875, -0.14322662353515625, -0.1332550048828125, -0.12328338623046875, -0.113311767578125, -0.10334014892578125, -0.0933685302734375, -0.08339691162109375, -0.07342529296875, -0.06345367431640625, -0.0534820556640625, -0.04351043701171875, -0.033538818359375, -0.02356719970703125, -0.0135955810546875, -0.00362396240234375, 0.00634765625, 0.01631927490234375, 0.0262908935546875, 0.03626251220703125, 0.046234130859375, 0.05620574951171875, 0.0661773681640625, 0.07614898681640625, 0.08612060546875, 0.09609222412109375, 0.1060638427734375, 0.11603546142578125, 0.126007080078125, 0.13597869873046875, 0.1459503173828125, 0.15592193603515625, 0.1658935546875, 0.17586517333984375, 0.1858367919921875, 0.19580841064453125, 0.205780029296875, 0.21575164794921875, 0.2257232666015625, 0.23569488525390625, 0.24566650390625, 0.25563812255859375, 0.2656097412109375, 0.27558135986328125, 0.285552978515625, 0.29552459716796875, 0.3054962158203125, 0.31546783447265625, 0.325439453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 47.0, 161.0, 384.0, 236.0, 64.0, 30.0, 13.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.09503173828125, -0.09290504455566406, -0.09077835083007812, -0.08865165710449219, -0.08652496337890625, -0.08439826965332031, -0.08227157592773438, -0.08014488220214844, -0.0780181884765625, -0.07589149475097656, -0.07376480102539062, -0.07163810729980469, -0.06951141357421875, -0.06738471984863281, -0.06525802612304688, -0.06313133239746094, -0.061004638671875, -0.05887794494628906, -0.056751251220703125, -0.05462455749511719, -0.05249786376953125, -0.05037117004394531, -0.048244476318359375, -0.04611778259277344, -0.0439910888671875, -0.04186439514160156, -0.039737701416015625, -0.03761100769042969, -0.03548431396484375, -0.03335762023925781, -0.031230926513671875, -0.029104232788085938, -0.0269775390625, -0.024850845336914062, -0.022724151611328125, -0.020597457885742188, -0.01847076416015625, -0.016344070434570312, -0.014217376708984375, -0.012090682983398438, -0.0099639892578125, -0.007837295532226562, -0.005710601806640625, -0.0035839080810546875, -0.00145721435546875, 0.0006694793701171875, 0.002796173095703125, 0.0049228668212890625, 0.007049560546875, 0.009176254272460938, 0.011302947998046875, 0.013429641723632812, 0.01555633544921875, 0.017683029174804688, 0.019809722900390625, 0.021936416625976562, 0.0240631103515625, 0.026189804077148438, 0.028316497802734375, 0.030443191528320312, 0.03256988525390625, 0.03469657897949219, 0.036823272705078125, 0.03894996643066406, 0.04107666015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 929.0, 57.0, 1.0, 2.0, 2.0], "bins": [-4.054222583770752, -3.986128091812134, -3.9180335998535156, -3.8499391078948975, -3.7818446159362793, -3.713750123977661, -3.645655632019043, -3.577561140060425, -3.5094666481018066, -3.4413721561431885, -3.3732776641845703, -3.305183172225952, -3.237088680267334, -3.168994188308716, -3.1008996963500977, -3.0328052043914795, -2.9647107124328613, -2.896616220474243, -2.828521728515625, -2.760427236557007, -2.6923327445983887, -2.6242382526397705, -2.5561437606811523, -2.488049268722534, -2.419954776763916, -2.351860284805298, -2.2837657928466797, -2.2156713008880615, -2.1475768089294434, -2.079482316970825, -2.011387825012207, -1.9432933330535889, -1.8751989603042603, -1.807104468345642, -1.739009976387024, -1.6709154844284058, -1.6028209924697876, -1.5347265005111694, -1.4666320085525513, -1.398537516593933, -1.330443024635315, -1.2623485326766968, -1.1942540407180786, -1.1261595487594604, -1.0580650568008423, -0.9899705648422241, -0.921876072883606, -0.8537815809249878, -0.7856870889663696, -0.7175925970077515, -0.6494981050491333, -0.5814036130905151, -0.513309121131897, -0.4452146291732788, -0.37712013721466064, -0.3090256452560425, -0.24093115329742432, -0.17283666133880615, -0.10474216938018799, -0.036647677421569824, 0.03144681453704834, 0.0995413064956665, 0.16763579845428467, 0.23573029041290283, 0.303824782371521]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 16.0, 19.0, 30.0, 37.0, 47.0, 67.0, 74.0, 73.0, 89.0, 89.0, 89.0, 83.0, 71.0, 59.0, 51.0, 43.0, 28.0, 17.0, 12.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08917844295501709, -0.08378955721855164, -0.07840067148208618, -0.07301178574562073, -0.06762290000915527, -0.06223401427268982, -0.056845128536224365, -0.05145624279975891, -0.04606735706329346, -0.040678471326828, -0.03528958559036255, -0.029900699853897095, -0.02451181411743164, -0.019122928380966187, -0.013734042644500732, -0.008345156908035278, -0.0029562711715698242, 0.00243261456489563, 0.007821500301361084, 0.013210386037826538, 0.018599271774291992, 0.023988157510757446, 0.0293770432472229, 0.034765928983688354, 0.04015481472015381, 0.04554370045661926, 0.05093258619308472, 0.05632147192955017, 0.061710357666015625, 0.06709924340248108, 0.07248812913894653, 0.07787701487541199, 0.08326590061187744, 0.0886547863483429, 0.09404367208480835, 0.0994325578212738, 0.10482144355773926, 0.11021032929420471, 0.11559921503067017, 0.12098810076713562, 0.12637698650360107, 0.13176587224006653, 0.13715475797653198, 0.14254364371299744, 0.1479325294494629, 0.15332141518592834, 0.1587103009223938, 0.16409918665885925, 0.1694880723953247, 0.17487695813179016, 0.18026584386825562, 0.18565472960472107, 0.19104361534118652, 0.19643250107765198, 0.20182138681411743, 0.20721027255058289, 0.21259915828704834, 0.2179880440235138, 0.22337692975997925, 0.2287658154964447, 0.23415470123291016, 0.2395435869693756, 0.24493247270584106, 0.2503213584423065, 0.255710244178772]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 12.0, 27.0, 33.0, 66.0, 148.0, 220.0, 734.0, 8430.0, 4181380.0, 2854.0, 228.0, 67.0, 40.0, 14.0, 13.0, 7.0, 2.0, 5.0, 2.0], "bins": [-0.56494140625, -0.5543642044067383, -0.5437870025634766, -0.5332098007202148, -0.5226325988769531, -0.5120553970336914, -0.5014781951904297, -0.49090099334716797, -0.48032379150390625, -0.46974658966064453, -0.4591693878173828, -0.4485921859741211, -0.4380149841308594, -0.42743778228759766, -0.41686058044433594, -0.4062833786010742, -0.3957061767578125, -0.3851289749145508, -0.37455177307128906, -0.36397457122802734, -0.3533973693847656, -0.3428201675415039, -0.3322429656982422, -0.32166576385498047, -0.31108856201171875, -0.30051136016845703, -0.2899341583251953, -0.2793569564819336, -0.2687797546386719, -0.25820255279541016, -0.24762535095214844, -0.23704814910888672, -0.226470947265625, -0.21589374542236328, -0.20531654357910156, -0.19473934173583984, -0.18416213989257812, -0.1735849380493164, -0.1630077362060547, -0.15243053436279297, -0.14185333251953125, -0.13127613067626953, -0.12069892883300781, -0.1101217269897461, -0.09954452514648438, -0.08896732330322266, -0.07839012145996094, -0.06781291961669922, -0.0572357177734375, -0.04665851593017578, -0.03608131408691406, -0.025504112243652344, -0.014926910400390625, -0.004349708557128906, 0.0062274932861328125, 0.01680469512939453, 0.02738189697265625, 0.03795909881591797, 0.04853630065917969, 0.059113502502441406, 0.06969070434570312, 0.08026790618896484, 0.09084510803222656, 0.10142230987548828, 0.11199951171875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 10.0, 17.0, 20.0, 43.0, 85.0, 141.0, 162.0, 163.0, 138.0, 95.0, 73.0, 35.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.010498046875, -0.010288476943969727, -0.010078907012939453, -0.00986933708190918, -0.009659767150878906, -0.009450197219848633, -0.00924062728881836, -0.009031057357788086, -0.008821487426757812, -0.008611917495727539, -0.008402347564697266, -0.008192777633666992, -0.007983207702636719, -0.007773637771606445, -0.007564067840576172, -0.0073544979095458984, -0.007144927978515625, -0.0069353580474853516, -0.006725788116455078, -0.006516218185424805, -0.006306648254394531, -0.006097078323364258, -0.005887508392333984, -0.005677938461303711, -0.0054683685302734375, -0.005258798599243164, -0.005049228668212891, -0.004839658737182617, -0.004630088806152344, -0.00442051887512207, -0.004210948944091797, -0.0040013790130615234, -0.00379180908203125, -0.0035822391510009766, -0.003372669219970703, -0.0031630992889404297, -0.0029535293579101562, -0.002743959426879883, -0.0025343894958496094, -0.002324819564819336, -0.0021152496337890625, -0.001905679702758789, -0.0016961097717285156, -0.0014865398406982422, -0.0012769699096679688, -0.0010673999786376953, -0.0008578300476074219, -0.0006482601165771484, -0.000438690185546875, -0.00022912025451660156, -1.9550323486328125e-05, 0.0001900196075439453, 0.00039958953857421875, 0.0006091594696044922, 0.0008187294006347656, 0.001028299331665039, 0.0012378692626953125, 0.001447439193725586, 0.0016570091247558594, 0.0018665790557861328, 0.0020761489868164062, 0.0022857189178466797, 0.002495288848876953, 0.0027048587799072266, 0.0029144287109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 20.0, 36.0, 99.0, 205.0, 396.0, 204232.0, 3988716.0, 379.0, 132.0, 45.0, 20.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.6451034545898438, -1.6085662841796875, -1.5720291137695312, -1.535491943359375, -1.4989547729492188, -1.4624176025390625, -1.4258804321289062, -1.38934326171875, -1.3528060913085938, -1.3162689208984375, -1.2797317504882812, -1.243194580078125, -1.2066574096679688, -1.1701202392578125, -1.1335830688476562, -1.0970458984375, -1.0605087280273438, -1.0239715576171875, -0.9874343872070312, -0.950897216796875, -0.9143600463867188, -0.8778228759765625, -0.8412857055664062, -0.80474853515625, -0.7682113647460938, -0.7316741943359375, -0.6951370239257812, -0.658599853515625, -0.6220626831054688, -0.5855255126953125, -0.5489883422851562, -0.512451171875, -0.47591400146484375, -0.4393768310546875, -0.40283966064453125, -0.366302490234375, -0.32976531982421875, -0.2932281494140625, -0.25669097900390625, -0.22015380859375, -0.18361663818359375, -0.1470794677734375, -0.11054229736328125, -0.074005126953125, -0.03746795654296875, -0.0009307861328125, 0.03560638427734375, 0.0721435546875, 0.10868072509765625, 0.1452178955078125, 0.18175506591796875, 0.218292236328125, 0.25482940673828125, 0.2913665771484375, 0.32790374755859375, 0.36444091796875, 0.40097808837890625, 0.4375152587890625, 0.47405242919921875, 0.510589599609375, 0.5471267700195312, 0.5836639404296875, 0.6202011108398438, 0.65673828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 13.0, 126.0, 3612.0, 282.0, 40.0, 8.0, 5.0], "bins": [-0.16015625, -0.1574711799621582, -0.1547861099243164, -0.1521010398864746, -0.1494159698486328, -0.14673089981079102, -0.14404582977294922, -0.14136075973510742, -0.13867568969726562, -0.13599061965942383, -0.13330554962158203, -0.13062047958374023, -0.12793540954589844, -0.12525033950805664, -0.12256526947021484, -0.11988019943237305, -0.11719512939453125, -0.11451005935668945, -0.11182498931884766, -0.10913991928100586, -0.10645484924316406, -0.10376977920532227, -0.10108470916748047, -0.09839963912963867, -0.09571456909179688, -0.09302949905395508, -0.09034442901611328, -0.08765935897827148, -0.08497428894042969, -0.08228921890258789, -0.0796041488647461, -0.0769190788269043, -0.0742340087890625, -0.0715489387512207, -0.0688638687133789, -0.06617879867553711, -0.06349372863769531, -0.060808658599853516, -0.05812358856201172, -0.05543851852416992, -0.052753448486328125, -0.05006837844848633, -0.04738330841064453, -0.044698238372802734, -0.04201316833496094, -0.03932809829711914, -0.036643028259277344, -0.03395795822143555, -0.03127288818359375, -0.028587818145751953, -0.025902748107910156, -0.02321767807006836, -0.020532608032226562, -0.017847537994384766, -0.015162467956542969, -0.012477397918701172, -0.009792327880859375, -0.007107257843017578, -0.004422187805175781, -0.0017371177673339844, 0.0009479522705078125, 0.0036330223083496094, 0.006318092346191406, 0.009003162384033203, 0.011688232421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 41.0, 778.0, 168.0, 18.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.068528175354004, -2.0320799350738525, -1.9956316947937012, -1.9591833353042603, -1.9227350950241089, -1.8862868547439575, -1.8498386144638062, -1.8133902549743652, -1.7769420146942139, -1.7404937744140625, -1.7040455341339111, -1.6675971746444702, -1.6311489343643188, -1.5947006940841675, -1.5582524538040161, -1.5218040943145752, -1.4853558540344238, -1.4489076137542725, -1.412459373474121, -1.3760110139846802, -1.3395627737045288, -1.3031145334243774, -1.266666293144226, -1.2302179336547852, -1.1937698125839233, -1.157321572303772, -1.1208733320236206, -1.0844249725341797, -1.0479767322540283, -1.011528491973877, -0.9750802516937256, -0.9386319518089294, -0.9021837115287781, -0.8657354712486267, -0.8292871713638306, -0.7928389310836792, -0.7563906311988831, -0.7199423909187317, -0.6834940910339355, -0.6470458507537842, -0.6105976104736328, -0.5741493701934814, -0.5377010703086853, -0.5012528300285339, -0.4648045301437378, -0.4283562898635864, -0.39190801978111267, -0.3554597496986389, -0.3190114498138428, -0.282563179731369, -0.24611490964889526, -0.2096666544675827, -0.17321838438510895, -0.1367701143026352, -0.10032185912132263, -0.06387358903884888, -0.027425318956375122, 0.009022947400808334, 0.04547121375799179, 0.08191947638988495, 0.1183677464723587, 0.15481601655483246, 0.19126427173614502, 0.22771254181861877, 0.26416081190109253]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 16.0, 43.0, 67.0, 90.0, 143.0, 173.0, 148.0, 125.0, 79.0, 55.0, 24.0, 15.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37566179037094116, -0.36347347497940063, -0.3512851595878601, -0.3390968441963196, -0.32690852880477905, -0.3147202134132385, -0.302531898021698, -0.29034358263015747, -0.27815526723861694, -0.2659669518470764, -0.2537786364555359, -0.24159032106399536, -0.22940200567245483, -0.2172136902809143, -0.20502537488937378, -0.19283705949783325, -0.18064874410629272, -0.1684604287147522, -0.15627211332321167, -0.14408379793167114, -0.13189548254013062, -0.11970716714859009, -0.10751885175704956, -0.09533053636550903, -0.0831422209739685, -0.07095390558242798, -0.05876559019088745, -0.046577274799346924, -0.034388959407806396, -0.02220064401626587, -0.010012328624725342, 0.0021759867668151855, 0.014364302158355713, 0.02655261754989624, 0.03874093294143677, 0.050929248332977295, 0.06311756372451782, 0.07530587911605835, 0.08749419450759888, 0.0996825098991394, 0.11187082529067993, 0.12405914068222046, 0.136247456073761, 0.1484357714653015, 0.16062408685684204, 0.17281240224838257, 0.1850007176399231, 0.19718903303146362, 0.20937734842300415, 0.22156566381454468, 0.2337539792060852, 0.24594229459762573, 0.25813060998916626, 0.2703189253807068, 0.2825072407722473, 0.29469555616378784, 0.30688387155532837, 0.3190721869468689, 0.3312605023384094, 0.34344881772994995, 0.3556371331214905, 0.367825448513031, 0.38001376390457153, 0.39220207929611206, 0.4043903946876526]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 7.0, 18.0, 10.0, 11.0, 17.0, 30.0, 31.0, 54.0, 69.0, 98.0, 153.0, 313.0, 597.0, 1481.0, 5232.0, 35094.0, 759141.0, 226690.0, 14293.0, 3030.0, 1074.0, 418.0, 245.0, 120.0, 92.0, 61.0, 43.0, 22.0, 21.0, 20.0, 17.0, 7.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11419677734375, -0.11008930206298828, -0.10598182678222656, -0.10187435150146484, -0.09776687622070312, -0.0936594009399414, -0.08955192565917969, -0.08544445037841797, -0.08133697509765625, -0.07722949981689453, -0.07312202453613281, -0.0690145492553711, -0.06490707397460938, -0.060799598693847656, -0.05669212341308594, -0.05258464813232422, -0.0484771728515625, -0.04436969757080078, -0.04026222229003906, -0.036154747009277344, -0.032047271728515625, -0.027939796447753906, -0.023832321166992188, -0.01972484588623047, -0.01561737060546875, -0.011509895324707031, -0.0074024200439453125, -0.0032949447631835938, 0.000812530517578125, 0.004920005798339844, 0.009027481079101562, 0.013134956359863281, 0.017242431640625, 0.02134990692138672, 0.025457382202148438, 0.029564857482910156, 0.033672332763671875, 0.037779808044433594, 0.04188728332519531, 0.04599475860595703, 0.05010223388671875, 0.05420970916748047, 0.05831718444824219, 0.062424659729003906, 0.06653213500976562, 0.07063961029052734, 0.07474708557128906, 0.07885456085205078, 0.0829620361328125, 0.08706951141357422, 0.09117698669433594, 0.09528446197509766, 0.09939193725585938, 0.1034994125366211, 0.10760688781738281, 0.11171436309814453, 0.11582183837890625, 0.11992931365966797, 0.12403678894042969, 0.1281442642211914, 0.13225173950195312, 0.13635921478271484, 0.14046669006347656, 0.14457416534423828, 0.148681640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 8.0, 10.0, 20.0, 44.0, 56.0, 86.0, 121.0, 148.0, 135.0, 114.0, 98.0, 63.0, 49.0, 30.0, 13.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203704833984375, -0.019753456115722656, -0.019136428833007812, -0.01851940155029297, -0.017902374267578125, -0.01728534698486328, -0.016668319702148438, -0.016051292419433594, -0.01543426513671875, -0.014817237854003906, -0.014200210571289062, -0.013583183288574219, -0.012966156005859375, -0.012349128723144531, -0.011732101440429688, -0.011115074157714844, -0.010498046875, -0.009881019592285156, -0.009263992309570312, -0.008646965026855469, -0.008029937744140625, -0.007412910461425781, -0.0067958831787109375, -0.006178855895996094, -0.00556182861328125, -0.004944801330566406, -0.0043277740478515625, -0.0037107467651367188, -0.003093719482421875, -0.0024766921997070312, -0.0018596649169921875, -0.0012426376342773438, -0.0006256103515625, -8.58306884765625e-06, 0.0006084442138671875, 0.0012254714965820312, 0.001842498779296875, 0.0024595260620117188, 0.0030765533447265625, 0.0036935806274414062, 0.00431060791015625, 0.004927635192871094, 0.0055446624755859375, 0.006161689758300781, 0.006778717041015625, 0.007395744323730469, 0.008012771606445312, 0.008629798889160156, 0.009246826171875, 0.009863853454589844, 0.010480880737304688, 0.011097908020019531, 0.011714935302734375, 0.012331962585449219, 0.012948989868164062, 0.013566017150878906, 0.01418304443359375, 0.014800071716308594, 0.015417098999023438, 0.01603412628173828, 0.016651153564453125, 0.01726818084716797, 0.017885208129882812, 0.018502235412597656, 0.0191192626953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 1.0, 7.0, 10.0, 12.0, 12.0, 11.0, 22.0, 19.0, 42.0, 59.0, 99.0, 185.0, 507.0, 1996.0, 26203.0, 938485.0, 76276.0, 3306.0, 699.0, 265.0, 116.0, 63.0, 47.0, 27.0, 19.0, 14.0, 12.0, 9.0, 13.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11383056640625, -0.10985469818115234, -0.10587882995605469, -0.10190296173095703, -0.09792709350585938, -0.09395122528076172, -0.08997535705566406, -0.0859994888305664, -0.08202362060546875, -0.0780477523803711, -0.07407188415527344, -0.07009601593017578, -0.06612014770507812, -0.06214427947998047, -0.05816841125488281, -0.054192543029785156, -0.0502166748046875, -0.046240806579589844, -0.04226493835449219, -0.03828907012939453, -0.034313201904296875, -0.03033733367919922, -0.026361465454101562, -0.022385597229003906, -0.01840972900390625, -0.014433860778808594, -0.010457992553710938, -0.006482124328613281, -0.002506256103515625, 0.0014696121215820312, 0.0054454803466796875, 0.009421348571777344, 0.013397216796875, 0.017373085021972656, 0.021348953247070312, 0.02532482147216797, 0.029300689697265625, 0.03327655792236328, 0.03725242614746094, 0.041228294372558594, 0.04520416259765625, 0.049180030822753906, 0.05315589904785156, 0.05713176727294922, 0.061107635498046875, 0.06508350372314453, 0.06905937194824219, 0.07303524017333984, 0.0770111083984375, 0.08098697662353516, 0.08496284484863281, 0.08893871307373047, 0.09291458129882812, 0.09689044952392578, 0.10086631774902344, 0.1048421859741211, 0.10881805419921875, 0.1127939224243164, 0.11676979064941406, 0.12074565887451172, 0.12472152709960938, 0.12869739532470703, 0.1326732635498047, 0.13664913177490234, 0.140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 14.0, 15.0, 10.0, 16.0, 24.0, 36.0, 30.0, 36.0, 51.0, 42.0, 39.0, 63.0, 53.0, 67.0, 66.0, 57.0, 62.0, 52.0, 49.0, 50.0, 28.0, 23.0, 29.0, 12.0, 14.0, 10.0, 8.0, 11.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038299560546875, -0.03699636459350586, -0.03569316864013672, -0.03438997268676758, -0.03308677673339844, -0.0317835807800293, -0.030480384826660156, -0.029177188873291016, -0.027873992919921875, -0.026570796966552734, -0.025267601013183594, -0.023964405059814453, -0.022661209106445312, -0.021358013153076172, -0.02005481719970703, -0.01875162124633789, -0.01744842529296875, -0.01614522933959961, -0.014842033386230469, -0.013538837432861328, -0.012235641479492188, -0.010932445526123047, -0.009629249572753906, -0.008326053619384766, -0.007022857666015625, -0.005719661712646484, -0.004416465759277344, -0.003113269805908203, -0.0018100738525390625, -0.0005068778991699219, 0.0007963180541992188, 0.0020995140075683594, 0.0034027099609375, 0.004705905914306641, 0.006009101867675781, 0.007312297821044922, 0.008615493774414062, 0.009918689727783203, 0.011221885681152344, 0.012525081634521484, 0.013828277587890625, 0.015131473541259766, 0.016434669494628906, 0.017737865447998047, 0.019041061401367188, 0.020344257354736328, 0.02164745330810547, 0.02295064926147461, 0.02425384521484375, 0.02555704116821289, 0.02686023712158203, 0.028163433074951172, 0.029466629028320312, 0.030769824981689453, 0.032073020935058594, 0.033376216888427734, 0.034679412841796875, 0.035982608795166016, 0.037285804748535156, 0.0385890007019043, 0.03989219665527344, 0.04119539260864258, 0.04249858856201172, 0.04380178451538086, 0.04510498046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 11.0, 10.0, 24.0, 43.0, 70.0, 167.0, 401.0, 1190.0, 6607.0, 301596.0, 726068.0, 9996.0, 1501.0, 488.0, 177.0, 84.0, 41.0, 28.0, 13.0, 7.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09637451171875, -0.09402894973754883, -0.09168338775634766, -0.08933782577514648, -0.08699226379394531, -0.08464670181274414, -0.08230113983154297, -0.0799555778503418, -0.07761001586914062, -0.07526445388793945, -0.07291889190673828, -0.07057332992553711, -0.06822776794433594, -0.06588220596313477, -0.0635366439819336, -0.06119108200073242, -0.05884552001953125, -0.05649995803833008, -0.054154396057128906, -0.051808834075927734, -0.04946327209472656, -0.04711771011352539, -0.04477214813232422, -0.04242658615112305, -0.040081024169921875, -0.0377354621887207, -0.03538990020751953, -0.03304433822631836, -0.030698776245117188, -0.028353214263916016, -0.026007652282714844, -0.023662090301513672, -0.0213165283203125, -0.018970966339111328, -0.016625404357910156, -0.014279842376708984, -0.011934280395507812, -0.00958871841430664, -0.007243156433105469, -0.004897594451904297, -0.002552032470703125, -0.00020647048950195312, 0.0021390914916992188, 0.004484653472900391, 0.0068302154541015625, 0.009175777435302734, 0.011521339416503906, 0.013866901397705078, 0.01621246337890625, 0.018558025360107422, 0.020903587341308594, 0.023249149322509766, 0.025594711303710938, 0.02794027328491211, 0.03028583526611328, 0.03263139724731445, 0.034976959228515625, 0.0373225212097168, 0.03966808319091797, 0.04201364517211914, 0.04435920715332031, 0.046704769134521484, 0.049050331115722656, 0.05139589309692383, 0.053741455078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 8.0, 8.0, 4.0, 8.0, 5.0, 17.0, 18.0, 17.0, 20.0, 27.0, 57.0, 57.0, 96.0, 109.0, 142.0, 72.0, 59.0, 38.0, 34.0, 24.0, 24.0, 24.0, 21.0, 13.0, 7.0, 13.0, 12.0, 12.0, 3.0, 4.0, 5.0, 6.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00013685226440429688, -0.00013256259262561798, -0.0001282729208469391, -0.0001239832490682602, -0.0001196935772895813, -0.0001154039055109024, -0.00011111423373222351, -0.00010682456195354462, -0.00010253489017486572, -9.824521839618683e-05, -9.395554661750793e-05, -8.966587483882904e-05, -8.537620306015015e-05, -8.108653128147125e-05, -7.679685950279236e-05, -7.250718772411346e-05, -6.821751594543457e-05, -6.392784416675568e-05, -5.963817238807678e-05, -5.534850060939789e-05, -5.1058828830718994e-05, -4.67691570520401e-05, -4.2479485273361206e-05, -3.818981349468231e-05, -3.390014171600342e-05, -2.9610469937324524e-05, -2.532079815864563e-05, -2.1031126379966736e-05, -1.6741454601287842e-05, -1.2451782822608948e-05, -8.162111043930054e-06, -3.87243926525116e-06, 4.172325134277344e-07, 4.706904292106628e-06, 8.996576070785522e-06, 1.3286247849464417e-05, 1.757591962814331e-05, 2.1865591406822205e-05, 2.61552631855011e-05, 3.0444934964179993e-05, 3.473460674285889e-05, 3.902427852153778e-05, 4.3313950300216675e-05, 4.760362207889557e-05, 5.189329385757446e-05, 5.618296563625336e-05, 6.047263741493225e-05, 6.476230919361115e-05, 6.905198097229004e-05, 7.334165275096893e-05, 7.763132452964783e-05, 8.192099630832672e-05, 8.621066808700562e-05, 9.050033986568451e-05, 9.47900116443634e-05, 9.90796834230423e-05, 0.00010336935520172119, 0.00010765902698040009, 0.00011194869875907898, 0.00011623837053775787, 0.00012052804231643677, 0.00012481771409511566, 0.00012910738587379456, 0.00013339705765247345, 0.00013768672943115234]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 19.0, 29.0, 53.0, 95.0, 251.0, 839.0, 3836.0, 304794.0, 731651.0, 5458.0, 958.0, 292.0, 114.0, 63.0, 35.0, 12.0, 14.0, 9.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.12977027893066406, -0.12636184692382812, -0.12295341491699219, -0.11954498291015625, -0.11613655090332031, -0.11272811889648438, -0.10931968688964844, -0.1059112548828125, -0.10250282287597656, -0.09909439086914062, -0.09568595886230469, -0.09227752685546875, -0.08886909484863281, -0.08546066284179688, -0.08205223083496094, -0.078643798828125, -0.07523536682128906, -0.07182693481445312, -0.06841850280761719, -0.06501007080078125, -0.06160163879394531, -0.058193206787109375, -0.05478477478027344, -0.0513763427734375, -0.04796791076660156, -0.044559478759765625, -0.04115104675292969, -0.03774261474609375, -0.03433418273925781, -0.030925750732421875, -0.027517318725585938, -0.02410888671875, -0.020700454711914062, -0.017292022705078125, -0.013883590698242188, -0.01047515869140625, -0.0070667266845703125, -0.003658294677734375, -0.0002498626708984375, 0.0031585693359375, 0.0065670013427734375, 0.009975433349609375, 0.013383865356445312, 0.01679229736328125, 0.020200729370117188, 0.023609161376953125, 0.027017593383789062, 0.030426025390625, 0.03383445739746094, 0.037242889404296875, 0.04065132141113281, 0.04405975341796875, 0.04746818542480469, 0.050876617431640625, 0.05428504943847656, 0.0576934814453125, 0.06110191345214844, 0.06451034545898438, 0.06791877746582031, 0.07132720947265625, 0.07473564147949219, 0.07814407348632812, 0.08155250549316406, 0.0849609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 9.0, 11.0, 13.0, 19.0, 26.0, 45.0, 87.0, 103.0, 121.0, 128.0, 120.0, 99.0, 75.0, 41.0, 40.0, 22.0, 9.0, 6.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036865234375, -0.03573131561279297, -0.03459739685058594, -0.033463478088378906, -0.032329559326171875, -0.031195640563964844, -0.030061721801757812, -0.02892780303955078, -0.02779388427734375, -0.02665996551513672, -0.025526046752929688, -0.024392127990722656, -0.023258209228515625, -0.022124290466308594, -0.020990371704101562, -0.01985645294189453, -0.0187225341796875, -0.01758861541748047, -0.016454696655273438, -0.015320777893066406, -0.014186859130859375, -0.013052940368652344, -0.011919021606445312, -0.010785102844238281, -0.00965118408203125, -0.008517265319824219, -0.0073833465576171875, -0.006249427795410156, -0.005115509033203125, -0.003981590270996094, -0.0028476715087890625, -0.0017137527465820312, -0.000579833984375, 0.0005540847778320312, 0.0016880035400390625, 0.0028219223022460938, 0.003955841064453125, 0.005089759826660156, 0.0062236785888671875, 0.007357597351074219, 0.00849151611328125, 0.009625434875488281, 0.010759353637695312, 0.011893272399902344, 0.013027191162109375, 0.014161109924316406, 0.015295028686523438, 0.01642894744873047, 0.0175628662109375, 0.01869678497314453, 0.019830703735351562, 0.020964622497558594, 0.022098541259765625, 0.023232460021972656, 0.024366378784179688, 0.02550029754638672, 0.02663421630859375, 0.02776813507080078, 0.028902053833007812, 0.030035972595214844, 0.031169891357421875, 0.032303810119628906, 0.03343772888183594, 0.03457164764404297, 0.03570556640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 15.0, 169.0, 725.0, 74.0, 16.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8053152561187744, -1.7635196447372437, -1.721724033355713, -1.6799283027648926, -1.6381326913833618, -1.596337080001831, -1.5545413494110107, -1.51274573802948, -1.4709501266479492, -1.4291545152664185, -1.3873589038848877, -1.3455631732940674, -1.3037675619125366, -1.2619719505310059, -1.2201762199401855, -1.1783806085586548, -1.136584997177124, -1.0947893857955933, -1.0529937744140625, -1.0111980438232422, -0.9694024324417114, -0.9276068210601807, -0.8858111500740051, -0.8440154790878296, -0.8022198677062988, -0.7604242563247681, -0.7186285853385925, -0.676832914352417, -0.6350373029708862, -0.5932416915893555, -0.5514460206031799, -0.5096503496170044, -0.46785473823547363, -0.4260590970516205, -0.38426345586776733, -0.3424678146839142, -0.30067217350006104, -0.2588765323162079, -0.21708089113235474, -0.1752852499485016, -0.13348960876464844, -0.09169396758079529, -0.04989832639694214, -0.00810268521308899, 0.03369295597076416, 0.07548859715461731, 0.11728423833847046, 0.1590798795223236, 0.20087552070617676, 0.2426711618900299, 0.28446680307388306, 0.3262624442577362, 0.36805808544158936, 0.4098537266254425, 0.45164936780929565, 0.4934450089931488, 0.535240650177002, 0.5770362615585327, 0.6188319325447083, 0.6606276035308838, 0.7024232149124146, 0.7442188262939453, 0.7860144972801208, 0.8278101682662964, 0.8696057796478271]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 17.0, 11.0, 10.0, 23.0, 22.0, 29.0, 28.0, 63.0, 68.0, 61.0, 64.0, 76.0, 73.0, 65.0, 78.0, 48.0, 48.0, 34.0, 38.0, 33.0, 28.0, 24.0, 14.0, 7.0, 14.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3083477020263672, -0.2979143559932709, -0.28748100996017456, -0.27704766392707825, -0.26661431789398193, -0.25618094205856323, -0.2457476109266281, -0.2353142499923706, -0.2248809039592743, -0.21444755792617798, -0.20401421189308167, -0.19358086585998535, -0.18314750492572784, -0.17271415889263153, -0.16228081285953522, -0.1518474519252777, -0.1414141207933426, -0.13098077476024628, -0.12054742127656937, -0.11011407524347305, -0.09968072175979614, -0.08924737572669983, -0.07881402969360352, -0.0683806762099266, -0.05794733017683029, -0.04751398041844368, -0.03708063066005707, -0.026647284626960754, -0.016213934868574142, -0.0057805851101875305, 0.004652760922908783, 0.015086114406585693, 0.025519460439682007, 0.03595281019806862, 0.04638615995645523, 0.056819505989551544, 0.06725285947322845, 0.07768620550632477, 0.08811955153942108, 0.09855290502309799, 0.1089862510561943, 0.11941959708929062, 0.12985295057296753, 0.14028629660606384, 0.15071964263916016, 0.16115298867225647, 0.17158633470535278, 0.1820196956396103, 0.1924530416727066, 0.20288638770580292, 0.21331973373889923, 0.22375309467315674, 0.23418644070625305, 0.24461978673934937, 0.2550531327724457, 0.265486478805542, 0.2759198248386383, 0.2863531708717346, 0.29678651690483093, 0.30721986293792725, 0.31765320897102356, 0.3280865550041199, 0.3385199308395386, 0.3489532768726349, 0.3593866229057312]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 3.0, 9.0, 10.0, 11.0, 12.0, 14.0, 28.0, 30.0, 48.0, 64.0, 90.0, 165.0, 269.0, 603.0, 1604.0, 7227.0, 151055.0, 3999899.0, 29125.0, 2980.0, 654.0, 227.0, 71.0, 39.0, 17.0, 13.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.331298828125, -0.3244361877441406, -0.31757354736328125, -0.3107109069824219, -0.3038482666015625, -0.2969856262207031, -0.29012298583984375, -0.2832603454589844, -0.276397705078125, -0.2695350646972656, -0.26267242431640625, -0.2558097839355469, -0.2489471435546875, -0.24208450317382812, -0.23522186279296875, -0.22835922241210938, -0.22149658203125, -0.21463394165039062, -0.20777130126953125, -0.20090866088867188, -0.1940460205078125, -0.18718338012695312, -0.18032073974609375, -0.17345809936523438, -0.166595458984375, -0.15973281860351562, -0.15287017822265625, -0.14600753784179688, -0.1391448974609375, -0.13228225708007812, -0.12541961669921875, -0.11855697631835938, -0.1116943359375, -0.10483169555664062, -0.09796905517578125, -0.09110641479492188, -0.0842437744140625, -0.07738113403320312, -0.07051849365234375, -0.06365585327148438, -0.056793212890625, -0.049930572509765625, -0.04306793212890625, -0.036205291748046875, -0.0293426513671875, -0.022480010986328125, -0.01561737060546875, -0.008754730224609375, -0.00189208984375, 0.004970550537109375, 0.01183319091796875, 0.018695831298828125, 0.0255584716796875, 0.032421112060546875, 0.03928375244140625, 0.046146392822265625, 0.053009033203125, 0.059871673583984375, 0.06673431396484375, 0.07359695434570312, 0.0804595947265625, 0.08732223510742188, 0.09418487548828125, 0.10104751586914062, 0.10791015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 12.0, 16.0, 32.0, 59.0, 74.0, 92.0, 116.0, 124.0, 133.0, 107.0, 81.0, 60.0, 39.0, 21.0, 18.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0240478515625, -0.023456692695617676, -0.02286553382873535, -0.022274374961853027, -0.021683216094970703, -0.02109205722808838, -0.020500898361206055, -0.01990973949432373, -0.019318580627441406, -0.018727421760559082, -0.018136262893676758, -0.017545104026794434, -0.01695394515991211, -0.016362786293029785, -0.01577162742614746, -0.015180468559265137, -0.014589309692382812, -0.013998150825500488, -0.013406991958618164, -0.01281583309173584, -0.012224674224853516, -0.011633515357971191, -0.011042356491088867, -0.010451197624206543, -0.009860038757324219, -0.009268879890441895, -0.00867772102355957, -0.008086562156677246, -0.007495403289794922, -0.006904244422912598, -0.0063130855560302734, -0.005721926689147949, -0.005130767822265625, -0.004539608955383301, -0.0039484500885009766, -0.0033572912216186523, -0.002766132354736328, -0.002174973487854004, -0.0015838146209716797, -0.0009926557540893555, -0.00040149688720703125, 0.00018966197967529297, 0.0007808208465576172, 0.0013719797134399414, 0.0019631385803222656, 0.00255429744720459, 0.003145456314086914, 0.0037366151809692383, 0.0043277740478515625, 0.004918932914733887, 0.005510091781616211, 0.006101250648498535, 0.006692409515380859, 0.007283568382263184, 0.007874727249145508, 0.008465886116027832, 0.009057044982910156, 0.00964820384979248, 0.010239362716674805, 0.010830521583557129, 0.011421680450439453, 0.012012839317321777, 0.012603998184204102, 0.013195157051086426, 0.01378631591796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 26.0, 74.0, 252.0, 1777.0, 4190838.0, 1133.0, 121.0, 34.0, 15.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8851165771484375, -1.845428466796875, -1.8057403564453125, -1.76605224609375, -1.7263641357421875, -1.686676025390625, -1.6469879150390625, -1.6072998046875, -1.5676116943359375, -1.527923583984375, -1.4882354736328125, -1.44854736328125, -1.4088592529296875, -1.369171142578125, -1.3294830322265625, -1.289794921875, -1.2501068115234375, -1.210418701171875, -1.1707305908203125, -1.13104248046875, -1.0913543701171875, -1.051666259765625, -1.0119781494140625, -0.9722900390625, -0.9326019287109375, -0.892913818359375, -0.8532257080078125, -0.81353759765625, -0.7738494873046875, -0.734161376953125, -0.6944732666015625, -0.65478515625, -0.6150970458984375, -0.575408935546875, -0.5357208251953125, -0.49603271484375, -0.4563446044921875, -0.416656494140625, -0.3769683837890625, -0.3372802734375, -0.2975921630859375, -0.257904052734375, -0.2182159423828125, -0.17852783203125, -0.1388397216796875, -0.099151611328125, -0.0594635009765625, -0.019775390625, 0.0199127197265625, 0.059600830078125, 0.0992889404296875, 0.13897705078125, 0.1786651611328125, 0.218353271484375, 0.2580413818359375, 0.2977294921875, 0.3374176025390625, 0.377105712890625, 0.4167938232421875, 0.45648193359375, 0.4961700439453125, 0.535858154296875, 0.5755462646484375, 0.615234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 75.0, 520.0, 3243.0, 177.0, 27.0, 11.0, 6.0, 5.0, 2.0], "bins": [-0.1739501953125, -0.1709139347076416, -0.1678776741027832, -0.1648414134979248, -0.1618051528930664, -0.158768892288208, -0.1557326316833496, -0.1526963710784912, -0.1496601104736328, -0.14662384986877441, -0.14358758926391602, -0.14055132865905762, -0.13751506805419922, -0.13447880744934082, -0.13144254684448242, -0.12840628623962402, -0.12537002563476562, -0.12233376502990723, -0.11929750442504883, -0.11626124382019043, -0.11322498321533203, -0.11018872261047363, -0.10715246200561523, -0.10411620140075684, -0.10107994079589844, -0.09804368019104004, -0.09500741958618164, -0.09197115898132324, -0.08893489837646484, -0.08589863777160645, -0.08286237716674805, -0.07982611656188965, -0.07678985595703125, -0.07375359535217285, -0.07071733474731445, -0.06768107414245605, -0.06464481353759766, -0.06160855293273926, -0.05857229232788086, -0.05553603172302246, -0.05249977111816406, -0.049463510513305664, -0.046427249908447266, -0.04339098930358887, -0.04035472869873047, -0.03731846809387207, -0.03428220748901367, -0.031245946884155273, -0.028209686279296875, -0.025173425674438477, -0.022137165069580078, -0.01910090446472168, -0.01606464385986328, -0.013028383255004883, -0.009992122650146484, -0.006955862045288086, -0.0039196014404296875, -0.0008833408355712891, 0.0021529197692871094, 0.005189180374145508, 0.008225440979003906, 0.011261701583862305, 0.014297962188720703, 0.0173342227935791, 0.0203704833984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 92.0, 733.0, 140.0, 19.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0652590990066528, -1.0414105653762817, -1.0175621509552002, -0.9937136173248291, -0.969865083694458, -0.9460166096687317, -0.9221681356430054, -0.8983196020126343, -0.8744710683822632, -0.8506225943565369, -0.8267740607261658, -0.8029255867004395, -0.7790770530700684, -0.755228579044342, -0.7313801050186157, -0.7075315713882446, -0.6836830973625183, -0.659834623336792, -0.6359860897064209, -0.6121376156806946, -0.5882890820503235, -0.5644406080245972, -0.5405920743942261, -0.5167436003684998, -0.49289509654045105, -0.46904659271240234, -0.44519808888435364, -0.42134958505630493, -0.3975011110305786, -0.3736525774002075, -0.3498041033744812, -0.3259555995464325, -0.3021070957183838, -0.2782585918903351, -0.2544100880622864, -0.23056159913539886, -0.20671309530735016, -0.18286459147930145, -0.15901610255241394, -0.13516759872436523, -0.11131909489631653, -0.08747059106826782, -0.06362209469079971, -0.039773598313331604, -0.015925094485282898, 0.007923409342765808, 0.03177189826965332, 0.055620402097702026, 0.07946890592575073, 0.10331740975379944, 0.12716591358184814, 0.15101440250873566, 0.17486290633678436, 0.19871141016483307, 0.22255989909172058, 0.2464084029197693, 0.270256906747818, 0.2941054105758667, 0.3179539144039154, 0.3418024182319641, 0.36565089225769043, 0.3894994258880615, 0.41334789991378784, 0.43719640374183655, 0.46104490756988525]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 12.0, 16.0, 31.0, 43.0, 82.0, 84.0, 106.0, 132.0, 125.0, 121.0, 73.0, 63.0, 46.0, 25.0, 17.0, 13.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3769615888595581, -0.3662453293800354, -0.3555290699005127, -0.34481281042099, -0.3340965807437897, -0.32338032126426697, -0.31266406178474426, -0.30194780230522156, -0.29123157262802124, -0.28051531314849854, -0.26979905366897583, -0.2590827941894531, -0.2483665645122528, -0.2376503050327301, -0.2269340455532074, -0.2162177860736847, -0.205501526594162, -0.19478526711463928, -0.18406902253627777, -0.17335276305675507, -0.16263651847839355, -0.15192025899887085, -0.14120399951934814, -0.13048774003982544, -0.11977149546146393, -0.10905524343252182, -0.09833899140357971, -0.087622731924057, -0.0769064798951149, -0.06619022786617279, -0.055473968386650085, -0.04475771635770798, -0.03404146432876587, -0.023325210437178612, -0.012608956545591354, -0.0018927007913589478, 0.00882355123758316, 0.01953980326652527, 0.030256062746047974, 0.04097231477499008, 0.05168856680393219, 0.0624048188328743, 0.0731210708618164, 0.08383733034133911, 0.09455358237028122, 0.10526983439922333, 0.11598609387874603, 0.12670233845710754, 0.13741859793663025, 0.14813485741615295, 0.15885110199451447, 0.16956736147403717, 0.18028360605239868, 0.1909998655319214, 0.2017161250114441, 0.2124323844909668, 0.2231486290693283, 0.233864888548851, 0.24458113312721252, 0.25529739260673523, 0.26601365208625793, 0.27672988176345825, 0.28744614124298096, 0.29816240072250366, 0.30887866020202637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 8.0, 23.0, 21.0, 35.0, 47.0, 63.0, 109.0, 155.0, 238.0, 356.0, 754.0, 1685.0, 4975.0, 20497.0, 146978.0, 736978.0, 111053.0, 17023.0, 4320.0, 1461.0, 657.0, 364.0, 193.0, 150.0, 102.0, 77.0, 47.0, 36.0, 36.0, 26.0, 15.0, 12.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 5.0], "bins": [-0.1190185546875, -0.11607551574707031, -0.11313247680664062, -0.11018943786621094, -0.10724639892578125, -0.10430335998535156, -0.10136032104492188, -0.09841728210449219, -0.0954742431640625, -0.09253120422363281, -0.08958816528320312, -0.08664512634277344, -0.08370208740234375, -0.08075904846191406, -0.07781600952148438, -0.07487297058105469, -0.071929931640625, -0.06898689270019531, -0.06604385375976562, -0.06310081481933594, -0.06015777587890625, -0.05721473693847656, -0.054271697998046875, -0.05132865905761719, -0.0483856201171875, -0.04544258117675781, -0.042499542236328125, -0.03955650329589844, -0.03661346435546875, -0.03367042541503906, -0.030727386474609375, -0.027784347534179688, -0.02484130859375, -0.021898269653320312, -0.018955230712890625, -0.016012191772460938, -0.01306915283203125, -0.010126113891601562, -0.007183074951171875, -0.0042400360107421875, -0.0012969970703125, 0.0016460418701171875, 0.004589080810546875, 0.0075321197509765625, 0.01047515869140625, 0.013418197631835938, 0.016361236572265625, 0.019304275512695312, 0.022247314453125, 0.025190353393554688, 0.028133392333984375, 0.031076431274414062, 0.03401947021484375, 0.03696250915527344, 0.039905548095703125, 0.04284858703613281, 0.0457916259765625, 0.04873466491699219, 0.051677703857421875, 0.05462074279785156, 0.05756378173828125, 0.06050682067871094, 0.06344985961914062, 0.06639289855957031, 0.0693359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 17.0, 30.0, 62.0, 64.0, 84.0, 104.0, 135.0, 123.0, 98.0, 88.0, 72.0, 43.0, 32.0, 14.0, 10.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031707763671875, -0.030848264694213867, -0.029988765716552734, -0.0291292667388916, -0.02826976776123047, -0.027410268783569336, -0.026550769805908203, -0.02569127082824707, -0.024831771850585938, -0.023972272872924805, -0.023112773895263672, -0.02225327491760254, -0.021393775939941406, -0.020534276962280273, -0.01967477798461914, -0.018815279006958008, -0.017955780029296875, -0.017096281051635742, -0.01623678207397461, -0.015377283096313477, -0.014517784118652344, -0.013658285140991211, -0.012798786163330078, -0.011939287185668945, -0.011079788208007812, -0.01022028923034668, -0.009360790252685547, -0.008501291275024414, -0.007641792297363281, -0.0067822933197021484, -0.005922794342041016, -0.005063295364379883, -0.00420379638671875, -0.003344297409057617, -0.0024847984313964844, -0.0016252994537353516, -0.0007658004760742188, 9.369850158691406e-05, 0.0009531974792480469, 0.0018126964569091797, 0.0026721954345703125, 0.0035316944122314453, 0.004391193389892578, 0.005250692367553711, 0.006110191345214844, 0.0069696903228759766, 0.00782918930053711, 0.008688688278198242, 0.009548187255859375, 0.010407686233520508, 0.01126718521118164, 0.012126684188842773, 0.012986183166503906, 0.013845682144165039, 0.014705181121826172, 0.015564680099487305, 0.016424179077148438, 0.01728367805480957, 0.018143177032470703, 0.019002676010131836, 0.01986217498779297, 0.0207216739654541, 0.021581172943115234, 0.022440671920776367, 0.0233001708984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 13.0, 8.0, 11.0, 9.0, 12.0, 17.0, 31.0, 50.0, 69.0, 118.0, 238.0, 636.0, 2028.0, 11841.0, 250890.0, 748875.0, 28451.0, 3580.0, 895.0, 323.0, 172.0, 90.0, 54.0, 39.0, 25.0, 21.0, 13.0, 13.0, 5.0, 5.0, 6.0, 1.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09295654296875, -0.08965778350830078, -0.08635902404785156, -0.08306026458740234, -0.07976150512695312, -0.0764627456665039, -0.07316398620605469, -0.06986522674560547, -0.06656646728515625, -0.06326770782470703, -0.05996894836425781, -0.056670188903808594, -0.053371429443359375, -0.050072669982910156, -0.04677391052246094, -0.04347515106201172, -0.0401763916015625, -0.03687763214111328, -0.03357887268066406, -0.030280113220214844, -0.026981353759765625, -0.023682594299316406, -0.020383834838867188, -0.01708507537841797, -0.01378631591796875, -0.010487556457519531, -0.0071887969970703125, -0.0038900375366210938, -0.000591278076171875, 0.0027074813842773438, 0.0060062408447265625, 0.009305000305175781, 0.012603759765625, 0.01590251922607422, 0.019201278686523438, 0.022500038146972656, 0.025798797607421875, 0.029097557067871094, 0.03239631652832031, 0.03569507598876953, 0.03899383544921875, 0.04229259490966797, 0.04559135437011719, 0.048890113830566406, 0.052188873291015625, 0.055487632751464844, 0.05878639221191406, 0.06208515167236328, 0.0653839111328125, 0.06868267059326172, 0.07198143005371094, 0.07528018951416016, 0.07857894897460938, 0.0818777084350586, 0.08517646789550781, 0.08847522735595703, 0.09177398681640625, 0.09507274627685547, 0.09837150573730469, 0.1016702651977539, 0.10496902465820312, 0.10826778411865234, 0.11156654357910156, 0.11486530303955078, 0.1181640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 13.0, 8.0, 5.0, 4.0, 22.0, 25.0, 26.0, 32.0, 34.0, 53.0, 48.0, 78.0, 73.0, 78.0, 60.0, 65.0, 56.0, 42.0, 55.0, 37.0, 37.0, 29.0, 21.0, 18.0, 11.0, 16.0, 9.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0604248046875, -0.058467864990234375, -0.05651092529296875, -0.054553985595703125, -0.0525970458984375, -0.050640106201171875, -0.04868316650390625, -0.046726226806640625, -0.044769287109375, -0.042812347412109375, -0.04085540771484375, -0.038898468017578125, -0.0369415283203125, -0.034984588623046875, -0.03302764892578125, -0.031070709228515625, -0.02911376953125, -0.027156829833984375, -0.02519989013671875, -0.023242950439453125, -0.0212860107421875, -0.019329071044921875, -0.01737213134765625, -0.015415191650390625, -0.013458251953125, -0.011501312255859375, -0.00954437255859375, -0.007587432861328125, -0.0056304931640625, -0.003673553466796875, -0.00171661376953125, 0.000240325927734375, 0.002197265625, 0.004154205322265625, 0.00611114501953125, 0.008068084716796875, 0.0100250244140625, 0.011981964111328125, 0.01393890380859375, 0.015895843505859375, 0.017852783203125, 0.019809722900390625, 0.02176666259765625, 0.023723602294921875, 0.0256805419921875, 0.027637481689453125, 0.02959442138671875, 0.031551361083984375, 0.03350830078125, 0.035465240478515625, 0.03742218017578125, 0.039379119873046875, 0.0413360595703125, 0.043292999267578125, 0.04524993896484375, 0.047206878662109375, 0.049163818359375, 0.051120758056640625, 0.05307769775390625, 0.055034637451171875, 0.0569915771484375, 0.058948516845703125, 0.06090545654296875, 0.06286239624023438, 0.0648193359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 11.0, 9.0, 21.0, 18.0, 32.0, 31.0, 63.0, 113.0, 242.0, 511.0, 1315.0, 3959.0, 19563.0, 437584.0, 554420.0, 23698.0, 4371.0, 1366.0, 584.0, 278.0, 116.0, 66.0, 42.0, 31.0, 26.0, 15.0, 7.0, 5.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.03444337844848633, -0.033333778381347656, -0.032224178314208984, -0.031114578247070312, -0.03000497817993164, -0.02889537811279297, -0.027785778045654297, -0.026676177978515625, -0.025566577911376953, -0.02445697784423828, -0.02334737777709961, -0.022237777709960938, -0.021128177642822266, -0.020018577575683594, -0.018908977508544922, -0.01779937744140625, -0.016689777374267578, -0.015580177307128906, -0.014470577239990234, -0.013360977172851562, -0.01225137710571289, -0.011141777038574219, -0.010032176971435547, -0.008922576904296875, -0.007812976837158203, -0.006703376770019531, -0.005593776702880859, -0.0044841766357421875, -0.0033745765686035156, -0.0022649765014648438, -0.0011553764343261719, -4.57763671875e-05, 0.0010638236999511719, 0.0021734237670898438, 0.0032830238342285156, 0.0043926239013671875, 0.005502223968505859, 0.006611824035644531, 0.007721424102783203, 0.008831024169921875, 0.009940624237060547, 0.011050224304199219, 0.01215982437133789, 0.013269424438476562, 0.014379024505615234, 0.015488624572753906, 0.016598224639892578, 0.01770782470703125, 0.018817424774169922, 0.019927024841308594, 0.021036624908447266, 0.022146224975585938, 0.02325582504272461, 0.02436542510986328, 0.025475025177001953, 0.026584625244140625, 0.027694225311279297, 0.02880382537841797, 0.02991342544555664, 0.031023025512695312, 0.032132625579833984, 0.033242225646972656, 0.03435182571411133, 0.03546142578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 9.0, 5.0, 8.0, 17.0, 21.0, 45.0, 74.0, 153.0, 244.0, 185.0, 119.0, 57.0, 30.0, 11.0, 11.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013363361358642578, -0.0001286473125219345, -0.00012366101145744324, -0.00011867471039295197, -0.0001136884093284607, -0.00010870210826396942, -0.00010371580719947815, -9.872950613498688e-05, -9.37432050704956e-05, -8.875690400600433e-05, -8.377060294151306e-05, -7.878430187702179e-05, -7.379800081253052e-05, -6.881169974803925e-05, -6.382539868354797e-05, -5.88390976190567e-05, -5.385279655456543e-05, -4.886649549007416e-05, -4.3880194425582886e-05, -3.8893893361091614e-05, -3.390759229660034e-05, -2.892129123210907e-05, -2.3934990167617798e-05, -1.8948689103126526e-05, -1.3962388038635254e-05, -8.976086974143982e-06, -3.98978590965271e-06, 9.96515154838562e-07, 5.982816219329834e-06, 1.0969117283821106e-05, 1.5955418348312378e-05, 2.094171941280365e-05, 2.5928020477294922e-05, 3.0914321541786194e-05, 3.5900622606277466e-05, 4.088692367076874e-05, 4.587322473526001e-05, 5.085952579975128e-05, 5.5845826864242554e-05, 6.0832127928733826e-05, 6.58184289932251e-05, 7.080473005771637e-05, 7.579103112220764e-05, 8.077733218669891e-05, 8.576363325119019e-05, 9.074993431568146e-05, 9.573623538017273e-05, 0.000100722536444664, 0.00010570883750915527, 0.00011069513857364655, 0.00011568143963813782, 0.00012066774070262909, 0.00012565404176712036, 0.00013064034283161163, 0.0001356266438961029, 0.00014061294496059418, 0.00014559924602508545, 0.00015058554708957672, 0.000155571848154068, 0.00016055814921855927, 0.00016554445028305054, 0.0001705307513475418, 0.00017551705241203308, 0.00018050335347652435, 0.00018548965454101562]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 8.0, 11.0, 12.0, 26.0, 35.0, 56.0, 89.0, 194.0, 416.0, 1239.0, 8454.0, 302121.0, 717642.0, 15434.0, 1857.0, 489.0, 199.0, 103.0, 50.0, 42.0, 24.0, 16.0, 14.0, 7.0, 2.0, 5.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051422119140625, -0.049820899963378906, -0.04821968078613281, -0.04661846160888672, -0.045017242431640625, -0.04341602325439453, -0.04181480407714844, -0.040213584899902344, -0.03861236572265625, -0.037011146545410156, -0.03540992736816406, -0.03380870819091797, -0.032207489013671875, -0.03060626983642578, -0.029005050659179688, -0.027403831481933594, -0.0258026123046875, -0.024201393127441406, -0.022600173950195312, -0.02099895477294922, -0.019397735595703125, -0.01779651641845703, -0.016195297241210938, -0.014594078063964844, -0.01299285888671875, -0.011391639709472656, -0.009790420532226562, -0.008189201354980469, -0.006587982177734375, -0.004986763000488281, -0.0033855438232421875, -0.0017843246459960938, -0.00018310546875, 0.0014181137084960938, 0.0030193328857421875, 0.004620552062988281, 0.006221771240234375, 0.007822990417480469, 0.009424209594726562, 0.011025428771972656, 0.01262664794921875, 0.014227867126464844, 0.015829086303710938, 0.01743030548095703, 0.019031524658203125, 0.02063274383544922, 0.022233963012695312, 0.023835182189941406, 0.0254364013671875, 0.027037620544433594, 0.028638839721679688, 0.03024005889892578, 0.031841278076171875, 0.03344249725341797, 0.03504371643066406, 0.036644935607910156, 0.03824615478515625, 0.039847373962402344, 0.04144859313964844, 0.04304981231689453, 0.044651031494140625, 0.04625225067138672, 0.04785346984863281, 0.049454689025878906, 0.051055908203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 16.0, 13.0, 21.0, 35.0, 82.0, 80.0, 136.0, 176.0, 179.0, 105.0, 51.0, 32.0, 21.0, 16.0, 10.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037811279296875, -0.036685943603515625, -0.03556060791015625, -0.034435272216796875, -0.0333099365234375, -0.032184600830078125, -0.03105926513671875, -0.029933929443359375, -0.02880859375, -0.027683258056640625, -0.02655792236328125, -0.025432586669921875, -0.0243072509765625, -0.023181915283203125, -0.02205657958984375, -0.020931243896484375, -0.019805908203125, -0.018680572509765625, -0.01755523681640625, -0.016429901123046875, -0.0153045654296875, -0.014179229736328125, -0.01305389404296875, -0.011928558349609375, -0.01080322265625, -0.009677886962890625, -0.00855255126953125, -0.007427215576171875, -0.0063018798828125, -0.005176544189453125, -0.00405120849609375, -0.002925872802734375, -0.001800537109375, -0.000675201416015625, 0.00045013427734375, 0.001575469970703125, 0.0027008056640625, 0.003826141357421875, 0.00495147705078125, 0.006076812744140625, 0.0072021484375, 0.008327484130859375, 0.00945281982421875, 0.010578155517578125, 0.0117034912109375, 0.012828826904296875, 0.01395416259765625, 0.015079498291015625, 0.016204833984375, 0.017330169677734375, 0.01845550537109375, 0.019580841064453125, 0.0207061767578125, 0.021831512451171875, 0.02295684814453125, 0.024082183837890625, 0.02520751953125, 0.026332855224609375, 0.02745819091796875, 0.028583526611328125, 0.0297088623046875, 0.030834197998046875, 0.03195953369140625, 0.033084869384765625, 0.034210205078125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 11.0, 44.0, 244.0, 491.0, 163.0, 32.0, 11.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6486761569976807, -0.6230819225311279, -0.5974876880645752, -0.5718934535980225, -0.5462992191314697, -0.520704984664917, -0.49511075019836426, -0.4695165157318115, -0.4439222812652588, -0.41832804679870605, -0.3927338123321533, -0.3671395778656006, -0.34154534339904785, -0.3159511089324951, -0.2903568744659424, -0.26476263999938965, -0.23916837573051453, -0.2135741412639618, -0.18797990679740906, -0.16238567233085632, -0.1367914378643036, -0.11119718849658966, -0.08560295403003693, -0.06000871956348419, -0.03441448509693146, -0.008820248767733574, 0.01677398756146431, 0.04236822575330734, 0.06796246021986008, 0.09355670213699341, 0.11915093660354614, 0.14474517107009888, 0.1703394055366516, 0.19593364000320435, 0.22152787446975708, 0.24712210893630981, 0.27271634340286255, 0.2983105778694153, 0.323904812335968, 0.34949904680252075, 0.3750932812690735, 0.4006875157356262, 0.42628175020217896, 0.4518759846687317, 0.4774702191352844, 0.5030644536018372, 0.5286586880683899, 0.5542529225349426, 0.5798472166061401, 0.6054414510726929, 0.6310356855392456, 0.6566299200057983, 0.6822241544723511, 0.7078183889389038, 0.7334126234054565, 0.7590068578720093, 0.784601092338562, 0.8101953268051147, 0.8357895612716675, 0.8613837957382202, 0.886978030204773, 0.9125722646713257, 0.9381664991378784, 0.9637607336044312, 0.9893549680709839]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 8.0, 3.0, 10.0, 7.0, 12.0, 18.0, 20.0, 22.0, 21.0, 32.0, 41.0, 50.0, 41.0, 54.0, 56.0, 62.0, 63.0, 62.0, 56.0, 46.0, 36.0, 57.0, 31.0, 39.0, 29.0, 26.0, 20.0, 14.0, 16.0, 12.0, 3.0, 11.0, 8.0, 6.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.36685633659362793, -0.35721081495285034, -0.34756529331207275, -0.33791977167129517, -0.3282742500305176, -0.31862872838974, -0.3089832067489624, -0.2993376553058624, -0.28969213366508484, -0.28004661202430725, -0.27040109038352966, -0.2607555687427521, -0.2511100471019745, -0.2414645105600357, -0.23181898891925812, -0.22217345237731934, -0.21252794563770294, -0.20288242399692535, -0.19323690235614777, -0.18359136581420898, -0.1739458441734314, -0.1643003225326538, -0.15465480089187622, -0.14500927925109863, -0.13536375761032104, -0.12571823596954346, -0.11607270687818527, -0.10642718523740768, -0.0967816561460495, -0.08713613450527191, -0.07749061286449432, -0.06784508377313614, -0.058199554681777954, -0.04855402931571007, -0.03890850394964218, -0.029262982308864594, -0.019617456942796707, -0.00997193157672882, -0.0003264099359512329, 0.009319119155406952, 0.01896464079618454, 0.028610166162252426, 0.03825569152832031, 0.0479012131690979, 0.05754673853516579, 0.06719226390123367, 0.07683778554201126, 0.08648331463336945, 0.09612883627414703, 0.10577435791492462, 0.1154198870062828, 0.125065416097641, 0.13471093773841858, 0.14435645937919617, 0.15400198101997375, 0.16364750266075134, 0.17329302430152893, 0.18293854594230652, 0.1925840675830841, 0.2022295892238617, 0.21187512576580048, 0.22152064740657806, 0.23116616904735565, 0.24081170558929443, 0.250457227230072]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 10.0, 10.0, 19.0, 18.0, 39.0, 56.0, 58.0, 91.0, 132.0, 215.0, 373.0, 706.0, 1682.0, 4847.0, 23899.0, 871070.0, 3250987.0, 32040.0, 5352.0, 1527.0, 570.0, 266.0, 145.0, 58.0, 31.0, 18.0, 11.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1861572265625, -0.1819324493408203, -0.17770767211914062, -0.17348289489746094, -0.16925811767578125, -0.16503334045410156, -0.16080856323242188, -0.1565837860107422, -0.1523590087890625, -0.1481342315673828, -0.14390945434570312, -0.13968467712402344, -0.13545989990234375, -0.13123512268066406, -0.12701034545898438, -0.12278556823730469, -0.118560791015625, -0.11433601379394531, -0.11011123657226562, -0.10588645935058594, -0.10166168212890625, -0.09743690490722656, -0.09321212768554688, -0.08898735046386719, -0.0847625732421875, -0.08053779602050781, -0.07631301879882812, -0.07208824157714844, -0.06786346435546875, -0.06363868713378906, -0.059413909912109375, -0.05518913269042969, -0.05096435546875, -0.04673957824707031, -0.042514801025390625, -0.03829002380371094, -0.03406524658203125, -0.029840469360351562, -0.025615692138671875, -0.021390914916992188, -0.0171661376953125, -0.012941360473632812, -0.008716583251953125, -0.0044918060302734375, -0.00026702880859375, 0.0039577484130859375, 0.008182525634765625, 0.012407302856445312, 0.016632080078125, 0.020856857299804688, 0.025081634521484375, 0.029306411743164062, 0.03353118896484375, 0.03775596618652344, 0.041980743408203125, 0.04620552062988281, 0.0504302978515625, 0.05465507507324219, 0.058879852294921875, 0.06310462951660156, 0.06732940673828125, 0.07155418395996094, 0.07577896118164062, 0.08000373840332031, 0.084228515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 7.0, 9.0, 18.0, 39.0, 43.0, 52.0, 70.0, 105.0, 80.0, 104.0, 103.0, 81.0, 84.0, 66.0, 32.0, 42.0, 24.0, 15.0, 12.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02783203125, -0.027129650115966797, -0.026427268981933594, -0.02572488784790039, -0.025022506713867188, -0.024320125579833984, -0.02361774444580078, -0.022915363311767578, -0.022212982177734375, -0.021510601043701172, -0.02080821990966797, -0.020105838775634766, -0.019403457641601562, -0.01870107650756836, -0.017998695373535156, -0.017296314239501953, -0.01659393310546875, -0.015891551971435547, -0.015189170837402344, -0.01448678970336914, -0.013784408569335938, -0.013082027435302734, -0.012379646301269531, -0.011677265167236328, -0.010974884033203125, -0.010272502899169922, -0.009570121765136719, -0.008867740631103516, -0.008165359497070312, -0.007462978363037109, -0.006760597229003906, -0.006058216094970703, -0.0053558349609375, -0.004653453826904297, -0.003951072692871094, -0.0032486915588378906, -0.0025463104248046875, -0.0018439292907714844, -0.0011415481567382812, -0.0004391670227050781, 0.000263214111328125, 0.0009655952453613281, 0.0016679763793945312, 0.0023703575134277344, 0.0030727386474609375, 0.0037751197814941406, 0.004477500915527344, 0.005179882049560547, 0.00588226318359375, 0.006584644317626953, 0.007287025451660156, 0.00798940658569336, 0.008691787719726562, 0.009394168853759766, 0.010096549987792969, 0.010798931121826172, 0.011501312255859375, 0.012203693389892578, 0.012906074523925781, 0.013608455657958984, 0.014310836791992188, 0.01501321792602539, 0.015715599060058594, 0.016417980194091797, 0.017120361328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 14.0, 24.0, 45.0, 78.0, 195.0, 857.0, 4190736.0, 1761.0, 257.0, 120.0, 78.0, 54.0, 25.0, 22.0, 4.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.48146820068359375, -0.4556121826171875, -0.42975616455078125, -0.403900146484375, -0.37804412841796875, -0.3521881103515625, -0.32633209228515625, -0.30047607421875, -0.27462005615234375, -0.2487640380859375, -0.22290802001953125, -0.197052001953125, -0.17119598388671875, -0.1453399658203125, -0.11948394775390625, -0.0936279296875, -0.06777191162109375, -0.0419158935546875, -0.01605987548828125, 0.009796142578125, 0.03565216064453125, 0.0615081787109375, 0.08736419677734375, 0.11322021484375, 0.13907623291015625, 0.1649322509765625, 0.19078826904296875, 0.216644287109375, 0.24250030517578125, 0.2683563232421875, 0.29421234130859375, 0.320068359375, 0.34592437744140625, 0.3717803955078125, 0.39763641357421875, 0.423492431640625, 0.44934844970703125, 0.4752044677734375, 0.5010604858398438, 0.52691650390625, 0.5527725219726562, 0.5786285400390625, 0.6044845581054688, 0.630340576171875, 0.6561965942382812, 0.6820526123046875, 0.7079086303710938, 0.7337646484375, 0.7596206665039062, 0.7854766845703125, 0.8113327026367188, 0.837188720703125, 0.8630447387695312, 0.8889007568359375, 0.9147567749023438, 0.94061279296875, 0.9664688110351562, 0.9923248291015625, 1.0181808471679688, 1.044036865234375, 1.0698928833007812, 1.0957489013671875, 1.1216049194335938, 1.1474609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 19.0, 377.0, 3581.0, 89.0, 14.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07413005828857422, -0.07007408142089844, -0.06601810455322266, -0.061962127685546875, -0.057906150817871094, -0.05385017395019531, -0.04979419708251953, -0.04573822021484375, -0.04168224334716797, -0.03762626647949219, -0.033570289611816406, -0.029514312744140625, -0.025458335876464844, -0.021402359008789062, -0.01734638214111328, -0.0132904052734375, -0.009234428405761719, -0.0051784515380859375, -0.0011224746704101562, 0.002933502197265625, 0.006989479064941406, 0.011045455932617188, 0.015101432800292969, 0.01915740966796875, 0.02321338653564453, 0.027269363403320312, 0.031325340270996094, 0.035381317138671875, 0.039437294006347656, 0.04349327087402344, 0.04754924774169922, 0.051605224609375, 0.05566120147705078, 0.05971717834472656, 0.06377315521240234, 0.06782913208007812, 0.0718851089477539, 0.07594108581542969, 0.07999706268310547, 0.08405303955078125, 0.08810901641845703, 0.09216499328613281, 0.0962209701538086, 0.10027694702148438, 0.10433292388916016, 0.10838890075683594, 0.11244487762451172, 0.1165008544921875, 0.12055683135986328, 0.12461280822753906, 0.12866878509521484, 0.13272476196289062, 0.1367807388305664, 0.1408367156982422, 0.14489269256591797, 0.14894866943359375, 0.15300464630126953, 0.1570606231689453, 0.1611166000366211, 0.16517257690429688, 0.16922855377197266, 0.17328453063964844, 0.17734050750732422, 0.181396484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 57.0, 930.0, 15.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2481105327606201, -1.2117807865142822, -1.1754511594772339, -1.139121413230896, -1.1027917861938477, -1.0664620399475098, -1.0301324129104614, -0.9938026666641235, -0.9574729800224304, -0.9211432933807373, -0.8848136067390442, -0.8484839200973511, -0.8121541738510132, -0.7758245468139648, -0.739494800567627, -0.7031651139259338, -0.6668354272842407, -0.6305057406425476, -0.5941760540008545, -0.5578463673591614, -0.5215166807174683, -0.48518696427345276, -0.44885724782943726, -0.41252756118774414, -0.376197874546051, -0.3398681879043579, -0.3035385012626648, -0.2672087848186493, -0.23087909817695618, -0.19454941153526306, -0.15821970999240875, -0.12189000844955444, -0.08556032180786133, -0.049230627715587616, -0.012900933623313904, 0.02342876046895981, 0.05975845456123352, 0.09608814120292664, 0.13241784274578094, 0.16874754428863525, 0.20507723093032837, 0.24140691757202148, 0.2777366042137146, 0.3140663206577301, 0.3503960072994232, 0.38672569394111633, 0.42305541038513184, 0.45938509702682495, 0.49571478366851807, 0.5320444703102112, 0.5683741569519043, 0.6047038435935974, 0.6410335302352905, 0.6773632764816284, 0.7136929631233215, 0.7500226497650146, 0.7863523364067078, 0.8226820230484009, 0.859011709690094, 0.8953413963317871, 0.931671142578125, 0.9680007696151733, 1.0043305158615112, 1.0406601428985596, 1.0769898891448975]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 33.0, 55.0, 82.0, 127.0, 186.0, 166.0, 141.0, 103.0, 56.0, 22.0, 9.0, 12.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31947869062423706, -0.31115612387657166, -0.30283358693122864, -0.29451102018356323, -0.2861884534358978, -0.2778659164905548, -0.2695433497428894, -0.261220782995224, -0.252898246049881, -0.24457569420337677, -0.23625312745571136, -0.22793057560920715, -0.21960802376270294, -0.21128547191619873, -0.20296290516853333, -0.1946403533220291, -0.1863177865743637, -0.1779952347278595, -0.1696726679801941, -0.16135011613368988, -0.15302756428718567, -0.14470499753952026, -0.13638244569301605, -0.12805989384651184, -0.11973733454942703, -0.11141477525234222, -0.10309222340583801, -0.0947696641087532, -0.0864471048116684, -0.07812455296516418, -0.06980199366807938, -0.061479438096284866, -0.053156882524490356, -0.04483432695269585, -0.03651177138090134, -0.02818921208381653, -0.01986665651202202, -0.011544100940227509, -0.0032215416431427, 0.00510101392865181, 0.01342356950044632, 0.02174612507224083, 0.03006868250668049, 0.03839123994112015, 0.04671379551291466, 0.05503635108470917, 0.06335891038179398, 0.07168146967887878, 0.080004021525383, 0.0883265808224678, 0.09664913266897202, 0.10497169196605682, 0.11329424381256104, 0.12161680310964584, 0.12993936240673065, 0.13826191425323486, 0.14658448100090027, 0.15490703284740448, 0.16322959959506989, 0.1715521514415741, 0.1798747032880783, 0.18819725513458252, 0.19651982188224792, 0.20484237372875214, 0.21316492557525635]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 5.0, 8.0, 17.0, 16.0, 25.0, 50.0, 57.0, 91.0, 195.0, 353.0, 712.0, 1671.0, 5402.0, 26673.0, 246046.0, 671447.0, 78602.0, 11975.0, 2976.0, 1064.0, 489.0, 267.0, 137.0, 97.0, 66.0, 47.0, 20.0, 12.0, 6.0, 10.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.066650390625, -0.06437301635742188, -0.06209564208984375, -0.059818267822265625, -0.0575408935546875, -0.055263519287109375, -0.05298614501953125, -0.050708770751953125, -0.048431396484375, -0.046154022216796875, -0.04387664794921875, -0.041599273681640625, -0.0393218994140625, -0.037044525146484375, -0.03476715087890625, -0.032489776611328125, -0.03021240234375, -0.027935028076171875, -0.02565765380859375, -0.023380279541015625, -0.0211029052734375, -0.018825531005859375, -0.01654815673828125, -0.014270782470703125, -0.011993408203125, -0.009716033935546875, -0.00743865966796875, -0.005161285400390625, -0.0028839111328125, -0.000606536865234375, 0.00167083740234375, 0.003948211669921875, 0.0062255859375, 0.008502960205078125, 0.01078033447265625, 0.013057708740234375, 0.0153350830078125, 0.017612457275390625, 0.01988983154296875, 0.022167205810546875, 0.024444580078125, 0.026721954345703125, 0.02899932861328125, 0.031276702880859375, 0.0335540771484375, 0.035831451416015625, 0.03810882568359375, 0.040386199951171875, 0.04266357421875, 0.044940948486328125, 0.04721832275390625, 0.049495697021484375, 0.0517730712890625, 0.054050445556640625, 0.05632781982421875, 0.058605194091796875, 0.060882568359375, 0.06315994262695312, 0.06543731689453125, 0.06771469116210938, 0.0699920654296875, 0.07226943969726562, 0.07454681396484375, 0.07682418823242188, 0.0791015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 6.0, 18.0, 22.0, 27.0, 35.0, 41.0, 52.0, 60.0, 81.0, 83.0, 81.0, 79.0, 79.0, 65.0, 62.0, 41.0, 45.0, 36.0, 17.0, 27.0, 14.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0207977294921875, -0.020245790481567383, -0.019693851470947266, -0.01914191246032715, -0.01858997344970703, -0.018038034439086914, -0.017486095428466797, -0.01693415641784668, -0.016382217407226562, -0.015830278396606445, -0.015278339385986328, -0.014726400375366211, -0.014174461364746094, -0.013622522354125977, -0.01307058334350586, -0.012518644332885742, -0.011966705322265625, -0.011414766311645508, -0.01086282730102539, -0.010310888290405273, -0.009758949279785156, -0.009207010269165039, -0.008655071258544922, -0.008103132247924805, -0.0075511932373046875, -0.00699925422668457, -0.006447315216064453, -0.005895376205444336, -0.005343437194824219, -0.0047914981842041016, -0.004239559173583984, -0.003687620162963867, -0.00313568115234375, -0.002583742141723633, -0.0020318031311035156, -0.0014798641204833984, -0.0009279251098632812, -0.00037598609924316406, 0.00017595291137695312, 0.0007278919219970703, 0.0012798309326171875, 0.0018317699432373047, 0.002383708953857422, 0.002935647964477539, 0.0034875869750976562, 0.0040395259857177734, 0.004591464996337891, 0.005143404006958008, 0.005695343017578125, 0.006247282028198242, 0.006799221038818359, 0.0073511600494384766, 0.007903099060058594, 0.008455038070678711, 0.009006977081298828, 0.009558916091918945, 0.010110855102539062, 0.01066279411315918, 0.011214733123779297, 0.011766672134399414, 0.012318611145019531, 0.012870550155639648, 0.013422489166259766, 0.013974428176879883, 0.0145263671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 13.0, 16.0, 18.0, 29.0, 27.0, 57.0, 102.0, 158.0, 361.0, 801.0, 2702.0, 15939.0, 416008.0, 586802.0, 20610.0, 3158.0, 914.0, 358.0, 164.0, 121.0, 63.0, 29.0, 23.0, 17.0, 16.0, 14.0, 1.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.11724853515625, -0.11424636840820312, -0.11124420166015625, -0.10824203491210938, -0.1052398681640625, -0.10223770141601562, -0.09923553466796875, -0.09623336791992188, -0.093231201171875, -0.09022903442382812, -0.08722686767578125, -0.08422470092773438, -0.0812225341796875, -0.07822036743164062, -0.07521820068359375, -0.07221603393554688, -0.0692138671875, -0.06621170043945312, -0.06320953369140625, -0.060207366943359375, -0.0572052001953125, -0.054203033447265625, -0.05120086669921875, -0.048198699951171875, -0.045196533203125, -0.042194366455078125, -0.03919219970703125, -0.036190032958984375, -0.0331878662109375, -0.030185699462890625, -0.02718353271484375, -0.024181365966796875, -0.02117919921875, -0.018177032470703125, -0.01517486572265625, -0.012172698974609375, -0.0091705322265625, -0.006168365478515625, -0.00316619873046875, -0.000164031982421875, 0.002838134765625, 0.005840301513671875, 0.00884246826171875, 0.011844635009765625, 0.0148468017578125, 0.017848968505859375, 0.02085113525390625, 0.023853302001953125, 0.02685546875, 0.029857635498046875, 0.03285980224609375, 0.035861968994140625, 0.0388641357421875, 0.041866302490234375, 0.04486846923828125, 0.047870635986328125, 0.050872802734375, 0.053874969482421875, 0.05687713623046875, 0.059879302978515625, 0.0628814697265625, 0.06588363647460938, 0.06888580322265625, 0.07188796997070312, 0.07489013671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 17.0, 17.0, 19.0, 23.0, 43.0, 56.0, 59.0, 60.0, 87.0, 69.0, 84.0, 73.0, 64.0, 61.0, 60.0, 38.0, 36.0, 27.0, 22.0, 16.0, 8.0, 13.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08001708984375, -0.07781362533569336, -0.07561016082763672, -0.07340669631958008, -0.07120323181152344, -0.0689997673034668, -0.06679630279541016, -0.06459283828735352, -0.062389373779296875, -0.060185909271240234, -0.057982444763183594, -0.05577898025512695, -0.05357551574707031, -0.05137205123901367, -0.04916858673095703, -0.04696512222290039, -0.04476165771484375, -0.04255819320678711, -0.04035472869873047, -0.03815126419067383, -0.03594779968261719, -0.03374433517456055, -0.031540870666503906, -0.029337406158447266, -0.027133941650390625, -0.024930477142333984, -0.022727012634277344, -0.020523548126220703, -0.018320083618164062, -0.016116619110107422, -0.013913154602050781, -0.01170969009399414, -0.0095062255859375, -0.007302761077880859, -0.005099296569824219, -0.002895832061767578, -0.0006923675537109375, 0.0015110969543457031, 0.0037145614624023438, 0.005918025970458984, 0.008121490478515625, 0.010324954986572266, 0.012528419494628906, 0.014731884002685547, 0.016935348510742188, 0.019138813018798828, 0.02134227752685547, 0.02354574203491211, 0.02574920654296875, 0.02795267105102539, 0.03015613555908203, 0.03235960006713867, 0.03456306457519531, 0.03676652908325195, 0.038969993591308594, 0.041173458099365234, 0.043376922607421875, 0.045580387115478516, 0.047783851623535156, 0.0499873161315918, 0.05219078063964844, 0.05439424514770508, 0.05659770965576172, 0.05880117416381836, 0.061004638671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 10.0, 5.0, 4.0, 8.0, 20.0, 30.0, 55.0, 115.0, 229.0, 438.0, 919.0, 2675.0, 12770.0, 220704.0, 757702.0, 44627.0, 5364.0, 1568.0, 659.0, 264.0, 150.0, 100.0, 50.0, 31.0, 17.0, 8.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164642333984375, -0.015651464462280273, -0.014838695526123047, -0.01402592658996582, -0.013213157653808594, -0.012400388717651367, -0.01158761978149414, -0.010774850845336914, -0.009962081909179688, -0.009149312973022461, -0.008336544036865234, -0.007523775100708008, -0.006711006164550781, -0.005898237228393555, -0.005085468292236328, -0.0042726993560791016, -0.003459930419921875, -0.0026471614837646484, -0.0018343925476074219, -0.0010216236114501953, -0.00020885467529296875, 0.0006039142608642578, 0.0014166831970214844, 0.002229452133178711, 0.0030422210693359375, 0.003854990005493164, 0.004667758941650391, 0.005480527877807617, 0.006293296813964844, 0.00710606575012207, 0.007918834686279297, 0.008731603622436523, 0.00954437255859375, 0.010357141494750977, 0.011169910430908203, 0.01198267936706543, 0.012795448303222656, 0.013608217239379883, 0.01442098617553711, 0.015233755111694336, 0.016046524047851562, 0.01685929298400879, 0.017672061920166016, 0.018484830856323242, 0.01929759979248047, 0.020110368728637695, 0.020923137664794922, 0.02173590660095215, 0.022548675537109375, 0.0233614444732666, 0.024174213409423828, 0.024986982345581055, 0.02579975128173828, 0.026612520217895508, 0.027425289154052734, 0.02823805809020996, 0.029050827026367188, 0.029863595962524414, 0.03067636489868164, 0.03148913383483887, 0.032301902770996094, 0.03311467170715332, 0.03392744064331055, 0.03474020957946777, 0.035552978515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 12.0, 3.0, 14.0, 22.0, 25.0, 31.0, 50.0, 64.0, 72.0, 119.0, 121.0, 131.0, 83.0, 74.0, 51.0, 38.0, 27.0, 19.0, 15.0, 10.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-05, -6.787478923797607e-05, -6.541609764099121e-05, -6.295740604400635e-05, -6.0498714447021484e-05, -5.804002285003662e-05, -5.558133125305176e-05, -5.3122639656066895e-05, -5.066394805908203e-05, -4.820525646209717e-05, -4.5746564865112305e-05, -4.328787326812744e-05, -4.082918167114258e-05, -3.8370490074157715e-05, -3.591179847717285e-05, -3.345310688018799e-05, -3.0994415283203125e-05, -2.8535723686218262e-05, -2.60770320892334e-05, -2.3618340492248535e-05, -2.1159648895263672e-05, -1.870095729827881e-05, -1.6242265701293945e-05, -1.3783574104309082e-05, -1.1324882507324219e-05, -8.866190910339355e-06, -6.407499313354492e-06, -3.948807716369629e-06, -1.4901161193847656e-06, 9.685754776000977e-07, 3.427267074584961e-06, 5.885958671569824e-06, 8.344650268554688e-06, 1.080334186553955e-05, 1.3262033462524414e-05, 1.5720725059509277e-05, 1.817941665649414e-05, 2.0638108253479004e-05, 2.3096799850463867e-05, 2.555549144744873e-05, 2.8014183044433594e-05, 3.0472874641418457e-05, 3.293156623840332e-05, 3.5390257835388184e-05, 3.784894943237305e-05, 4.030764102935791e-05, 4.2766332626342773e-05, 4.522502422332764e-05, 4.76837158203125e-05, 5.014240741729736e-05, 5.2601099014282227e-05, 5.505979061126709e-05, 5.751848220825195e-05, 5.9977173805236816e-05, 6.243586540222168e-05, 6.489455699920654e-05, 6.73532485961914e-05, 6.981194019317627e-05, 7.227063179016113e-05, 7.4729323387146e-05, 7.718801498413086e-05, 7.964670658111572e-05, 8.210539817810059e-05, 8.456408977508545e-05, 8.702278137207031e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 14.0, 25.0, 27.0, 50.0, 84.0, 187.0, 377.0, 1164.0, 4819.0, 76620.0, 907482.0, 51875.0, 4114.0, 975.0, 392.0, 160.0, 75.0, 44.0, 25.0, 18.0, 9.0, 4.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039306640625, -0.03822827339172363, -0.037149906158447266, -0.0360715389251709, -0.03499317169189453, -0.033914804458618164, -0.0328364372253418, -0.03175806999206543, -0.030679702758789062, -0.029601335525512695, -0.028522968292236328, -0.02744460105895996, -0.026366233825683594, -0.025287866592407227, -0.02420949935913086, -0.023131132125854492, -0.022052764892578125, -0.020974397659301758, -0.01989603042602539, -0.018817663192749023, -0.017739295959472656, -0.01666092872619629, -0.015582561492919922, -0.014504194259643555, -0.013425827026367188, -0.01234745979309082, -0.011269092559814453, -0.010190725326538086, -0.009112358093261719, -0.008033990859985352, -0.006955623626708984, -0.005877256393432617, -0.00479888916015625, -0.003720521926879883, -0.0026421546936035156, -0.0015637874603271484, -0.00048542022705078125, 0.0005929470062255859, 0.0016713142395019531, 0.0027496814727783203, 0.0038280487060546875, 0.004906415939331055, 0.005984783172607422, 0.007063150405883789, 0.008141517639160156, 0.009219884872436523, 0.01029825210571289, 0.011376619338989258, 0.012454986572265625, 0.013533353805541992, 0.01461172103881836, 0.015690088272094727, 0.016768455505371094, 0.01784682273864746, 0.018925189971923828, 0.020003557205200195, 0.021081924438476562, 0.02216029167175293, 0.023238658905029297, 0.024317026138305664, 0.02539539337158203, 0.0264737606048584, 0.027552127838134766, 0.028630495071411133, 0.0297088623046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 14.0, 18.0, 30.0, 59.0, 97.0, 129.0, 170.0, 151.0, 106.0, 80.0, 44.0, 41.0, 18.0, 16.0, 9.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.029632568359375, -0.02885293960571289, -0.02807331085205078, -0.027293682098388672, -0.026514053344726562, -0.025734424591064453, -0.024954795837402344, -0.024175167083740234, -0.023395538330078125, -0.022615909576416016, -0.021836280822753906, -0.021056652069091797, -0.020277023315429688, -0.019497394561767578, -0.01871776580810547, -0.01793813705444336, -0.01715850830078125, -0.01637887954711914, -0.015599250793457031, -0.014819622039794922, -0.014039993286132812, -0.013260364532470703, -0.012480735778808594, -0.011701107025146484, -0.010921478271484375, -0.010141849517822266, -0.009362220764160156, -0.008582592010498047, -0.0078029632568359375, -0.007023334503173828, -0.006243705749511719, -0.005464076995849609, -0.0046844482421875, -0.0039048194885253906, -0.0031251907348632812, -0.002345561981201172, -0.0015659332275390625, -0.0007863044738769531, -6.67572021484375e-06, 0.0007729530334472656, 0.001552581787109375, 0.0023322105407714844, 0.0031118392944335938, 0.003891468048095703, 0.0046710968017578125, 0.005450725555419922, 0.006230354309082031, 0.007009983062744141, 0.00778961181640625, 0.00856924057006836, 0.009348869323730469, 0.010128498077392578, 0.010908126831054688, 0.011687755584716797, 0.012467384338378906, 0.013247013092041016, 0.014026641845703125, 0.014806270599365234, 0.015585899353027344, 0.016365528106689453, 0.017145156860351562, 0.017924785614013672, 0.01870441436767578, 0.01948404312133789, 0.020263671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 16.0, 36.0, 148.0, 414.0, 279.0, 70.0, 23.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.119673252105713, -1.0980406999588013, -1.0764080286026, -1.0547754764556885, -1.0331428050994873, -1.0115102529525757, -0.9898776412010193, -0.9682450294494629, -0.9466124773025513, -0.9249798655509949, -0.9033472537994385, -0.8817147016525269, -0.8600820899009705, -0.8384494781494141, -0.8168168663978577, -0.7951842546463013, -0.7735516428947449, -0.7519190311431885, -0.7302864193916321, -0.7086538076400757, -0.6870212554931641, -0.6653886437416077, -0.6437560319900513, -0.6221234202384949, -0.6004908084869385, -0.5788581967353821, -0.5572255849838257, -0.5355930328369141, -0.5139604210853577, -0.49232780933380127, -0.4706951975822449, -0.4490625858306885, -0.42743003368377686, -0.40579742193222046, -0.38416483998298645, -0.36253222823143005, -0.34089964628219604, -0.31926703453063965, -0.29763442277908325, -0.27600181102752686, -0.25436922907829285, -0.23273663222789764, -0.21110403537750244, -0.18947142362594604, -0.16783882677555084, -0.14620622992515564, -0.12457361817359924, -0.10294102132320404, -0.08130842447280884, -0.05967582389712334, -0.038043223321437836, -0.016410619020462036, 0.0052219778299331665, 0.02685457468032837, 0.048487186431884766, 0.07011978328227997, 0.09175238013267517, 0.11338497698307037, 0.13501757383346558, 0.15665018558502197, 0.17828278243541718, 0.19991537928581238, 0.22154799103736877, 0.24318058788776398, 0.2648131847381592]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 11.0, 13.0, 8.0, 19.0, 19.0, 22.0, 34.0, 30.0, 31.0, 32.0, 42.0, 48.0, 43.0, 44.0, 48.0, 58.0, 50.0, 45.0, 47.0, 35.0, 42.0, 37.0, 33.0, 25.0, 24.0, 28.0, 23.0, 20.0, 13.0, 15.0, 7.0, 6.0, 10.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2805614471435547, -0.27219751477241516, -0.26383358240127563, -0.2554696500301361, -0.24710571765899658, -0.23874178528785706, -0.23037786781787872, -0.2220139354467392, -0.21365000307559967, -0.20528607070446014, -0.19692213833332062, -0.1885582059621811, -0.18019428849220276, -0.17183035612106323, -0.1634664237499237, -0.15510249137878418, -0.14673855900764465, -0.13837462663650513, -0.1300106942653656, -0.12164676934480667, -0.11328283697366714, -0.10491890460252762, -0.09655497968196869, -0.08819104731082916, -0.07982711493968964, -0.07146318256855011, -0.06309925019741058, -0.054735325276851654, -0.04637139290571213, -0.0380074605345726, -0.029643531888723373, -0.021279603242874146, -0.01291567087173462, -0.004551740363240242, 0.003812190145254135, 0.012176120653748512, 0.02054005116224289, 0.028903983533382416, 0.037267912179231644, 0.04563184082508087, 0.0539957731962204, 0.062359705567359924, 0.07072363793849945, 0.07908756285905838, 0.0874514952301979, 0.09581542760133743, 0.10417935252189636, 0.11254328489303589, 0.12090721726417542, 0.12927114963531494, 0.13763508200645447, 0.145999014377594, 0.15436294674873352, 0.16272687911987305, 0.17109079658985138, 0.1794547289609909, 0.18781866133213043, 0.19618259370326996, 0.20454652607440948, 0.212910458445549, 0.22127437591552734, 0.22963830828666687, 0.2380022406578064, 0.24636617302894592, 0.25473010540008545]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 7.0, 11.0, 18.0, 14.0, 20.0, 32.0, 34.0, 47.0, 91.0, 111.0, 160.0, 292.0, 542.0, 985.0, 1983.0, 4878.0, 16834.0, 113996.0, 3815720.0, 207713.0, 21622.0, 5494.0, 1902.0, 849.0, 426.0, 198.0, 120.0, 59.0, 39.0, 23.0, 13.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12497138977050781, -0.12164688110351562, -0.11832237243652344, -0.11499786376953125, -0.11167335510253906, -0.10834884643554688, -0.10502433776855469, -0.1016998291015625, -0.09837532043457031, -0.09505081176757812, -0.09172630310058594, -0.08840179443359375, -0.08507728576660156, -0.08175277709960938, -0.07842826843261719, -0.075103759765625, -0.07177925109863281, -0.06845474243164062, -0.06513023376464844, -0.06180572509765625, -0.05848121643066406, -0.055156707763671875, -0.05183219909667969, -0.0485076904296875, -0.04518318176269531, -0.041858673095703125, -0.03853416442871094, -0.03520965576171875, -0.03188514709472656, -0.028560638427734375, -0.025236129760742188, -0.02191162109375, -0.018587112426757812, -0.015262603759765625, -0.011938095092773438, -0.00861358642578125, -0.0052890777587890625, -0.001964569091796875, 0.0013599395751953125, 0.0046844482421875, 0.008008956909179688, 0.011333465576171875, 0.014657974243164062, 0.01798248291015625, 0.021306991577148438, 0.024631500244140625, 0.027956008911132812, 0.031280517578125, 0.03460502624511719, 0.037929534912109375, 0.04125404357910156, 0.04457855224609375, 0.04790306091308594, 0.051227569580078125, 0.05455207824707031, 0.0578765869140625, 0.06120109558105469, 0.06452560424804688, 0.06785011291503906, 0.07117462158203125, 0.07449913024902344, 0.07782363891601562, 0.08114814758300781, 0.08447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 6.0, 9.0, 8.0, 17.0, 16.0, 27.0, 39.0, 45.0, 47.0, 62.0, 60.0, 74.0, 88.0, 79.0, 75.0, 70.0, 54.0, 49.0, 36.0, 38.0, 30.0, 25.0, 19.0, 11.0, 4.0, 9.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184783935546875, -0.017963767051696777, -0.017449140548706055, -0.016934514045715332, -0.01641988754272461, -0.015905261039733887, -0.015390634536743164, -0.014876008033752441, -0.014361381530761719, -0.013846755027770996, -0.013332128524780273, -0.01281750202178955, -0.012302875518798828, -0.011788249015808105, -0.011273622512817383, -0.01075899600982666, -0.010244369506835938, -0.009729743003845215, -0.009215116500854492, -0.00870048999786377, -0.008185863494873047, -0.007671236991882324, -0.0071566104888916016, -0.006641983985900879, -0.006127357482910156, -0.005612730979919434, -0.005098104476928711, -0.004583477973937988, -0.004068851470947266, -0.003554224967956543, -0.0030395984649658203, -0.0025249719619750977, -0.002010345458984375, -0.0014957189559936523, -0.0009810924530029297, -0.00046646595001220703, 4.8160552978515625e-05, 0.0005627870559692383, 0.001077413558959961, 0.0015920400619506836, 0.0021066665649414062, 0.002621293067932129, 0.0031359195709228516, 0.0036505460739135742, 0.004165172576904297, 0.0046797990798950195, 0.005194425582885742, 0.005709052085876465, 0.0062236785888671875, 0.00673830509185791, 0.007252931594848633, 0.0077675580978393555, 0.008282184600830078, 0.0087968111038208, 0.009311437606811523, 0.009826064109802246, 0.010340690612792969, 0.010855317115783691, 0.011369943618774414, 0.011884570121765137, 0.01239919662475586, 0.012913823127746582, 0.013428449630737305, 0.013943076133728027, 0.01445770263671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 11.0, 16.0, 13.0, 26.0, 45.0, 52.0, 90.0, 211.0, 448.0, 1044.0, 4115.0, 37933.0, 4111928.0, 32617.0, 4026.0, 982.0, 356.0, 143.0, 89.0, 42.0, 32.0, 19.0, 11.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21630859375, -0.21053695678710938, -0.20476531982421875, -0.19899368286132812, -0.1932220458984375, -0.18745040893554688, -0.18167877197265625, -0.17590713500976562, -0.170135498046875, -0.16436386108398438, -0.15859222412109375, -0.15282058715820312, -0.1470489501953125, -0.14127731323242188, -0.13550567626953125, -0.12973403930664062, -0.12396240234375, -0.11819076538085938, -0.11241912841796875, -0.10664749145507812, -0.1008758544921875, -0.09510421752929688, -0.08933258056640625, -0.08356094360351562, -0.077789306640625, -0.07201766967773438, -0.06624603271484375, -0.060474395751953125, -0.0547027587890625, -0.048931121826171875, -0.04315948486328125, -0.037387847900390625, -0.0316162109375, -0.025844573974609375, -0.02007293701171875, -0.014301300048828125, -0.0085296630859375, -0.002758026123046875, 0.00301361083984375, 0.008785247802734375, 0.014556884765625, 0.020328521728515625, 0.02610015869140625, 0.031871795654296875, 0.0376434326171875, 0.043415069580078125, 0.04918670654296875, 0.054958343505859375, 0.06072998046875, 0.06650161743164062, 0.07227325439453125, 0.07804489135742188, 0.0838165283203125, 0.08958816528320312, 0.09535980224609375, 0.10113143920898438, 0.106903076171875, 0.11267471313476562, 0.11844635009765625, 0.12421798706054688, 0.1299896240234375, 0.13576126098632812, 0.14153289794921875, 0.14730453491210938, 0.153076171875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 6.0, 2.0, 7.0, 7.0, 16.0, 29.0, 55.0, 132.0, 541.0, 2425.0, 583.0, 135.0, 59.0, 24.0, 12.0, 14.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.06911277770996094, -0.06736373901367188, -0.06561470031738281, -0.06386566162109375, -0.06211662292480469, -0.060367584228515625, -0.05861854553222656, -0.0568695068359375, -0.05512046813964844, -0.053371429443359375, -0.05162239074707031, -0.04987335205078125, -0.04812431335449219, -0.046375274658203125, -0.04462623596191406, -0.042877197265625, -0.04112815856933594, -0.039379119873046875, -0.03763008117675781, -0.03588104248046875, -0.03413200378417969, -0.032382965087890625, -0.030633926391601562, -0.0288848876953125, -0.027135848999023438, -0.025386810302734375, -0.023637771606445312, -0.02188873291015625, -0.020139694213867188, -0.018390655517578125, -0.016641616821289062, -0.014892578125, -0.013143539428710938, -0.011394500732421875, -0.009645462036132812, -0.00789642333984375, -0.0061473846435546875, -0.004398345947265625, -0.0026493072509765625, -0.0009002685546875, 0.0008487701416015625, 0.002597808837890625, 0.0043468475341796875, 0.00609588623046875, 0.007844924926757812, 0.009593963623046875, 0.011343002319335938, 0.013092041015625, 0.014841079711914062, 0.016590118408203125, 0.018339157104492188, 0.02008819580078125, 0.021837234497070312, 0.023586273193359375, 0.025335311889648438, 0.0270843505859375, 0.028833389282226562, 0.030582427978515625, 0.03233146667480469, 0.03408050537109375, 0.03582954406738281, 0.037578582763671875, 0.03932762145996094, 0.04107666015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 68.0, 819.0, 107.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0050221681594849, -0.9751108288764954, -0.9451994299888611, -0.9152880907058716, -0.8853766918182373, -0.8554653525352478, -0.8255540132522583, -0.795642614364624, -0.7657312154769897, -0.7358198761940002, -0.705908477306366, -0.6759971380233765, -0.6460857391357422, -0.6161743998527527, -0.5862630605697632, -0.5563516616821289, -0.5264403223991394, -0.4965289533138275, -0.4666175842285156, -0.4367062449455261, -0.40679484605789185, -0.37688350677490234, -0.34697213768959045, -0.31706076860427856, -0.2871493995189667, -0.2572380304336548, -0.2273266613483429, -0.1974153071641922, -0.1675039380788803, -0.13759256899356842, -0.10768121480941772, -0.07776984572410583, -0.047858476638793945, -0.017947111278772354, 0.011964254081249237, 0.04187561571598053, 0.07178698480129242, 0.10169835388660431, 0.131609708070755, 0.1615210771560669, 0.19143244624137878, 0.22134381532669067, 0.25125518441200256, 0.28116655349731445, 0.31107789278030396, 0.34098929166793823, 0.37090063095092773, 0.4008120000362396, 0.4307233691215515, 0.4606347382068634, 0.4905461072921753, 0.5204574465751648, 0.5503688454627991, 0.5802801847457886, 0.6101915836334229, 0.6401029229164124, 0.6700142621994019, 0.6999256014823914, 0.7298370003700256, 0.7597483396530151, 0.7896597385406494, 0.8195710778236389, 0.8494824171066284, 0.8793938159942627, 0.909305214881897]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 24.0, 27.0, 23.0, 37.0, 31.0, 59.0, 60.0, 66.0, 90.0, 77.0, 83.0, 73.0, 60.0, 66.0, 47.0, 33.0, 42.0, 16.0, 17.0, 13.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17158102989196777, -0.16578951478004456, -0.15999801456928253, -0.1542065143585205, -0.1484149992465973, -0.14262348413467407, -0.13683198392391205, -0.13104048371315002, -0.1252489686012268, -0.11945746093988419, -0.11366595327854156, -0.10787444561719894, -0.10208293795585632, -0.0962914302945137, -0.09049992263317108, -0.08470841497182846, -0.07891690731048584, -0.07312539964914322, -0.0673338919878006, -0.06154238432645798, -0.055750876665115356, -0.049959369003772736, -0.044167861342430115, -0.038376353681087494, -0.03258484601974487, -0.026793338358402252, -0.02100183069705963, -0.01521032303571701, -0.00941881537437439, -0.003627307713031769, 0.002164199948310852, 0.007955707609653473, 0.013747215270996094, 0.019538722932338715, 0.025330230593681335, 0.031121738255023956, 0.03691324591636658, 0.0427047535777092, 0.04849626123905182, 0.05428776890039444, 0.06007927656173706, 0.06587078422307968, 0.0716622918844223, 0.07745379954576492, 0.08324530720710754, 0.08903681486845016, 0.09482832252979279, 0.1006198301911354, 0.10641133785247803, 0.11220284551382065, 0.11799435317516327, 0.12378586083650589, 0.1295773684978485, 0.13536888360977173, 0.14116038382053375, 0.14695188403129578, 0.152743399143219, 0.1585349142551422, 0.16432641446590424, 0.17011791467666626, 0.17590942978858948, 0.1817009449005127, 0.18749244511127472, 0.19328394532203674, 0.19907546043395996]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 10.0, 6.0, 11.0, 23.0, 23.0, 34.0, 51.0, 65.0, 135.0, 225.0, 319.0, 659.0, 1363.0, 3774.0, 14374.0, 92521.0, 587744.0, 298142.0, 37174.0, 7410.0, 2306.0, 994.0, 465.0, 273.0, 151.0, 87.0, 62.0, 47.0, 38.0, 14.0, 19.0, 13.0, 9.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05756950378417969, -0.055812835693359375, -0.05405616760253906, -0.05229949951171875, -0.05054283142089844, -0.048786163330078125, -0.04702949523925781, -0.0452728271484375, -0.04351615905761719, -0.041759490966796875, -0.04000282287597656, -0.03824615478515625, -0.03648948669433594, -0.034732818603515625, -0.03297615051269531, -0.031219482421875, -0.029462814331054688, -0.027706146240234375, -0.025949478149414062, -0.02419281005859375, -0.022436141967773438, -0.020679473876953125, -0.018922805786132812, -0.0171661376953125, -0.015409469604492188, -0.013652801513671875, -0.011896133422851562, -0.01013946533203125, -0.008382797241210938, -0.006626129150390625, -0.0048694610595703125, -0.00311279296875, -0.0013561248779296875, 0.000400543212890625, 0.0021572113037109375, 0.00391387939453125, 0.0056705474853515625, 0.007427215576171875, 0.009183883666992188, 0.0109405517578125, 0.012697219848632812, 0.014453887939453125, 0.016210556030273438, 0.01796722412109375, 0.019723892211914062, 0.021480560302734375, 0.023237228393554688, 0.024993896484375, 0.026750564575195312, 0.028507232666015625, 0.030263900756835938, 0.03202056884765625, 0.03377723693847656, 0.035533905029296875, 0.03729057312011719, 0.0390472412109375, 0.04080390930175781, 0.042560577392578125, 0.04431724548339844, 0.04607391357421875, 0.04783058166503906, 0.049587249755859375, 0.05134391784667969, 0.0531005859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 9.0, 18.0, 24.0, 35.0, 59.0, 75.0, 82.0, 111.0, 137.0, 95.0, 112.0, 64.0, 60.0, 45.0, 33.0, 17.0, 15.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027801513671875, -0.027116060256958008, -0.026430606842041016, -0.025745153427124023, -0.02505970001220703, -0.02437424659729004, -0.023688793182373047, -0.023003339767456055, -0.022317886352539062, -0.02163243293762207, -0.020946979522705078, -0.020261526107788086, -0.019576072692871094, -0.0188906192779541, -0.01820516586303711, -0.017519712448120117, -0.016834259033203125, -0.016148805618286133, -0.01546335220336914, -0.014777898788452148, -0.014092445373535156, -0.013406991958618164, -0.012721538543701172, -0.01203608512878418, -0.011350631713867188, -0.010665178298950195, -0.009979724884033203, -0.009294271469116211, -0.008608818054199219, -0.007923364639282227, -0.007237911224365234, -0.006552457809448242, -0.00586700439453125, -0.005181550979614258, -0.004496097564697266, -0.0038106441497802734, -0.0031251907348632812, -0.002439737319946289, -0.0017542839050292969, -0.0010688304901123047, -0.0003833770751953125, 0.0003020763397216797, 0.0009875297546386719, 0.001672983169555664, 0.0023584365844726562, 0.0030438899993896484, 0.0037293434143066406, 0.004414796829223633, 0.005100250244140625, 0.005785703659057617, 0.006471157073974609, 0.0071566104888916016, 0.007842063903808594, 0.008527517318725586, 0.009212970733642578, 0.00989842414855957, 0.010583877563476562, 0.011269330978393555, 0.011954784393310547, 0.012640237808227539, 0.013325691223144531, 0.014011144638061523, 0.014696598052978516, 0.015382051467895508, 0.0160675048828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 14.0, 16.0, 22.0, 37.0, 48.0, 79.0, 103.0, 177.0, 301.0, 707.0, 2123.0, 8722.0, 51212.0, 347532.0, 521447.0, 96278.0, 14499.0, 3252.0, 1008.0, 387.0, 209.0, 121.0, 80.0, 47.0, 32.0, 25.0, 19.0, 13.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03668212890625, -0.035424232482910156, -0.03416633605957031, -0.03290843963623047, -0.031650543212890625, -0.03039264678955078, -0.029134750366210938, -0.027876853942871094, -0.02661895751953125, -0.025361061096191406, -0.024103164672851562, -0.02284526824951172, -0.021587371826171875, -0.02032947540283203, -0.019071578979492188, -0.017813682556152344, -0.0165557861328125, -0.015297889709472656, -0.014039993286132812, -0.012782096862792969, -0.011524200439453125, -0.010266304016113281, -0.009008407592773438, -0.007750511169433594, -0.00649261474609375, -0.005234718322753906, -0.0039768218994140625, -0.0027189254760742188, -0.001461029052734375, -0.00020313262939453125, 0.0010547637939453125, 0.0023126602172851562, 0.003570556640625, 0.004828453063964844, 0.0060863494873046875, 0.007344245910644531, 0.008602142333984375, 0.009860038757324219, 0.011117935180664062, 0.012375831604003906, 0.01363372802734375, 0.014891624450683594, 0.016149520874023438, 0.01740741729736328, 0.018665313720703125, 0.01992321014404297, 0.021181106567382812, 0.022439002990722656, 0.0236968994140625, 0.024954795837402344, 0.026212692260742188, 0.02747058868408203, 0.028728485107421875, 0.02998638153076172, 0.031244277954101562, 0.032502174377441406, 0.03376007080078125, 0.035017967224121094, 0.03627586364746094, 0.03753376007080078, 0.038791656494140625, 0.04004955291748047, 0.04130744934082031, 0.042565345764160156, 0.0438232421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 1.0, 6.0, 11.0, 5.0, 20.0, 12.0, 23.0, 20.0, 36.0, 32.0, 25.0, 41.0, 55.0, 42.0, 51.0, 55.0, 56.0, 44.0, 56.0, 50.0, 41.0, 50.0, 40.0, 36.0, 30.0, 43.0, 22.0, 17.0, 12.0, 13.0, 14.0, 11.0, 9.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.03478431701660156, -0.033496856689453125, -0.03220939636230469, -0.03092193603515625, -0.029634475708007812, -0.028347015380859375, -0.027059555053710938, -0.0257720947265625, -0.024484634399414062, -0.023197174072265625, -0.021909713745117188, -0.02062225341796875, -0.019334793090820312, -0.018047332763671875, -0.016759872436523438, -0.015472412109375, -0.014184951782226562, -0.012897491455078125, -0.011610031127929688, -0.01032257080078125, -0.009035110473632812, -0.007747650146484375, -0.0064601898193359375, -0.0051727294921875, -0.0038852691650390625, -0.002597808837890625, -0.0013103485107421875, -2.288818359375e-05, 0.0012645721435546875, 0.002552032470703125, 0.0038394927978515625, 0.005126953125, 0.0064144134521484375, 0.007701873779296875, 0.008989334106445312, 0.01027679443359375, 0.011564254760742188, 0.012851715087890625, 0.014139175415039062, 0.0154266357421875, 0.016714096069335938, 0.018001556396484375, 0.019289016723632812, 0.02057647705078125, 0.021863937377929688, 0.023151397705078125, 0.024438858032226562, 0.025726318359375, 0.027013778686523438, 0.028301239013671875, 0.029588699340820312, 0.03087615966796875, 0.03216361999511719, 0.033451080322265625, 0.03473854064941406, 0.0360260009765625, 0.03731346130371094, 0.038600921630859375, 0.03988838195800781, 0.04117584228515625, 0.04246330261230469, 0.043750762939453125, 0.04503822326660156, 0.04632568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 15.0, 20.0, 27.0, 43.0, 91.0, 184.0, 360.0, 795.0, 1952.0, 6678.0, 43836.0, 542001.0, 412887.0, 31085.0, 5434.0, 1747.0, 715.0, 321.0, 153.0, 76.0, 45.0, 28.0, 7.0, 10.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0195465087890625, -0.018934249877929688, -0.018321990966796875, -0.017709732055664062, -0.01709747314453125, -0.016485214233398438, -0.015872955322265625, -0.015260696411132812, -0.0146484375, -0.014036178588867188, -0.013423919677734375, -0.012811660766601562, -0.01219940185546875, -0.011587142944335938, -0.010974884033203125, -0.010362625122070312, -0.0097503662109375, -0.009138107299804688, -0.008525848388671875, -0.007913589477539062, -0.00730133056640625, -0.0066890716552734375, -0.006076812744140625, -0.0054645538330078125, -0.004852294921875, -0.0042400360107421875, -0.003627777099609375, -0.0030155181884765625, -0.00240325927734375, -0.0017910003662109375, -0.001178741455078125, -0.0005664825439453125, 4.57763671875e-05, 0.0006580352783203125, 0.001270294189453125, 0.0018825531005859375, 0.00249481201171875, 0.0031070709228515625, 0.003719329833984375, 0.0043315887451171875, 0.00494384765625, 0.0055561065673828125, 0.006168365478515625, 0.0067806243896484375, 0.00739288330078125, 0.008005142211914062, 0.008617401123046875, 0.009229660034179688, 0.0098419189453125, 0.010454177856445312, 0.011066436767578125, 0.011678695678710938, 0.01229095458984375, 0.012903213500976562, 0.013515472412109375, 0.014127731323242188, 0.014739990234375, 0.015352249145507812, 0.015964508056640625, 0.016576766967773438, 0.01718902587890625, 0.017801284790039062, 0.018413543701171875, 0.019025802612304688, 0.0196380615234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [6.0, 7.0, 5.0, 11.0, 19.0, 51.0, 88.0, 154.0, 214.0, 195.0, 128.0, 66.0, 44.0, 16.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.987550735473633e-05, -3.5363249480724335e-05, -3.085099160671234e-05, -2.6338733732700348e-05, -2.1826475858688354e-05, -1.731421798467636e-05, -1.2801960110664368e-05, -8.289702236652374e-06, -3.777444362640381e-06, 7.348135113716125e-07, 5.247071385383606e-06, 9.7593292593956e-06, 1.4271587133407593e-05, 1.8783845007419586e-05, 2.329610288143158e-05, 2.7808360755443573e-05, 3.2320618629455566e-05, 3.683287650346756e-05, 4.134513437747955e-05, 4.585739225149155e-05, 5.036965012550354e-05, 5.4881907999515533e-05, 5.939416587352753e-05, 6.390642374753952e-05, 6.841868162155151e-05, 7.293093949556351e-05, 7.74431973695755e-05, 8.19554552435875e-05, 8.646771311759949e-05, 9.097997099161148e-05, 9.549222886562347e-05, 0.00010000448673963547, 0.00010451674461364746, 0.00010902900248765945, 0.00011354126036167145, 0.00011805351823568344, 0.00012256577610969543, 0.00012707803398370743, 0.00013159029185771942, 0.00013610254973173141, 0.0001406148076057434, 0.0001451270654797554, 0.0001496393233537674, 0.0001541515812277794, 0.00015866383910179138, 0.00016317609697580338, 0.00016768835484981537, 0.00017220061272382736, 0.00017671287059783936, 0.00018122512847185135, 0.00018573738634586334, 0.00019024964421987534, 0.00019476190209388733, 0.00019927415996789932, 0.00020378641784191132, 0.0002082986757159233, 0.0002128109335899353, 0.0002173231914639473, 0.0002218354493379593, 0.00022634770721197128, 0.00023085996508598328, 0.00023537222295999527, 0.00023988448083400726, 0.00024439673870801926, 0.00024890899658203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 7.0, 16.0, 23.0, 47.0, 69.0, 110.0, 233.0, 449.0, 1332.0, 4940.0, 34316.0, 466919.0, 495566.0, 37033.0, 5051.0, 1398.0, 505.0, 238.0, 114.0, 68.0, 40.0, 21.0, 13.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0161895751953125, -0.015567302703857422, -0.014945030212402344, -0.014322757720947266, -0.013700485229492188, -0.01307821273803711, -0.012455940246582031, -0.011833667755126953, -0.011211395263671875, -0.010589122772216797, -0.009966850280761719, -0.00934457778930664, -0.008722305297851562, -0.008100032806396484, -0.007477760314941406, -0.006855487823486328, -0.00623321533203125, -0.005610942840576172, -0.004988670349121094, -0.004366397857666016, -0.0037441253662109375, -0.0031218528747558594, -0.0024995803833007812, -0.0018773078918457031, -0.001255035400390625, -0.0006327629089355469, -1.049041748046875e-05, 0.0006117820739746094, 0.0012340545654296875, 0.0018563270568847656, 0.0024785995483398438, 0.003100872039794922, 0.00372314453125, 0.004345417022705078, 0.004967689514160156, 0.005589962005615234, 0.0062122344970703125, 0.006834506988525391, 0.007456779479980469, 0.008079051971435547, 0.008701324462890625, 0.009323596954345703, 0.009945869445800781, 0.01056814193725586, 0.011190414428710938, 0.011812686920166016, 0.012434959411621094, 0.013057231903076172, 0.01367950439453125, 0.014301776885986328, 0.014924049377441406, 0.015546321868896484, 0.016168594360351562, 0.01679086685180664, 0.01741313934326172, 0.018035411834716797, 0.018657684326171875, 0.019279956817626953, 0.01990222930908203, 0.02052450180053711, 0.021146774291992188, 0.021769046783447266, 0.022391319274902344, 0.023013591766357422, 0.0236358642578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 3.0, 5.0, 3.0, 15.0, 17.0, 16.0, 35.0, 24.0, 39.0, 62.0, 51.0, 82.0, 70.0, 74.0, 76.0, 74.0, 67.0, 63.0, 39.0, 39.0, 34.0, 24.0, 18.0, 12.0, 7.0, 10.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00983428955078125, -0.009452581405639648, -0.009070873260498047, -0.008689165115356445, -0.008307456970214844, -0.007925748825073242, -0.007544040679931641, -0.007162332534790039, -0.0067806243896484375, -0.006398916244506836, -0.006017208099365234, -0.005635499954223633, -0.005253791809082031, -0.00487208366394043, -0.004490375518798828, -0.0041086673736572266, -0.003726959228515625, -0.0033452510833740234, -0.002963542938232422, -0.0025818347930908203, -0.0022001266479492188, -0.0018184185028076172, -0.0014367103576660156, -0.001055002212524414, -0.0006732940673828125, -0.00029158592224121094, 9.012222290039062e-05, 0.0004718303680419922, 0.0008535385131835938, 0.0012352466583251953, 0.0016169548034667969, 0.0019986629486083984, 0.00238037109375, 0.0027620792388916016, 0.003143787384033203, 0.0035254955291748047, 0.003907203674316406, 0.004288911819458008, 0.004670619964599609, 0.005052328109741211, 0.0054340362548828125, 0.005815744400024414, 0.006197452545166016, 0.006579160690307617, 0.006960868835449219, 0.00734257698059082, 0.007724285125732422, 0.008105993270874023, 0.008487701416015625, 0.008869409561157227, 0.009251117706298828, 0.00963282585144043, 0.010014533996582031, 0.010396242141723633, 0.010777950286865234, 0.011159658432006836, 0.011541366577148438, 0.011923074722290039, 0.01230478286743164, 0.012686491012573242, 0.013068199157714844, 0.013449907302856445, 0.013831615447998047, 0.014213323593139648, 0.01459503173828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 18.0, 54.0, 136.0, 233.0, 261.0, 172.0, 69.0, 30.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18249693512916565, -0.1712089478969574, -0.15992097556591034, -0.1486329883337021, -0.13734501600265503, -0.12605702877044678, -0.11476904153823853, -0.10348106175661087, -0.09219308197498322, -0.08090510219335556, -0.0696171224117279, -0.05832913517951965, -0.047041155397892, -0.03575317561626434, -0.02446518838405609, -0.013177208602428436, -0.0018892288208007812, 0.009398752823472023, 0.020686734467744827, 0.03197471797466278, 0.043262697756290436, 0.05455067753791809, 0.06583866477012634, 0.077126644551754, 0.08841462433338165, 0.09970260411500931, 0.11099058389663696, 0.12227857112884521, 0.13356655836105347, 0.14485453069210052, 0.15614251792430878, 0.16743049025535583, 0.1787184476852417, 0.19000643491744995, 0.201294407248497, 0.21258239448070526, 0.22387036681175232, 0.23515835404396057, 0.24644634127616882, 0.2577343285083771, 0.26902228593826294, 0.2803102731704712, 0.29159826040267944, 0.3028862476348877, 0.31417420506477356, 0.3254621922969818, 0.33675017952919006, 0.3480381667613983, 0.35932615399360657, 0.3706141412258148, 0.38190212845802307, 0.39319008588790894, 0.4044780731201172, 0.41576606035232544, 0.4270540475845337, 0.43834203481674194, 0.4496300220489502, 0.46091800928115845, 0.4722059965133667, 0.48349398374557495, 0.4947819411754608, 0.5060698986053467, 0.5173579454421997, 0.5286458730697632, 0.5399338603019714]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 8.0, 16.0, 14.0, 21.0, 20.0, 21.0, 31.0, 29.0, 36.0, 41.0, 52.0, 39.0, 38.0, 41.0, 46.0, 39.0, 47.0, 39.0, 39.0, 37.0, 28.0, 31.0, 29.0, 36.0, 24.0, 27.0, 24.0, 21.0, 18.0, 18.0, 17.0, 3.0, 8.0, 8.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.2228478193283081, -0.21688516438007355, -0.210922509431839, -0.20495986938476562, -0.19899721443653107, -0.1930345594882965, -0.18707191944122314, -0.1811092644929886, -0.17514660954475403, -0.16918395459651947, -0.1632212996482849, -0.15725865960121155, -0.151296004652977, -0.14533334970474243, -0.13937070965766907, -0.1334080547094345, -0.12744539976119995, -0.1214827448129654, -0.11552009731531143, -0.10955744981765747, -0.10359479486942291, -0.09763213992118835, -0.0916694924235344, -0.08570684492588043, -0.07974418997764587, -0.07378153502941132, -0.06781888753175735, -0.061856236308813095, -0.055893585085868835, -0.049930933862924576, -0.043968282639980316, -0.038005631417036057, -0.0320429801940918, -0.026080328971147537, -0.020117677748203278, -0.014155026525259018, -0.008192375302314758, -0.0022297240793704987, 0.003732927143573761, 0.00969557836651802, 0.01565822958946228, 0.02162088081240654, 0.0275835320353508, 0.03354618325829506, 0.03950883448123932, 0.04547148570418358, 0.05143413692712784, 0.0573967881500721, 0.06335943937301636, 0.06932209432125092, 0.07528474181890488, 0.08124738931655884, 0.0872100442647934, 0.09317269921302795, 0.09913534671068192, 0.10509799420833588, 0.11106064915657043, 0.11702330410480499, 0.12298595160245895, 0.12894859910011292, 0.13491125404834747, 0.14087390899658203, 0.1468365490436554, 0.15279920399188995, 0.1587618589401245]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 8.0, 5.0, 11.0, 12.0, 10.0, 19.0, 22.0, 30.0, 54.0, 74.0, 134.0, 177.0, 345.0, 575.0, 1264.0, 3487.0, 12039.0, 79652.0, 3858660.0, 211215.0, 19168.0, 4540.0, 1574.0, 623.0, 277.0, 140.0, 70.0, 38.0, 17.0, 11.0, 6.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.074951171875, -0.07284879684448242, -0.07074642181396484, -0.06864404678344727, -0.06654167175292969, -0.06443929672241211, -0.06233692169189453, -0.06023454666137695, -0.058132171630859375, -0.0560297966003418, -0.05392742156982422, -0.05182504653930664, -0.04972267150878906, -0.047620296478271484, -0.045517921447753906, -0.04341554641723633, -0.04131317138671875, -0.03921079635620117, -0.037108421325683594, -0.035006046295166016, -0.03290367126464844, -0.03080129623413086, -0.02869892120361328, -0.026596546173095703, -0.024494171142578125, -0.022391796112060547, -0.02028942108154297, -0.01818704605102539, -0.016084671020507812, -0.013982295989990234, -0.011879920959472656, -0.009777545928955078, -0.0076751708984375, -0.005572795867919922, -0.0034704208374023438, -0.0013680458068847656, 0.0007343292236328125, 0.0028367042541503906, 0.004939079284667969, 0.007041454315185547, 0.009143829345703125, 0.011246204376220703, 0.013348579406738281, 0.01545095443725586, 0.017553329467773438, 0.019655704498291016, 0.021758079528808594, 0.023860454559326172, 0.02596282958984375, 0.028065204620361328, 0.030167579650878906, 0.032269954681396484, 0.03437232971191406, 0.03647470474243164, 0.03857707977294922, 0.0406794548034668, 0.042781829833984375, 0.04488420486450195, 0.04698657989501953, 0.04908895492553711, 0.05119132995605469, 0.053293704986572266, 0.055396080017089844, 0.05749845504760742, 0.059600830078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 11.0, 19.0, 17.0, 18.0, 34.0, 62.0, 78.0, 92.0, 83.0, 95.0, 99.0, 105.0, 89.0, 64.0, 56.0, 26.0, 18.0, 15.0, 12.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0268096923828125, -0.026166677474975586, -0.025523662567138672, -0.024880647659301758, -0.024237632751464844, -0.02359461784362793, -0.022951602935791016, -0.0223085880279541, -0.021665573120117188, -0.021022558212280273, -0.02037954330444336, -0.019736528396606445, -0.01909351348876953, -0.018450498580932617, -0.017807483673095703, -0.01716446876525879, -0.016521453857421875, -0.01587843894958496, -0.015235424041748047, -0.014592409133911133, -0.013949394226074219, -0.013306379318237305, -0.01266336441040039, -0.012020349502563477, -0.011377334594726562, -0.010734319686889648, -0.010091304779052734, -0.00944828987121582, -0.008805274963378906, -0.008162260055541992, -0.007519245147705078, -0.006876230239868164, -0.00623321533203125, -0.005590200424194336, -0.004947185516357422, -0.004304170608520508, -0.0036611557006835938, -0.0030181407928466797, -0.0023751258850097656, -0.0017321109771728516, -0.0010890960693359375, -0.00044608116149902344, 0.00019693374633789062, 0.0008399486541748047, 0.0014829635620117188, 0.002125978469848633, 0.002768993377685547, 0.003412008285522461, 0.004055023193359375, 0.004698038101196289, 0.005341053009033203, 0.005984067916870117, 0.006627082824707031, 0.007270097732543945, 0.00791311264038086, 0.008556127548217773, 0.009199142456054688, 0.009842157363891602, 0.010485172271728516, 0.01112818717956543, 0.011771202087402344, 0.012414216995239258, 0.013057231903076172, 0.013700246810913086, 0.01434326171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 13.0, 15.0, 31.0, 50.0, 134.0, 271.0, 820.0, 5748.0, 357925.0, 3814488.0, 12574.0, 1440.0, 372.0, 193.0, 95.0, 53.0, 24.0, 17.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0872802734375, -0.08447742462158203, -0.08167457580566406, -0.0788717269897461, -0.07606887817382812, -0.07326602935791016, -0.07046318054199219, -0.06766033172607422, -0.06485748291015625, -0.06205463409423828, -0.05925178527832031, -0.056448936462402344, -0.053646087646484375, -0.050843238830566406, -0.04804039001464844, -0.04523754119873047, -0.0424346923828125, -0.03963184356689453, -0.03682899475097656, -0.034026145935058594, -0.031223297119140625, -0.028420448303222656, -0.025617599487304688, -0.02281475067138672, -0.02001190185546875, -0.01720905303955078, -0.014406204223632812, -0.011603355407714844, -0.008800506591796875, -0.005997657775878906, -0.0031948089599609375, -0.00039196014404296875, 0.002410888671875, 0.005213737487792969, 0.008016586303710938, 0.010819435119628906, 0.013622283935546875, 0.016425132751464844, 0.019227981567382812, 0.02203083038330078, 0.02483367919921875, 0.02763652801513672, 0.030439376831054688, 0.033242225646972656, 0.036045074462890625, 0.038847923278808594, 0.04165077209472656, 0.04445362091064453, 0.0472564697265625, 0.05005931854248047, 0.05286216735839844, 0.055665016174316406, 0.058467864990234375, 0.061270713806152344, 0.06407356262207031, 0.06687641143798828, 0.06967926025390625, 0.07248210906982422, 0.07528495788574219, 0.07808780670166016, 0.08089065551757812, 0.0836935043334961, 0.08649635314941406, 0.08929920196533203, 0.09210205078125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 15.0, 16.0, 39.0, 110.0, 366.0, 2135.0, 1006.0, 219.0, 69.0, 33.0, 22.0, 9.0, 9.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0215606689453125, -0.020723581314086914, -0.019886493682861328, -0.019049406051635742, -0.018212318420410156, -0.01737523078918457, -0.016538143157958984, -0.0157010555267334, -0.014863967895507812, -0.014026880264282227, -0.01318979263305664, -0.012352705001831055, -0.011515617370605469, -0.010678529739379883, -0.009841442108154297, -0.009004354476928711, -0.008167266845703125, -0.007330179214477539, -0.006493091583251953, -0.005656003952026367, -0.004818916320800781, -0.003981828689575195, -0.0031447410583496094, -0.0023076534271240234, -0.0014705657958984375, -0.0006334781646728516, 0.00020360946655273438, 0.0010406970977783203, 0.0018777847290039062, 0.002714872360229492, 0.003551959991455078, 0.004389047622680664, 0.00522613525390625, 0.006063222885131836, 0.006900310516357422, 0.007737398147583008, 0.008574485778808594, 0.00941157341003418, 0.010248661041259766, 0.011085748672485352, 0.011922836303710938, 0.012759923934936523, 0.01359701156616211, 0.014434099197387695, 0.015271186828613281, 0.016108274459838867, 0.016945362091064453, 0.01778244972229004, 0.018619537353515625, 0.01945662498474121, 0.020293712615966797, 0.021130800247192383, 0.02196788787841797, 0.022804975509643555, 0.02364206314086914, 0.024479150772094727, 0.025316238403320312, 0.0261533260345459, 0.026990413665771484, 0.02782750129699707, 0.028664588928222656, 0.029501676559448242, 0.030338764190673828, 0.031175851821899414, 0.032012939453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 30.0, 667.0, 300.0, 10.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46417441964149475, -0.4495387673377991, -0.4349031150341034, -0.4202674627304077, -0.4056318402290344, -0.39099618792533875, -0.37636053562164307, -0.3617248833179474, -0.3470892310142517, -0.33245357871055603, -0.31781792640686035, -0.30318230390548706, -0.2885466516017914, -0.2739109992980957, -0.2592753469944, -0.24463969469070435, -0.23000407218933105, -0.21536841988563538, -0.2007327824831009, -0.1860971301794052, -0.17146149277687073, -0.15682584047317505, -0.14219018816947937, -0.1275545358657837, -0.1129188984632492, -0.09828325361013412, -0.08364760875701904, -0.06901195645332336, -0.05437631160020828, -0.0397406667470932, -0.025105014443397522, -0.01046936959028244, 0.004166305065155029, 0.01880195178091526, 0.03343759849667549, 0.04807324707508087, 0.06270889192819595, 0.07734453678131104, 0.09198018908500671, 0.1066158339381218, 0.12125147879123688, 0.13588713109493256, 0.15052276849746704, 0.16515842080116272, 0.1797940731048584, 0.19442971050739288, 0.20906536281108856, 0.22370100021362305, 0.23833665251731873, 0.2529723048210144, 0.2676079571247101, 0.28224360942840576, 0.29687923192977905, 0.31151488423347473, 0.3261505365371704, 0.3407861888408661, 0.35542184114456177, 0.37005749344825745, 0.3846931457519531, 0.3993287682533264, 0.4139644205570221, 0.4286000728607178, 0.44323572516441345, 0.45787137746810913, 0.4725069999694824]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 11.0, 14.0, 15.0, 31.0, 46.0, 51.0, 70.0, 81.0, 104.0, 93.0, 87.0, 95.0, 72.0, 70.0, 55.0, 44.0, 27.0, 12.0, 7.0, 9.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08634567260742188, -0.08315745741128922, -0.07996924221515656, -0.0767810270190239, -0.07359281182289124, -0.07040458917617798, -0.06721637398004532, -0.06402815878391266, -0.06083994358778, -0.05765172839164734, -0.05446351319551468, -0.05127529427409172, -0.04808707907795906, -0.0448988638818264, -0.04171064496040344, -0.03852242976427078, -0.03533421456813812, -0.03214599937200546, -0.028957782313227654, -0.025769565254449844, -0.022581350058317184, -0.019393134862184525, -0.016204917803406715, -0.013016700744628906, -0.009828485548496246, -0.006640269421041012, -0.0034520532935857773, -0.00026383716613054276, 0.0029243789613246918, 0.006112594157457352, 0.00930081121623516, 0.01248902827501297, 0.01567724347114563, 0.01886545866727829, 0.0220536757260561, 0.025241892784833908, 0.028430107980966568, 0.03161832317709923, 0.034806542098522186, 0.037994757294654846, 0.041182972490787506, 0.044371187686920166, 0.047559402883052826, 0.050747621804475784, 0.053935837000608444, 0.057124052196741104, 0.06031227111816406, 0.06350048631429672, 0.06668870151042938, 0.06987691670656204, 0.0730651319026947, 0.07625334709882736, 0.07944156229496002, 0.08262978494167328, 0.08581800013780594, 0.0890062153339386, 0.09219443053007126, 0.09538264572620392, 0.09857086092233658, 0.10175907611846924, 0.1049472987651825, 0.10813550651073456, 0.11132372915744781, 0.11451194435358047, 0.11770015954971313]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 15.0, 16.0, 31.0, 35.0, 67.0, 105.0, 153.0, 310.0, 533.0, 1157.0, 2861.0, 9740.0, 51933.0, 376177.0, 506541.0, 79104.0, 13284.0, 3642.0, 1408.0, 605.0, 344.0, 174.0, 110.0, 65.0, 49.0, 30.0, 16.0, 14.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0357666015625, -0.03439664840698242, -0.033026695251464844, -0.031656742095947266, -0.030286788940429688, -0.02891683578491211, -0.02754688262939453, -0.026176929473876953, -0.024806976318359375, -0.023437023162841797, -0.02206707000732422, -0.02069711685180664, -0.019327163696289062, -0.017957210540771484, -0.016587257385253906, -0.015217304229736328, -0.01384735107421875, -0.012477397918701172, -0.011107444763183594, -0.009737491607666016, -0.008367538452148438, -0.006997585296630859, -0.005627632141113281, -0.004257678985595703, -0.002887725830078125, -0.0015177726745605469, -0.00014781951904296875, 0.0012221336364746094, 0.0025920867919921875, 0.003962039947509766, 0.005331993103027344, 0.006701946258544922, 0.0080718994140625, 0.009441852569580078, 0.010811805725097656, 0.012181758880615234, 0.013551712036132812, 0.01492166519165039, 0.01629161834716797, 0.017661571502685547, 0.019031524658203125, 0.020401477813720703, 0.02177143096923828, 0.02314138412475586, 0.024511337280273438, 0.025881290435791016, 0.027251243591308594, 0.028621196746826172, 0.02999114990234375, 0.03136110305786133, 0.032731056213378906, 0.034101009368896484, 0.03547096252441406, 0.03684091567993164, 0.03821086883544922, 0.0395808219909668, 0.040950775146484375, 0.04232072830200195, 0.04369068145751953, 0.04506063461303711, 0.04643058776855469, 0.047800540924072266, 0.049170494079589844, 0.05054044723510742, 0.051910400390625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 8.0, 14.0, 17.0, 19.0, 22.0, 35.0, 57.0, 49.0, 91.0, 74.0, 92.0, 82.0, 89.0, 71.0, 75.0, 63.0, 44.0, 31.0, 20.0, 11.0, 12.0, 8.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208587646484375, -0.020325183868408203, -0.019791603088378906, -0.01925802230834961, -0.018724441528320312, -0.018190860748291016, -0.01765727996826172, -0.017123699188232422, -0.016590118408203125, -0.016056537628173828, -0.015522956848144531, -0.014989376068115234, -0.014455795288085938, -0.01392221450805664, -0.013388633728027344, -0.012855052947998047, -0.01232147216796875, -0.011787891387939453, -0.011254310607910156, -0.01072072982788086, -0.010187149047851562, -0.009653568267822266, -0.009119987487792969, -0.008586406707763672, -0.008052825927734375, -0.007519245147705078, -0.006985664367675781, -0.006452083587646484, -0.0059185028076171875, -0.005384922027587891, -0.004851341247558594, -0.004317760467529297, -0.0037841796875, -0.003250598907470703, -0.0027170181274414062, -0.0021834373474121094, -0.0016498565673828125, -0.0011162757873535156, -0.0005826950073242188, -4.9114227294921875e-05, 0.000484466552734375, 0.0010180473327636719, 0.0015516281127929688, 0.0020852088928222656, 0.0026187896728515625, 0.0031523704528808594, 0.0036859512329101562, 0.004219532012939453, 0.00475311279296875, 0.005286693572998047, 0.005820274353027344, 0.006353855133056641, 0.0068874359130859375, 0.007421016693115234, 0.007954597473144531, 0.008488178253173828, 0.009021759033203125, 0.009555339813232422, 0.010088920593261719, 0.010622501373291016, 0.011156082153320312, 0.01168966293334961, 0.012223243713378906, 0.012756824493408203, 0.0132904052734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 32.0, 31.0, 37.0, 51.0, 63.0, 80.0, 140.0, 220.0, 366.0, 753.0, 1737.0, 4649.0, 15486.0, 64106.0, 281224.0, 471811.0, 157409.0, 35269.0, 9356.0, 3078.0, 1145.0, 527.0, 290.0, 186.0, 115.0, 87.0, 59.0, 54.0, 42.0, 20.0, 11.0, 25.0, 13.0, 8.0, 7.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0274505615234375, -0.02660059928894043, -0.02575063705444336, -0.02490067481994629, -0.02405071258544922, -0.02320075035095215, -0.022350788116455078, -0.021500825881958008, -0.020650863647460938, -0.019800901412963867, -0.018950939178466797, -0.018100976943969727, -0.017251014709472656, -0.016401052474975586, -0.015551090240478516, -0.014701128005981445, -0.013851165771484375, -0.013001203536987305, -0.012151241302490234, -0.011301279067993164, -0.010451316833496094, -0.009601354598999023, -0.008751392364501953, -0.007901430130004883, -0.0070514678955078125, -0.006201505661010742, -0.005351543426513672, -0.0045015811920166016, -0.0036516189575195312, -0.002801656723022461, -0.0019516944885253906, -0.0011017322540283203, -0.00025177001953125, 0.0005981922149658203, 0.0014481544494628906, 0.002298116683959961, 0.0031480789184570312, 0.0039980411529541016, 0.004848003387451172, 0.005697965621948242, 0.0065479278564453125, 0.007397890090942383, 0.008247852325439453, 0.009097814559936523, 0.009947776794433594, 0.010797739028930664, 0.011647701263427734, 0.012497663497924805, 0.013347625732421875, 0.014197587966918945, 0.015047550201416016, 0.015897512435913086, 0.016747474670410156, 0.017597436904907227, 0.018447399139404297, 0.019297361373901367, 0.020147323608398438, 0.020997285842895508, 0.021847248077392578, 0.02269721031188965, 0.02354717254638672, 0.02439713478088379, 0.02524709701538086, 0.02609705924987793, 0.026947021484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 8.0, 9.0, 13.0, 12.0, 11.0, 23.0, 25.0, 9.0, 27.0, 24.0, 19.0, 31.0, 29.0, 24.0, 38.0, 36.0, 43.0, 45.0, 43.0, 41.0, 47.0, 48.0, 28.0, 39.0, 36.0, 33.0, 25.0, 30.0, 24.0, 28.0, 23.0, 20.0, 16.0, 12.0, 14.0, 12.0, 7.0, 9.0, 5.0, 4.0, 4.0, 7.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.027587890625, -0.026635169982910156, -0.025682449340820312, -0.02472972869873047, -0.023777008056640625, -0.02282428741455078, -0.021871566772460938, -0.020918846130371094, -0.01996612548828125, -0.019013404846191406, -0.018060684204101562, -0.01710796356201172, -0.016155242919921875, -0.015202522277832031, -0.014249801635742188, -0.013297080993652344, -0.0123443603515625, -0.011391639709472656, -0.010438919067382812, -0.009486198425292969, -0.008533477783203125, -0.007580757141113281, -0.0066280364990234375, -0.005675315856933594, -0.00472259521484375, -0.0037698745727539062, -0.0028171539306640625, -0.0018644332885742188, -0.000911712646484375, 4.100799560546875e-05, 0.0009937286376953125, 0.0019464492797851562, 0.002899169921875, 0.0038518905639648438, 0.0048046112060546875, 0.005757331848144531, 0.006710052490234375, 0.007662773132324219, 0.008615493774414062, 0.009568214416503906, 0.01052093505859375, 0.011473655700683594, 0.012426376342773438, 0.013379096984863281, 0.014331817626953125, 0.015284538269042969, 0.016237258911132812, 0.017189979553222656, 0.0181427001953125, 0.019095420837402344, 0.020048141479492188, 0.02100086212158203, 0.021953582763671875, 0.02290630340576172, 0.023859024047851562, 0.024811744689941406, 0.02576446533203125, 0.026717185974121094, 0.027669906616210938, 0.02862262725830078, 0.029575347900390625, 0.03052806854248047, 0.03148078918457031, 0.032433509826660156, 0.03338623046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 9.0, 10.0, 17.0, 15.0, 34.0, 58.0, 79.0, 145.0, 226.0, 369.0, 793.0, 1712.0, 4839.0, 19252.0, 131142.0, 572529.0, 268290.0, 36875.0, 7437.0, 2441.0, 1036.0, 476.0, 303.0, 164.0, 101.0, 58.0, 38.0, 26.0, 14.0, 10.0, 11.0, 7.0, 7.0, 4.0, 7.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01129150390625, -0.010911107063293457, -0.010530710220336914, -0.010150313377380371, -0.009769916534423828, -0.009389519691467285, -0.009009122848510742, -0.0086287260055542, -0.008248329162597656, -0.007867932319641113, -0.00748753547668457, -0.007107138633728027, -0.006726741790771484, -0.006346344947814941, -0.0059659481048583984, -0.0055855512619018555, -0.0052051544189453125, -0.0048247575759887695, -0.0044443607330322266, -0.004063963890075684, -0.0036835670471191406, -0.0033031702041625977, -0.0029227733612060547, -0.0025423765182495117, -0.0021619796752929688, -0.0017815828323364258, -0.0014011859893798828, -0.0010207891464233398, -0.0006403923034667969, -0.0002599954605102539, 0.00012040138244628906, 0.000500798225402832, 0.000881195068359375, 0.001261591911315918, 0.001641988754272461, 0.002022385597229004, 0.002402782440185547, 0.00278317928314209, 0.003163576126098633, 0.0035439729690551758, 0.003924369812011719, 0.004304766654968262, 0.004685163497924805, 0.005065560340881348, 0.005445957183837891, 0.005826354026794434, 0.0062067508697509766, 0.0065871477127075195, 0.0069675445556640625, 0.0073479413986206055, 0.0077283382415771484, 0.008108735084533691, 0.008489131927490234, 0.008869528770446777, 0.00924992561340332, 0.009630322456359863, 0.010010719299316406, 0.01039111614227295, 0.010771512985229492, 0.011151909828186035, 0.011532306671142578, 0.011912703514099121, 0.012293100357055664, 0.012673497200012207, 0.01305389404296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 14.0, 25.0, 28.0, 40.0, 61.0, 90.0, 159.0, 166.0, 126.0, 90.0, 63.0, 45.0, 34.0, 18.0, 19.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00015103816986083984, -0.00014770496636629105, -0.00014437176287174225, -0.00014103855937719345, -0.00013770535588264465, -0.00013437215238809586, -0.00013103894889354706, -0.00012770574539899826, -0.00012437254190444946, -0.00012103933840990067, -0.00011770613491535187, -0.00011437293142080307, -0.00011103972792625427, -0.00010770652443170547, -0.00010437332093715668, -0.00010104011744260788, -9.770691394805908e-05, -9.437371045351028e-05, -9.104050695896149e-05, -8.770730346441269e-05, -8.437409996986389e-05, -8.10408964753151e-05, -7.77076929807663e-05, -7.43744894862175e-05, -7.10412859916687e-05, -6.77080824971199e-05, -6.43748790025711e-05, -6.104167550802231e-05, -5.770847201347351e-05, -5.437526851892471e-05, -5.1042065024375916e-05, -4.770886152982712e-05, -4.437565803527832e-05, -4.104245454072952e-05, -3.7709251046180725e-05, -3.437604755163193e-05, -3.104284405708313e-05, -2.7709640562534332e-05, -2.4376437067985535e-05, -2.1043233573436737e-05, -1.771003007888794e-05, -1.4376826584339142e-05, -1.1043623089790344e-05, -7.710419595241547e-06, -4.377216100692749e-06, -1.0440126061439514e-06, 2.289190888404846e-06, 5.622394382953644e-06, 8.955597877502441e-06, 1.2288801372051239e-05, 1.5622004866600037e-05, 1.8955208361148834e-05, 2.2288411855697632e-05, 2.562161535024643e-05, 2.8954818844795227e-05, 3.2288022339344025e-05, 3.562122583389282e-05, 3.895442932844162e-05, 4.228763282299042e-05, 4.5620836317539215e-05, 4.895403981208801e-05, 5.228724330663681e-05, 5.562044680118561e-05, 5.8953650295734406e-05, 6.22868537902832e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 15.0, 6.0, 17.0, 19.0, 35.0, 59.0, 133.0, 241.0, 524.0, 1393.0, 5384.0, 52852.0, 640553.0, 322552.0, 19947.0, 3098.0, 938.0, 386.0, 188.0, 92.0, 55.0, 23.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0232086181640625, -0.022653579711914062, -0.022098541259765625, -0.021543502807617188, -0.02098846435546875, -0.020433425903320312, -0.019878387451171875, -0.019323348999023438, -0.018768310546875, -0.018213272094726562, -0.017658233642578125, -0.017103195190429688, -0.01654815673828125, -0.015993118286132812, -0.015438079833984375, -0.014883041381835938, -0.0143280029296875, -0.013772964477539062, -0.013217926025390625, -0.012662887573242188, -0.01210784912109375, -0.011552810668945312, -0.010997772216796875, -0.010442733764648438, -0.0098876953125, -0.009332656860351562, -0.008777618408203125, -0.008222579956054688, -0.00766754150390625, -0.0071125030517578125, -0.006557464599609375, -0.0060024261474609375, -0.0054473876953125, -0.0048923492431640625, -0.004337310791015625, -0.0037822723388671875, -0.00322723388671875, -0.0026721954345703125, -0.002117156982421875, -0.0015621185302734375, -0.001007080078125, -0.0004520416259765625, 0.000102996826171875, 0.0006580352783203125, 0.00121307373046875, 0.0017681121826171875, 0.002323150634765625, 0.0028781890869140625, 0.0034332275390625, 0.0039882659912109375, 0.004543304443359375, 0.0050983428955078125, 0.00565338134765625, 0.0062084197998046875, 0.006763458251953125, 0.0073184967041015625, 0.00787353515625, 0.008428573608398438, 0.008983612060546875, 0.009538650512695312, 0.01009368896484375, 0.010648727416992188, 0.011203765869140625, 0.011758804321289062, 0.0123138427734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 8.0, 8.0, 17.0, 20.0, 39.0, 46.0, 54.0, 77.0, 70.0, 86.0, 102.0, 72.0, 82.0, 72.0, 65.0, 55.0, 36.0, 20.0, 31.0, 16.0, 8.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0160369873046875, -0.015634894371032715, -0.01523280143737793, -0.014830708503723145, -0.01442861557006836, -0.014026522636413574, -0.013624429702758789, -0.013222336769104004, -0.012820243835449219, -0.012418150901794434, -0.012016057968139648, -0.011613965034484863, -0.011211872100830078, -0.010809779167175293, -0.010407686233520508, -0.010005593299865723, -0.009603500366210938, -0.009201407432556152, -0.008799314498901367, -0.008397221565246582, -0.007995128631591797, -0.007593035697937012, -0.0071909427642822266, -0.006788849830627441, -0.006386756896972656, -0.005984663963317871, -0.005582571029663086, -0.005180478096008301, -0.004778385162353516, -0.0043762922286987305, -0.003974199295043945, -0.00357210636138916, -0.003170013427734375, -0.00276792049407959, -0.0023658275604248047, -0.0019637346267700195, -0.0015616416931152344, -0.0011595487594604492, -0.0007574558258056641, -0.0003553628921508789, 4.673004150390625e-05, 0.0004488229751586914, 0.0008509159088134766, 0.0012530088424682617, 0.0016551017761230469, 0.002057194709777832, 0.002459287643432617, 0.0028613805770874023, 0.0032634735107421875, 0.0036655664443969727, 0.004067659378051758, 0.004469752311706543, 0.004871845245361328, 0.005273938179016113, 0.0056760311126708984, 0.006078124046325684, 0.006480216979980469, 0.006882309913635254, 0.007284402847290039, 0.007686495780944824, 0.00808858871459961, 0.008490681648254395, 0.00889277458190918, 0.009294867515563965, 0.00969696044921875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 36.0, 220.0, 437.0, 232.0, 59.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7505373358726501, -0.7315293550491333, -0.7125213742256165, -0.6935133934020996, -0.6745054125785828, -0.6554974317550659, -0.6364894509315491, -0.6174814701080322, -0.5984734892845154, -0.5794655084609985, -0.5604575276374817, -0.5414495468139648, -0.522441565990448, -0.5034335851669312, -0.4844256043434143, -0.46541762351989746, -0.4464096426963806, -0.42740166187286377, -0.4083936810493469, -0.3893857002258301, -0.37037771940231323, -0.3513697385787964, -0.33236175775527954, -0.3133537769317627, -0.29434579610824585, -0.275337815284729, -0.25632983446121216, -0.2373218536376953, -0.21831387281417847, -0.19930589199066162, -0.18029791116714478, -0.16128993034362793, -0.14228200912475586, -0.12327402830123901, -0.10426604747772217, -0.08525806665420532, -0.06625008583068848, -0.04724210500717163, -0.028234124183654785, -0.00922614336013794, 0.009781837463378906, 0.028789818286895752, 0.0477977991104126, 0.06680577993392944, 0.08581376075744629, 0.10482174158096313, 0.12382972240447998, 0.14283770322799683, 0.16184568405151367, 0.18085366487503052, 0.19986164569854736, 0.2188696265220642, 0.23787760734558105, 0.2568855881690979, 0.27589356899261475, 0.2949015498161316, 0.31390953063964844, 0.3329175114631653, 0.35192549228668213, 0.370933473110199, 0.3899414539337158, 0.40894943475723267, 0.4279574155807495, 0.44696539640426636, 0.4659733772277832]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 3.0, 8.0, 14.0, 16.0, 6.0, 23.0, 10.0, 23.0, 18.0, 33.0, 35.0, 45.0, 35.0, 24.0, 38.0, 32.0, 43.0, 46.0, 45.0, 41.0, 38.0, 53.0, 42.0, 38.0, 34.0, 30.0, 23.0, 20.0, 24.0, 30.0, 18.0, 18.0, 6.0, 13.0, 17.0, 8.0, 2.0, 12.0, 5.0, 2.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15470582246780396, -0.14950239658355713, -0.1442989706993103, -0.13909555971622467, -0.13389213383197784, -0.12868870794773102, -0.12348528206348419, -0.11828185617923737, -0.11307843774557114, -0.10787501186132431, -0.10267159342765808, -0.09746816754341125, -0.09226474165916443, -0.0870613232254982, -0.08185789734125137, -0.07665447890758514, -0.07145105302333832, -0.06624762713909149, -0.06104420870542526, -0.055840782821178436, -0.05063736066222191, -0.04543393850326538, -0.040230512619018555, -0.03502709046006203, -0.0298236683011055, -0.02462024614214897, -0.019416822120547295, -0.014213399030268192, -0.00900997593998909, -0.0038065537810325623, 0.0013968702405691147, 0.006600294262170792, 0.01180371642112732, 0.017007138580083847, 0.022210562601685524, 0.0274139866232872, 0.03261740878224373, 0.037820830941200256, 0.04302425682544708, 0.04822767898440361, 0.05343110114336014, 0.058634523302316666, 0.0638379454612732, 0.06904137134552002, 0.07424479722976685, 0.07944821566343307, 0.0846516415476799, 0.08985505998134613, 0.09505848586559296, 0.10026191174983978, 0.10546533018350601, 0.11066875606775284, 0.11587217450141907, 0.1210756003856659, 0.12627902626991272, 0.13148245215415955, 0.13668587803840637, 0.1418893039226532, 0.14709272980690002, 0.15229614078998566, 0.15749956667423248, 0.1627029925584793, 0.16790641844272614, 0.17310984432697296, 0.1783132553100586]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 10.0, 23.0, 49.0, 171.0, 615.0, 5855.0, 3993125.0, 191412.0, 2594.0, 332.0, 71.0, 19.0, 11.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06075000762939453, -0.05515480041503906, -0.049559593200683594, -0.043964385986328125, -0.038369178771972656, -0.03277397155761719, -0.02717876434326172, -0.02158355712890625, -0.01598834991455078, -0.010393142700195312, -0.004797935485839844, 0.000797271728515625, 0.006392478942871094, 0.011987686157226562, 0.01758289337158203, 0.0231781005859375, 0.02877330780029297, 0.03436851501464844, 0.039963722229003906, 0.045558929443359375, 0.051154136657714844, 0.05674934387207031, 0.06234455108642578, 0.06793975830078125, 0.07353496551513672, 0.07913017272949219, 0.08472537994384766, 0.09032058715820312, 0.0959157943725586, 0.10151100158691406, 0.10710620880126953, 0.112701416015625, 0.11829662322998047, 0.12389183044433594, 0.1294870376586914, 0.13508224487304688, 0.14067745208740234, 0.1462726593017578, 0.15186786651611328, 0.15746307373046875, 0.16305828094482422, 0.1686534881591797, 0.17424869537353516, 0.17984390258789062, 0.1854391098022461, 0.19103431701660156, 0.19662952423095703, 0.2022247314453125, 0.20781993865966797, 0.21341514587402344, 0.2190103530883789, 0.22460556030273438, 0.23020076751708984, 0.2357959747314453, 0.24139118194580078, 0.24698638916015625, 0.2525815963745117, 0.2581768035888672, 0.26377201080322266, 0.2693672180175781, 0.2749624252319336, 0.28055763244628906, 0.28615283966064453, 0.291748046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 8.0, 13.0, 27.0, 27.0, 40.0, 49.0, 57.0, 72.0, 77.0, 82.0, 96.0, 82.0, 64.0, 63.0, 56.0, 41.0, 46.0, 30.0, 17.0, 9.0, 14.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0197601318359375, -0.019243836402893066, -0.018727540969848633, -0.0182112455368042, -0.017694950103759766, -0.017178654670715332, -0.0166623592376709, -0.016146063804626465, -0.01562976837158203, -0.015113472938537598, -0.014597177505493164, -0.01408088207244873, -0.013564586639404297, -0.013048291206359863, -0.01253199577331543, -0.012015700340270996, -0.011499404907226562, -0.010983109474182129, -0.010466814041137695, -0.009950518608093262, -0.009434223175048828, -0.008917927742004395, -0.008401632308959961, -0.007885336875915527, -0.007369041442871094, -0.00685274600982666, -0.0063364505767822266, -0.005820155143737793, -0.005303859710693359, -0.004787564277648926, -0.004271268844604492, -0.0037549734115600586, -0.003238677978515625, -0.0027223825454711914, -0.002206087112426758, -0.0016897916793823242, -0.0011734962463378906, -0.000657200813293457, -0.00014090538024902344, 0.00037539005279541016, 0.0008916854858398438, 0.0014079809188842773, 0.001924276351928711, 0.0024405717849731445, 0.002956867218017578, 0.0034731626510620117, 0.003989458084106445, 0.004505753517150879, 0.0050220489501953125, 0.005538344383239746, 0.00605463981628418, 0.006570935249328613, 0.007087230682373047, 0.0076035261154174805, 0.008119821548461914, 0.008636116981506348, 0.009152412414550781, 0.009668707847595215, 0.010185003280639648, 0.010701298713684082, 0.011217594146728516, 0.01173388957977295, 0.012250185012817383, 0.012766480445861816, 0.01328277587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 15.0, 30.0, 41.0, 76.0, 153.0, 312.0, 729.0, 1929.0, 7623.0, 55141.0, 3460514.0, 633392.0, 26618.0, 4969.0, 1457.0, 591.0, 271.0, 163.0, 90.0, 53.0, 38.0, 9.0, 11.0, 6.0, 3.0, 12.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03857421875, -0.03718852996826172, -0.03580284118652344, -0.034417152404785156, -0.033031463623046875, -0.031645774841308594, -0.030260086059570312, -0.02887439727783203, -0.02748870849609375, -0.02610301971435547, -0.024717330932617188, -0.023331642150878906, -0.021945953369140625, -0.020560264587402344, -0.019174575805664062, -0.01778888702392578, -0.0164031982421875, -0.015017509460449219, -0.013631820678710938, -0.012246131896972656, -0.010860443115234375, -0.009474754333496094, -0.008089065551757812, -0.006703376770019531, -0.00531768798828125, -0.003931999206542969, -0.0025463104248046875, -0.0011606216430664062, 0.000225067138671875, 0.0016107559204101562, 0.0029964447021484375, 0.004382133483886719, 0.005767822265625, 0.007153511047363281, 0.008539199829101562, 0.009924888610839844, 0.011310577392578125, 0.012696266174316406, 0.014081954956054688, 0.015467643737792969, 0.01685333251953125, 0.01823902130126953, 0.019624710083007812, 0.021010398864746094, 0.022396087646484375, 0.023781776428222656, 0.025167465209960938, 0.02655315399169922, 0.0279388427734375, 0.02932453155517578, 0.030710220336914062, 0.032095909118652344, 0.033481597900390625, 0.034867286682128906, 0.03625297546386719, 0.03763866424560547, 0.03902435302734375, 0.04041004180908203, 0.04179573059082031, 0.043181419372558594, 0.044567108154296875, 0.045952796936035156, 0.04733848571777344, 0.04872417449951172, 0.05010986328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 4.0, 8.0, 14.0, 36.0, 49.0, 96.0, 130.0, 394.0, 1552.0, 1142.0, 311.0, 129.0, 66.0, 46.0, 26.0, 26.0, 6.0, 7.0, 7.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174102783203125, -0.016785383224487305, -0.01616048812866211, -0.015535593032836914, -0.014910697937011719, -0.014285802841186523, -0.013660907745361328, -0.013036012649536133, -0.012411117553710938, -0.011786222457885742, -0.011161327362060547, -0.010536432266235352, -0.009911537170410156, -0.009286642074584961, -0.008661746978759766, -0.00803685188293457, -0.007411956787109375, -0.00678706169128418, -0.006162166595458984, -0.005537271499633789, -0.004912376403808594, -0.0042874813079833984, -0.003662586212158203, -0.003037691116333008, -0.0024127960205078125, -0.0017879009246826172, -0.0011630058288574219, -0.0005381107330322266, 8.678436279296875e-05, 0.0007116794586181641, 0.0013365745544433594, 0.0019614696502685547, 0.00258636474609375, 0.0032112598419189453, 0.0038361549377441406, 0.004461050033569336, 0.005085945129394531, 0.0057108402252197266, 0.006335735321044922, 0.006960630416870117, 0.0075855255126953125, 0.008210420608520508, 0.008835315704345703, 0.009460210800170898, 0.010085105895996094, 0.010710000991821289, 0.011334896087646484, 0.01195979118347168, 0.012584686279296875, 0.01320958137512207, 0.013834476470947266, 0.014459371566772461, 0.015084266662597656, 0.01570916175842285, 0.016334056854248047, 0.016958951950073242, 0.017583847045898438, 0.018208742141723633, 0.018833637237548828, 0.019458532333374023, 0.02008342742919922, 0.020708322525024414, 0.02133321762084961, 0.021958112716674805, 0.0225830078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 39.0, 159.0, 327.0, 270.0, 132.0, 40.0, 17.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16127228736877441, -0.15617221593856812, -0.15107214450836182, -0.14597207307815552, -0.14087198674678802, -0.13577191531658173, -0.13067184388637543, -0.12557177245616913, -0.12047170102596283, -0.11537162959575653, -0.11027155071496964, -0.10517147928476334, -0.10007140785455704, -0.09497132897377014, -0.08987125754356384, -0.08477118611335754, -0.07967110723257065, -0.07457103580236435, -0.06947095692157745, -0.06437088549137115, -0.059270814061164856, -0.05417073890566826, -0.04907066375017166, -0.04397059231996536, -0.038870517164468765, -0.03377044200897217, -0.02867037057876587, -0.023570295423269272, -0.018470222130417824, -0.013370148837566376, -0.008270073682069778, -0.0031700022518634796, 0.0019300729036331177, 0.007030146662145853, 0.012130220420658588, 0.01723029464483261, 0.02233036793768406, 0.027430441230535507, 0.032530516386032104, 0.0376305878162384, 0.042730662971735, 0.0478307381272316, 0.0529308095574379, 0.058030884712934494, 0.06313095986843109, 0.06823103129863739, 0.07333110272884369, 0.07843117415904999, 0.08353125303983688, 0.08863132447004318, 0.09373140335083008, 0.09883147478103638, 0.10393154621124268, 0.10903161764144897, 0.11413169652223587, 0.11923176795244217, 0.12433184683322906, 0.12943191826343536, 0.13453198969364166, 0.13963207602500916, 0.14473214745521545, 0.14983221888542175, 0.15493229031562805, 0.16003236174583435, 0.16513243317604065]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 2.0, 7.0, 9.0, 10.0, 19.0, 24.0, 26.0, 37.0, 35.0, 56.0, 55.0, 57.0, 65.0, 73.0, 62.0, 60.0, 69.0, 52.0, 50.0, 50.0, 48.0, 37.0, 24.0, 19.0, 22.0, 9.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05652731657028198, -0.05409948527812958, -0.05167165398597717, -0.049243826419115067, -0.04681599512696266, -0.04438816383481026, -0.04196033626794815, -0.039532504975795746, -0.03710467368364334, -0.034676842391490936, -0.03224901109933853, -0.029821183532476425, -0.02739335224032402, -0.024965520948171616, -0.02253769151866436, -0.020109862089157104, -0.0176820307970047, -0.01525420043617487, -0.01282637007534504, -0.01039853971451521, -0.007970709353685379, -0.005542878992855549, -0.0031150486320257187, -0.0006872192025184631, 0.0017406120896339417, 0.004168442450463772, 0.006596272811293602, 0.009024103172123432, 0.011451933532953262, 0.013879763893783092, 0.016307594254612923, 0.018735423684120178, 0.021163254976272583, 0.023591086268424988, 0.026018915697932243, 0.0284467451274395, 0.030874576419591904, 0.03330240771174431, 0.035730235278606415, 0.03815806657075882, 0.040585897862911224, 0.04301372915506363, 0.045441560447216034, 0.04786938801407814, 0.050297219306230545, 0.05272505059838295, 0.055152878165245056, 0.05758070945739746, 0.060008540749549866, 0.06243637204170227, 0.06486420333385468, 0.06729203462600708, 0.06971986591815948, 0.07214768975973129, 0.0745755210518837, 0.0770033523440361, 0.07943118363618851, 0.08185901492834091, 0.08428684622049332, 0.08671467751264572, 0.08914250135421753, 0.09157033264636993, 0.09399816393852234, 0.09642599523067474, 0.09885382652282715]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 5.0, 11.0, 4.0, 19.0, 21.0, 33.0, 35.0, 79.0, 109.0, 255.0, 420.0, 931.0, 2295.0, 7202.0, 37997.0, 432017.0, 509301.0, 45185.0, 8123.0, 2485.0, 989.0, 446.0, 236.0, 135.0, 75.0, 51.0, 31.0, 17.0, 12.0, 7.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05389404296875, -0.05215787887573242, -0.050421714782714844, -0.048685550689697266, -0.04694938659667969, -0.04521322250366211, -0.04347705841064453, -0.04174089431762695, -0.040004730224609375, -0.0382685661315918, -0.03653240203857422, -0.03479623794555664, -0.03306007385253906, -0.031323909759521484, -0.029587745666503906, -0.027851581573486328, -0.02611541748046875, -0.024379253387451172, -0.022643089294433594, -0.020906925201416016, -0.019170761108398438, -0.01743459701538086, -0.01569843292236328, -0.013962268829345703, -0.012226104736328125, -0.010489940643310547, -0.008753776550292969, -0.007017612457275391, -0.0052814483642578125, -0.0035452842712402344, -0.0018091201782226562, -7.295608520507812e-05, 0.0016632080078125, 0.003399372100830078, 0.005135536193847656, 0.006871700286865234, 0.008607864379882812, 0.01034402847290039, 0.012080192565917969, 0.013816356658935547, 0.015552520751953125, 0.017288684844970703, 0.01902484893798828, 0.02076101303100586, 0.022497177124023438, 0.024233341217041016, 0.025969505310058594, 0.027705669403076172, 0.02944183349609375, 0.031177997589111328, 0.032914161682128906, 0.034650325775146484, 0.03638648986816406, 0.03812265396118164, 0.03985881805419922, 0.0415949821472168, 0.043331146240234375, 0.04506731033325195, 0.04680347442626953, 0.04853963851928711, 0.05027580261230469, 0.052011966705322266, 0.053748130798339844, 0.05548429489135742, 0.057220458984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 11.0, 18.0, 19.0, 29.0, 44.0, 56.0, 61.0, 60.0, 66.0, 96.0, 91.0, 75.0, 61.0, 66.0, 47.0, 49.0, 40.0, 31.0, 13.0, 13.0, 15.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018280029296875, -0.017775416374206543, -0.017270803451538086, -0.01676619052886963, -0.016261577606201172, -0.015756964683532715, -0.015252351760864258, -0.0147477388381958, -0.014243125915527344, -0.013738512992858887, -0.01323390007019043, -0.012729287147521973, -0.012224674224853516, -0.011720061302185059, -0.011215448379516602, -0.010710835456848145, -0.010206222534179688, -0.00970160961151123, -0.009196996688842773, -0.008692383766174316, -0.00818777084350586, -0.007683157920837402, -0.007178544998168945, -0.006673932075500488, -0.006169319152832031, -0.005664706230163574, -0.005160093307495117, -0.00465548038482666, -0.004150867462158203, -0.003646254539489746, -0.003141641616821289, -0.002637028694152832, -0.002132415771484375, -0.001627802848815918, -0.001123189926147461, -0.0006185770034790039, -0.00011396408081054688, 0.00039064884185791016, 0.0008952617645263672, 0.0013998746871948242, 0.0019044876098632812, 0.0024091005325317383, 0.0029137134552001953, 0.0034183263778686523, 0.003922939300537109, 0.004427552223205566, 0.0049321651458740234, 0.0054367780685424805, 0.0059413909912109375, 0.0064460039138793945, 0.0069506168365478516, 0.007455229759216309, 0.007959842681884766, 0.008464455604553223, 0.00896906852722168, 0.009473681449890137, 0.009978294372558594, 0.01048290729522705, 0.010987520217895508, 0.011492133140563965, 0.011996746063232422, 0.012501358985900879, 0.013005971908569336, 0.013510584831237793, 0.01401519775390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 7.0, 8.0, 19.0, 24.0, 28.0, 33.0, 35.0, 64.0, 83.0, 108.0, 173.0, 339.0, 594.0, 1647.0, 5798.0, 28495.0, 191882.0, 594827.0, 187896.0, 27579.0, 5670.0, 1615.0, 599.0, 320.0, 185.0, 127.0, 96.0, 58.0, 46.0, 40.0, 34.0, 24.0, 13.0, 16.0, 8.0, 15.0, 4.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03326416015625, -0.03224039077758789, -0.03121662139892578, -0.030192852020263672, -0.029169082641601562, -0.028145313262939453, -0.027121543884277344, -0.026097774505615234, -0.025074005126953125, -0.024050235748291016, -0.023026466369628906, -0.022002696990966797, -0.020978927612304688, -0.019955158233642578, -0.01893138885498047, -0.01790761947631836, -0.01688385009765625, -0.01586008071899414, -0.014836311340332031, -0.013812541961669922, -0.012788772583007812, -0.011765003204345703, -0.010741233825683594, -0.009717464447021484, -0.008693695068359375, -0.007669925689697266, -0.006646156311035156, -0.005622386932373047, -0.0045986175537109375, -0.003574848175048828, -0.0025510787963867188, -0.0015273094177246094, -0.0005035400390625, 0.0005202293395996094, 0.0015439987182617188, 0.002567768096923828, 0.0035915374755859375, 0.004615306854248047, 0.005639076232910156, 0.006662845611572266, 0.007686614990234375, 0.008710384368896484, 0.009734153747558594, 0.010757923126220703, 0.011781692504882812, 0.012805461883544922, 0.013829231262207031, 0.01485300064086914, 0.01587677001953125, 0.01690053939819336, 0.01792430877685547, 0.018948078155517578, 0.019971847534179688, 0.020995616912841797, 0.022019386291503906, 0.023043155670166016, 0.024066925048828125, 0.025090694427490234, 0.026114463806152344, 0.027138233184814453, 0.028162002563476562, 0.029185771942138672, 0.03020954132080078, 0.03123331069946289, 0.032257080078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 8.0, 9.0, 11.0, 9.0, 10.0, 11.0, 16.0, 18.0, 25.0, 29.0, 37.0, 57.0, 38.0, 39.0, 46.0, 57.0, 56.0, 62.0, 45.0, 45.0, 37.0, 63.0, 49.0, 45.0, 29.0, 26.0, 27.0, 19.0, 14.0, 14.0, 7.0, 10.0, 10.0, 10.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03741455078125, -0.036124229431152344, -0.03483390808105469, -0.03354358673095703, -0.032253265380859375, -0.03096294403076172, -0.029672622680664062, -0.028382301330566406, -0.02709197998046875, -0.025801658630371094, -0.024511337280273438, -0.02322101593017578, -0.021930694580078125, -0.02064037322998047, -0.019350051879882812, -0.018059730529785156, -0.0167694091796875, -0.015479087829589844, -0.014188766479492188, -0.012898445129394531, -0.011608123779296875, -0.010317802429199219, -0.009027481079101562, -0.007737159729003906, -0.00644683837890625, -0.005156517028808594, -0.0038661956787109375, -0.0025758743286132812, -0.001285552978515625, 4.76837158203125e-06, 0.0012950897216796875, 0.0025854110717773438, 0.003875732421875, 0.005166053771972656, 0.0064563751220703125, 0.007746696472167969, 0.009037017822265625, 0.010327339172363281, 0.011617660522460938, 0.012907981872558594, 0.01419830322265625, 0.015488624572753906, 0.016778945922851562, 0.01806926727294922, 0.019359588623046875, 0.02064990997314453, 0.021940231323242188, 0.023230552673339844, 0.0245208740234375, 0.025811195373535156, 0.027101516723632812, 0.02839183807373047, 0.029682159423828125, 0.03097248077392578, 0.03226280212402344, 0.033553123474121094, 0.03484344482421875, 0.036133766174316406, 0.03742408752441406, 0.03871440887451172, 0.040004730224609375, 0.04129505157470703, 0.04258537292480469, 0.043875694274902344, 0.045166015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 18.0, 54.0, 119.0, 318.0, 1952.0, 913108.0, 131502.0, 1062.0, 245.0, 97.0, 40.0, 16.0, 14.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072265625, -0.06999874114990234, -0.06773185729980469, -0.06546497344970703, -0.06319808959960938, -0.06093120574951172, -0.05866432189941406, -0.056397438049316406, -0.05413055419921875, -0.051863670349121094, -0.04959678649902344, -0.04732990264892578, -0.045063018798828125, -0.04279613494873047, -0.04052925109863281, -0.038262367248535156, -0.0359954833984375, -0.033728599548339844, -0.03146171569824219, -0.02919483184814453, -0.026927947998046875, -0.02466106414794922, -0.022394180297851562, -0.020127296447753906, -0.01786041259765625, -0.015593528747558594, -0.013326644897460938, -0.011059761047363281, -0.008792877197265625, -0.006525993347167969, -0.0042591094970703125, -0.0019922256469726562, 0.000274658203125, 0.0025415420532226562, 0.0048084259033203125, 0.007075309753417969, 0.009342193603515625, 0.011609077453613281, 0.013875961303710938, 0.016142845153808594, 0.01840972900390625, 0.020676612854003906, 0.022943496704101562, 0.02521038055419922, 0.027477264404296875, 0.02974414825439453, 0.03201103210449219, 0.034277915954589844, 0.0365447998046875, 0.038811683654785156, 0.04107856750488281, 0.04334545135498047, 0.045612335205078125, 0.04787921905517578, 0.05014610290527344, 0.052412986755371094, 0.05467987060546875, 0.056946754455566406, 0.05921363830566406, 0.06148052215576172, 0.06374740600585938, 0.06601428985595703, 0.06828117370605469, 0.07054805755615234, 0.07281494140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 24.0, 110.0, 339.0, 381.0, 101.0, 35.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005464553833007812, -0.0005337707698345184, -0.0005210861563682556, -0.0005084015429019928, -0.00049571692943573, -0.00048303231596946716, -0.00047034770250320435, -0.00045766308903694153, -0.0004449784755706787, -0.0004322938621044159, -0.0004196092486381531, -0.00040692463517189026, -0.00039424002170562744, -0.0003815554082393646, -0.0003688707947731018, -0.000356186181306839, -0.00034350156784057617, -0.00033081695437431335, -0.00031813234090805054, -0.0003054477274417877, -0.0002927631139755249, -0.0002800785005092621, -0.00026739388704299927, -0.00025470927357673645, -0.00024202466011047363, -0.00022934004664421082, -0.000216655433177948, -0.00020397081971168518, -0.00019128620624542236, -0.00017860159277915955, -0.00016591697931289673, -0.0001532323658466339, -0.0001405477523803711, -0.00012786313891410828, -0.00011517852544784546, -0.00010249391198158264, -8.980929851531982e-05, -7.712468504905701e-05, -6.444007158279419e-05, -5.175545811653137e-05, -3.9070844650268555e-05, -2.6386231184005737e-05, -1.370161771774292e-05, -1.0170042514801025e-06, 1.1667609214782715e-05, 2.4352222681045532e-05, 3.703683614730835e-05, 4.972144961357117e-05, 6.240606307983398e-05, 7.50906765460968e-05, 8.777529001235962e-05, 0.00010045990347862244, 0.00011314451694488525, 0.00012582913041114807, 0.0001385137438774109, 0.0001511983573436737, 0.00016388297080993652, 0.00017656758427619934, 0.00018925219774246216, 0.00020193681120872498, 0.0002146214246749878, 0.0002273060381412506, 0.00023999065160751343, 0.00025267526507377625, 0.00026535987854003906]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 17.0, 51.0, 113.0, 321.0, 1494.0, 838401.0, 206700.0, 1051.0, 247.0, 88.0, 39.0, 8.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.0980076789855957, -0.0956125259399414, -0.09321737289428711, -0.09082221984863281, -0.08842706680297852, -0.08603191375732422, -0.08363676071166992, -0.08124160766601562, -0.07884645462036133, -0.07645130157470703, -0.07405614852905273, -0.07166099548339844, -0.06926584243774414, -0.06687068939208984, -0.06447553634643555, -0.06208038330078125, -0.05968523025512695, -0.057290077209472656, -0.05489492416381836, -0.05249977111816406, -0.050104618072509766, -0.04770946502685547, -0.04531431198120117, -0.042919158935546875, -0.04052400588989258, -0.03812885284423828, -0.035733699798583984, -0.03333854675292969, -0.03094339370727539, -0.028548240661621094, -0.026153087615966797, -0.0237579345703125, -0.021362781524658203, -0.018967628479003906, -0.01657247543334961, -0.014177322387695312, -0.011782169342041016, -0.009387016296386719, -0.006991863250732422, -0.004596710205078125, -0.002201557159423828, 0.00019359588623046875, 0.0025887489318847656, 0.0049839019775390625, 0.007379055023193359, 0.009774208068847656, 0.012169361114501953, 0.01456451416015625, 0.016959667205810547, 0.019354820251464844, 0.02174997329711914, 0.024145126342773438, 0.026540279388427734, 0.02893543243408203, 0.03133058547973633, 0.033725738525390625, 0.03612089157104492, 0.03851604461669922, 0.040911197662353516, 0.04330635070800781, 0.04570150375366211, 0.048096656799316406, 0.0504918098449707, 0.052886962890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 22.0, 27.0, 117.0, 258.0, 325.0, 162.0, 58.0, 23.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07177734375, -0.07007789611816406, -0.06837844848632812, -0.06667900085449219, -0.06497955322265625, -0.06328010559082031, -0.061580657958984375, -0.05988121032714844, -0.0581817626953125, -0.05648231506347656, -0.054782867431640625, -0.05308341979980469, -0.05138397216796875, -0.04968452453613281, -0.047985076904296875, -0.04628562927246094, -0.044586181640625, -0.04288673400878906, -0.041187286376953125, -0.03948783874511719, -0.03778839111328125, -0.03608894348144531, -0.034389495849609375, -0.03269004821777344, -0.0309906005859375, -0.029291152954101562, -0.027591705322265625, -0.025892257690429688, -0.02419281005859375, -0.022493362426757812, -0.020793914794921875, -0.019094467163085938, -0.01739501953125, -0.015695571899414062, -0.013996124267578125, -0.012296676635742188, -0.01059722900390625, -0.008897781372070312, -0.007198333740234375, -0.0054988861083984375, -0.0037994384765625, -0.0020999908447265625, -0.000400543212890625, 0.0012989044189453125, 0.00299835205078125, 0.0046977996826171875, 0.006397247314453125, 0.008096694946289062, 0.009796142578125, 0.011495590209960938, 0.013195037841796875, 0.014894485473632812, 0.01659393310546875, 0.018293380737304688, 0.019992828369140625, 0.021692276000976562, 0.0233917236328125, 0.025091171264648438, 0.026790618896484375, 0.028490066528320312, 0.03018951416015625, 0.03188896179199219, 0.033588409423828125, 0.03528785705566406, 0.0369873046875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 28.0, 121.0, 345.0, 320.0, 123.0, 40.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5841373205184937, -0.5686408281326294, -0.5531442761421204, -0.5376477837562561, -0.5221512913703918, -0.5066547989845276, -0.49115824699401855, -0.4756617546081543, -0.46016526222229004, -0.4446687400341034, -0.42917224764823914, -0.4136757254600525, -0.39817923307418823, -0.3826827108860016, -0.36718618869781494, -0.3516896963119507, -0.33619317412376404, -0.3206966519355774, -0.30520015954971313, -0.2897036373615265, -0.27420714497566223, -0.2587106227874756, -0.24321411550045013, -0.22771760821342468, -0.21222110092639923, -0.19672459363937378, -0.18122808635234833, -0.16573157906532288, -0.15023505687713623, -0.13473856449127197, -0.11924204230308533, -0.10374553501605988, -0.08824902772903442, -0.07275252044200897, -0.05725600942969322, -0.04175949841737747, -0.02626299113035202, -0.010766483843326569, 0.00473003089427948, 0.02022653818130493, 0.03572304546833038, 0.051219552755355835, 0.06671606004238129, 0.08221257477998734, 0.09770908206701279, 0.11320558935403824, 0.1287021040916443, 0.14419861137866974, 0.1596951186656952, 0.17519162595272064, 0.1906881332397461, 0.20618465542793274, 0.221681147813797, 0.23717767000198364, 0.2526741623878479, 0.26817068457603455, 0.2836672067642212, 0.29916372895240784, 0.3146602213382721, 0.33015674352645874, 0.345653235912323, 0.36114975810050964, 0.3766462802886963, 0.39214277267456055, 0.4076392650604248]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 7.0, 4.0, 7.0, 13.0, 7.0, 13.0, 16.0, 24.0, 20.0, 36.0, 24.0, 28.0, 32.0, 32.0, 34.0, 43.0, 41.0, 33.0, 41.0, 47.0, 45.0, 50.0, 43.0, 45.0, 35.0, 37.0, 31.0, 36.0, 30.0, 19.0, 31.0, 17.0, 15.0, 12.0, 6.0, 12.0, 11.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1760135293006897, -0.17053663730621338, -0.16505974531173706, -0.15958286821842194, -0.15410597622394562, -0.1486290842294693, -0.14315220713615417, -0.13767531514167786, -0.13219842314720154, -0.12672153115272522, -0.1212446466088295, -0.11576776206493378, -0.11029087007045746, -0.10481397807598114, -0.09933709353208542, -0.0938602089881897, -0.08838331699371338, -0.08290642499923706, -0.07742954045534134, -0.07195265591144562, -0.0664757639169693, -0.06099887564778328, -0.05552198737859726, -0.05004509910941124, -0.04456821084022522, -0.0390913225710392, -0.03361443430185318, -0.02813754603266716, -0.02266065776348114, -0.01718376949429512, -0.0117068812251091, -0.0062299929559230804, -0.0007531046867370605, 0.004723783582448959, 0.01020067185163498, 0.015677560120821, 0.02115444839000702, 0.02663133665919304, 0.03210822492837906, 0.03758511319756508, 0.0430620014667511, 0.04853888973593712, 0.05401577800512314, 0.05949266627430916, 0.06496955454349518, 0.0704464465379715, 0.07592333108186722, 0.08140021562576294, 0.08687710762023926, 0.09235399961471558, 0.0978308841586113, 0.10330776870250702, 0.10878466069698334, 0.11426155269145966, 0.11973843723535538, 0.1252153217792511, 0.13069221377372742, 0.13616910576820374, 0.14164599776268005, 0.14712287485599518, 0.1525997668504715, 0.15807665884494781, 0.16355353593826294, 0.16903042793273926, 0.17450731992721558]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 4.0, 6.0, 9.0, 11.0, 8.0, 15.0, 14.0, 26.0, 33.0, 54.0, 60.0, 111.0, 165.0, 326.0, 559.0, 1044.0, 2215.0, 5395.0, 16160.0, 85561.0, 3555786.0, 471026.0, 38110.0, 10104.0, 3857.0, 1706.0, 812.0, 429.0, 230.0, 162.0, 91.0, 74.0, 42.0, 24.0, 14.0, 12.0, 10.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03717041015625, -0.03592252731323242, -0.034674644470214844, -0.033426761627197266, -0.03217887878417969, -0.03093099594116211, -0.02968311309814453, -0.028435230255126953, -0.027187347412109375, -0.025939464569091797, -0.02469158172607422, -0.02344369888305664, -0.022195816040039062, -0.020947933197021484, -0.019700050354003906, -0.018452167510986328, -0.01720428466796875, -0.015956401824951172, -0.014708518981933594, -0.013460636138916016, -0.012212753295898438, -0.01096487045288086, -0.009716987609863281, -0.008469104766845703, -0.007221221923828125, -0.005973339080810547, -0.004725456237792969, -0.0034775733947753906, -0.0022296905517578125, -0.0009818077087402344, 0.00026607513427734375, 0.0015139579772949219, 0.0027618408203125, 0.004009723663330078, 0.005257606506347656, 0.006505489349365234, 0.0077533721923828125, 0.00900125503540039, 0.010249137878417969, 0.011497020721435547, 0.012744903564453125, 0.013992786407470703, 0.015240669250488281, 0.01648855209350586, 0.017736434936523438, 0.018984317779541016, 0.020232200622558594, 0.021480083465576172, 0.02272796630859375, 0.023975849151611328, 0.025223731994628906, 0.026471614837646484, 0.027719497680664062, 0.02896738052368164, 0.03021526336669922, 0.0314631462097168, 0.032711029052734375, 0.03395891189575195, 0.03520679473876953, 0.03645467758178711, 0.03770256042480469, 0.038950443267822266, 0.040198326110839844, 0.04144620895385742, 0.042694091796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 9.0, 10.0, 24.0, 32.0, 36.0, 40.0, 55.0, 67.0, 79.0, 87.0, 73.0, 70.0, 68.0, 74.0, 51.0, 44.0, 50.0, 36.0, 21.0, 19.0, 9.0, 14.0, 4.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0182342529296875, -0.017725110054016113, -0.017215967178344727, -0.01670682430267334, -0.016197681427001953, -0.015688538551330566, -0.01517939567565918, -0.014670252799987793, -0.014161109924316406, -0.01365196704864502, -0.013142824172973633, -0.012633681297302246, -0.01212453842163086, -0.011615395545959473, -0.011106252670288086, -0.0105971097946167, -0.010087966918945312, -0.009578824043273926, -0.009069681167602539, -0.008560538291931152, -0.008051395416259766, -0.007542252540588379, -0.007033109664916992, -0.0065239667892456055, -0.006014823913574219, -0.005505681037902832, -0.004996538162231445, -0.004487395286560059, -0.003978252410888672, -0.003469109535217285, -0.0029599666595458984, -0.0024508237838745117, -0.001941680908203125, -0.0014325380325317383, -0.0009233951568603516, -0.00041425228118896484, 9.489059448242188e-05, 0.0006040334701538086, 0.0011131763458251953, 0.001622319221496582, 0.0021314620971679688, 0.0026406049728393555, 0.003149747848510742, 0.003658890724182129, 0.004168033599853516, 0.004677176475524902, 0.005186319351196289, 0.005695462226867676, 0.0062046051025390625, 0.006713747978210449, 0.007222890853881836, 0.007732033729553223, 0.00824117660522461, 0.008750319480895996, 0.009259462356567383, 0.00976860523223877, 0.010277748107910156, 0.010786890983581543, 0.01129603385925293, 0.011805176734924316, 0.012314319610595703, 0.01282346248626709, 0.013332605361938477, 0.013841748237609863, 0.01435089111328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 10.0, 27.0, 36.0, 65.0, 117.0, 235.0, 465.0, 1171.0, 4005.0, 28043.0, 3802687.0, 341279.0, 11815.0, 2482.0, 923.0, 438.0, 206.0, 130.0, 70.0, 21.0, 22.0, 11.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06158447265625, -0.05964851379394531, -0.057712554931640625, -0.05577659606933594, -0.05384063720703125, -0.05190467834472656, -0.049968719482421875, -0.04803276062011719, -0.0460968017578125, -0.04416084289550781, -0.042224884033203125, -0.04028892517089844, -0.03835296630859375, -0.03641700744628906, -0.034481048583984375, -0.03254508972167969, -0.030609130859375, -0.028673171997070312, -0.026737213134765625, -0.024801254272460938, -0.02286529541015625, -0.020929336547851562, -0.018993377685546875, -0.017057418823242188, -0.0151214599609375, -0.013185501098632812, -0.011249542236328125, -0.009313583374023438, -0.00737762451171875, -0.0054416656494140625, -0.003505706787109375, -0.0015697479248046875, 0.0003662109375, 0.0023021697998046875, 0.004238128662109375, 0.0061740875244140625, 0.00811004638671875, 0.010046005249023438, 0.011981964111328125, 0.013917922973632812, 0.0158538818359375, 0.017789840698242188, 0.019725799560546875, 0.021661758422851562, 0.02359771728515625, 0.025533676147460938, 0.027469635009765625, 0.029405593872070312, 0.031341552734375, 0.03327751159667969, 0.035213470458984375, 0.03714942932128906, 0.03908538818359375, 0.04102134704589844, 0.042957305908203125, 0.04489326477050781, 0.0468292236328125, 0.04876518249511719, 0.050701141357421875, 0.05263710021972656, 0.05457305908203125, 0.05650901794433594, 0.058444976806640625, 0.06038093566894531, 0.06231689453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 7.0, 20.0, 42.0, 117.0, 290.0, 1772.0, 1412.0, 241.0, 80.0, 26.0, 16.0, 15.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179443359375, -0.017195463180541992, -0.016446590423583984, -0.015697717666625977, -0.014948844909667969, -0.014199972152709961, -0.013451099395751953, -0.012702226638793945, -0.011953353881835938, -0.01120448112487793, -0.010455608367919922, -0.009706735610961914, -0.008957862854003906, -0.008208990097045898, -0.007460117340087891, -0.006711244583129883, -0.005962371826171875, -0.005213499069213867, -0.004464626312255859, -0.0037157535552978516, -0.0029668807983398438, -0.002218008041381836, -0.0014691352844238281, -0.0007202625274658203, 2.86102294921875e-05, 0.0007774829864501953, 0.0015263557434082031, 0.002275228500366211, 0.0030241012573242188, 0.0037729740142822266, 0.004521846771240234, 0.005270719528198242, 0.00601959228515625, 0.006768465042114258, 0.007517337799072266, 0.008266210556030273, 0.009015083312988281, 0.009763956069946289, 0.010512828826904297, 0.011261701583862305, 0.012010574340820312, 0.01275944709777832, 0.013508319854736328, 0.014257192611694336, 0.015006065368652344, 0.01575493812561035, 0.01650381088256836, 0.017252683639526367, 0.018001556396484375, 0.018750429153442383, 0.01949930191040039, 0.0202481746673584, 0.020997047424316406, 0.021745920181274414, 0.022494792938232422, 0.02324366569519043, 0.023992538452148438, 0.024741411209106445, 0.025490283966064453, 0.02623915672302246, 0.02698802947998047, 0.027736902236938477, 0.028485774993896484, 0.029234647750854492, 0.0299835205078125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 11.0, 40.0, 132.0, 247.0, 277.0, 179.0, 59.0, 28.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04558504745364189, -0.04158882796764374, -0.03759261220693588, -0.03359639272093773, -0.029600173234939575, -0.02560395374894142, -0.021607736125588417, -0.017611518502235413, -0.013615299016237259, -0.00961908046156168, -0.005622861906886101, -0.0016266433522105217, 0.0023695752024650574, 0.006365794688463211, 0.010362012311816216, 0.01435822993516922, 0.018354449421167374, 0.022350668907165527, 0.026346886530518532, 0.030343104153871536, 0.03433932363986969, 0.038335543125867844, 0.042331762611866, 0.04632797837257385, 0.050324197858572006, 0.05432041734457016, 0.058316633105278015, 0.06231285259127617, 0.06630907207727432, 0.07030528783798218, 0.07430151104927063, 0.07829772680997849, 0.08229395747184753, 0.08629017323255539, 0.09028639644384384, 0.0942826122045517, 0.09827883541584015, 0.102275051176548, 0.10627126693725586, 0.11026749014854431, 0.11426370590925217, 0.11825992166996002, 0.12225614488124847, 0.12625236809253693, 0.13024857640266418, 0.13424479961395264, 0.1382410228252411, 0.14223723113536835, 0.1462334543466568, 0.15022967755794525, 0.1542258858680725, 0.15822210907936096, 0.16221833229064941, 0.16621455550193787, 0.17021076381206512, 0.17420698702335358, 0.17820319533348083, 0.1821994185447693, 0.18619562685489655, 0.190191850066185, 0.19418807327747345, 0.1981842815876007, 0.20218050479888916, 0.2061767280101776, 0.21017295122146606]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 6.0, 10.0, 21.0, 25.0, 23.0, 24.0, 43.0, 48.0, 50.0, 58.0, 80.0, 83.0, 80.0, 99.0, 59.0, 64.0, 46.0, 48.0, 32.0, 27.0, 20.0, 15.0, 17.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06990444660186768, -0.06785410642623901, -0.06580376625061035, -0.06375342607498169, -0.06170308589935303, -0.059652745723724365, -0.0576024055480957, -0.05555206537246704, -0.05350172519683838, -0.05145138502120972, -0.049401044845581055, -0.04735070466995239, -0.04530036449432373, -0.04325002431869507, -0.041199684143066406, -0.039149343967437744, -0.03709900379180908, -0.03504866361618042, -0.03299832344055176, -0.030947983264923096, -0.028897643089294434, -0.02684730291366577, -0.02479696273803711, -0.022746622562408447, -0.020696282386779785, -0.018645942211151123, -0.01659560203552246, -0.014545261859893799, -0.012494921684265137, -0.010444581508636475, -0.008394241333007812, -0.00634390115737915, -0.004293560981750488, -0.002243220806121826, -0.00019288063049316406, 0.001857459545135498, 0.00390779972076416, 0.005958139896392822, 0.008008480072021484, 0.010058820247650146, 0.012109160423278809, 0.01415950059890747, 0.016209840774536133, 0.018260180950164795, 0.020310521125793457, 0.02236086130142212, 0.02441120147705078, 0.026461541652679443, 0.028511881828308105, 0.030562222003936768, 0.03261256217956543, 0.03466290235519409, 0.036713242530822754, 0.038763582706451416, 0.04081392288208008, 0.04286426305770874, 0.0449146032333374, 0.046964943408966064, 0.04901528358459473, 0.05106562376022339, 0.05311596393585205, 0.05516630411148071, 0.057216644287109375, 0.05926698446273804, 0.0613173246383667]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 3.0, 10.0, 22.0, 34.0, 69.0, 115.0, 186.0, 422.0, 987.0, 2831.0, 12395.0, 106844.0, 718513.0, 182063.0, 18102.0, 3697.0, 1252.0, 494.0, 211.0, 119.0, 68.0, 43.0, 27.0, 12.0, 9.0, 11.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056182861328125, -0.054459571838378906, -0.05273628234863281, -0.05101299285888672, -0.049289703369140625, -0.04756641387939453, -0.04584312438964844, -0.044119834899902344, -0.04239654541015625, -0.040673255920410156, -0.03894996643066406, -0.03722667694091797, -0.035503387451171875, -0.03378009796142578, -0.03205680847167969, -0.030333518981933594, -0.0286102294921875, -0.026886940002441406, -0.025163650512695312, -0.02344036102294922, -0.021717071533203125, -0.01999378204345703, -0.018270492553710938, -0.016547203063964844, -0.01482391357421875, -0.013100624084472656, -0.011377334594726562, -0.009654045104980469, -0.007930755615234375, -0.006207466125488281, -0.0044841766357421875, -0.0027608871459960938, -0.00103759765625, 0.0006856918334960938, 0.0024089813232421875, 0.004132270812988281, 0.005855560302734375, 0.007578849792480469, 0.009302139282226562, 0.011025428771972656, 0.01274871826171875, 0.014472007751464844, 0.016195297241210938, 0.01791858673095703, 0.019641876220703125, 0.02136516571044922, 0.023088455200195312, 0.024811744689941406, 0.0265350341796875, 0.028258323669433594, 0.029981613159179688, 0.03170490264892578, 0.033428192138671875, 0.03515148162841797, 0.03687477111816406, 0.038598060607910156, 0.04032135009765625, 0.042044639587402344, 0.04376792907714844, 0.04549121856689453, 0.047214508056640625, 0.04893779754638672, 0.05066108703613281, 0.052384376525878906, 0.054107666015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 12.0, 7.0, 9.0, 15.0, 20.0, 35.0, 45.0, 57.0, 89.0, 58.0, 83.0, 83.0, 80.0, 74.0, 73.0, 53.0, 52.0, 46.0, 31.0, 23.0, 16.0, 11.0, 7.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019012451171875, -0.01848292350769043, -0.01795339584350586, -0.01742386817932129, -0.01689434051513672, -0.01636481285095215, -0.015835285186767578, -0.015305757522583008, -0.014776229858398438, -0.014246702194213867, -0.013717174530029297, -0.013187646865844727, -0.012658119201660156, -0.012128591537475586, -0.011599063873291016, -0.011069536209106445, -0.010540008544921875, -0.010010480880737305, -0.009480953216552734, -0.008951425552368164, -0.008421897888183594, -0.007892370223999023, -0.007362842559814453, -0.006833314895629883, -0.0063037872314453125, -0.005774259567260742, -0.005244731903076172, -0.0047152042388916016, -0.004185676574707031, -0.003656148910522461, -0.0031266212463378906, -0.0025970935821533203, -0.00206756591796875, -0.0015380382537841797, -0.0010085105895996094, -0.00047898292541503906, 5.054473876953125e-05, 0.0005800724029541016, 0.0011096000671386719, 0.0016391277313232422, 0.0021686553955078125, 0.002698183059692383, 0.003227710723876953, 0.0037572383880615234, 0.004286766052246094, 0.004816293716430664, 0.005345821380615234, 0.005875349044799805, 0.006404876708984375, 0.006934404373168945, 0.007463932037353516, 0.007993459701538086, 0.008522987365722656, 0.009052515029907227, 0.009582042694091797, 0.010111570358276367, 0.010641098022460938, 0.011170625686645508, 0.011700153350830078, 0.012229681015014648, 0.012759208679199219, 0.013288736343383789, 0.01381826400756836, 0.01434779167175293, 0.0148773193359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 4.0, 7.0, 10.0, 5.0, 20.0, 27.0, 21.0, 42.0, 56.0, 60.0, 96.0, 170.0, 349.0, 832.0, 3715.0, 22008.0, 167672.0, 616468.0, 204117.0, 26449.0, 4419.0, 1030.0, 390.0, 180.0, 115.0, 64.0, 54.0, 36.0, 35.0, 23.0, 17.0, 20.0, 10.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.031982421875, -0.030968666076660156, -0.029954910278320312, -0.02894115447998047, -0.027927398681640625, -0.02691364288330078, -0.025899887084960938, -0.024886131286621094, -0.02387237548828125, -0.022858619689941406, -0.021844863891601562, -0.02083110809326172, -0.019817352294921875, -0.01880359649658203, -0.017789840698242188, -0.016776084899902344, -0.0157623291015625, -0.014748573303222656, -0.013734817504882812, -0.012721061706542969, -0.011707305908203125, -0.010693550109863281, -0.009679794311523438, -0.008666038513183594, -0.00765228271484375, -0.006638526916503906, -0.0056247711181640625, -0.004611015319824219, -0.003597259521484375, -0.0025835037231445312, -0.0015697479248046875, -0.0005559921264648438, 0.000457763671875, 0.0014715194702148438, 0.0024852752685546875, 0.0034990310668945312, 0.004512786865234375, 0.005526542663574219, 0.0065402984619140625, 0.007554054260253906, 0.00856781005859375, 0.009581565856933594, 0.010595321655273438, 0.011609077453613281, 0.012622833251953125, 0.013636589050292969, 0.014650344848632812, 0.015664100646972656, 0.0166778564453125, 0.017691612243652344, 0.018705368041992188, 0.01971912384033203, 0.020732879638671875, 0.02174663543701172, 0.022760391235351562, 0.023774147033691406, 0.02478790283203125, 0.025801658630371094, 0.026815414428710938, 0.02782917022705078, 0.028842926025390625, 0.02985668182373047, 0.030870437622070312, 0.031884193420410156, 0.03289794921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 6.0, 8.0, 9.0, 12.0, 14.0, 20.0, 21.0, 29.0, 29.0, 29.0, 41.0, 39.0, 39.0, 40.0, 43.0, 39.0, 57.0, 47.0, 41.0, 47.0, 36.0, 44.0, 36.0, 37.0, 37.0, 28.0, 23.0, 27.0, 15.0, 16.0, 10.0, 17.0, 12.0, 12.0, 11.0, 9.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.039093017578125, -0.038004159927368164, -0.03691530227661133, -0.03582644462585449, -0.034737586975097656, -0.03364872932434082, -0.032559871673583984, -0.03147101402282715, -0.030382156372070312, -0.029293298721313477, -0.02820444107055664, -0.027115583419799805, -0.02602672576904297, -0.024937868118286133, -0.023849010467529297, -0.02276015281677246, -0.021671295166015625, -0.02058243751525879, -0.019493579864501953, -0.018404722213745117, -0.01731586456298828, -0.016227006912231445, -0.01513814926147461, -0.014049291610717773, -0.012960433959960938, -0.011871576309204102, -0.010782718658447266, -0.00969386100769043, -0.008605003356933594, -0.007516145706176758, -0.006427288055419922, -0.005338430404663086, -0.00424957275390625, -0.003160715103149414, -0.002071857452392578, -0.0009829998016357422, 0.00010585784912109375, 0.0011947154998779297, 0.0022835731506347656, 0.0033724308013916016, 0.0044612884521484375, 0.0055501461029052734, 0.006639003753662109, 0.007727861404418945, 0.008816719055175781, 0.009905576705932617, 0.010994434356689453, 0.012083292007446289, 0.013172149658203125, 0.014261007308959961, 0.015349864959716797, 0.016438722610473633, 0.01752758026123047, 0.018616437911987305, 0.01970529556274414, 0.020794153213500977, 0.021883010864257812, 0.02297186851501465, 0.024060726165771484, 0.02514958381652832, 0.026238441467285156, 0.027327299118041992, 0.028416156768798828, 0.029505014419555664, 0.0305938720703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 14.0, 8.0, 11.0, 16.0, 13.0, 13.0, 29.0, 21.0, 41.0, 44.0, 63.0, 93.0, 113.0, 138.0, 251.0, 447.0, 763.0, 2082.0, 7549.0, 56816.0, 495452.0, 428305.0, 45844.0, 6584.0, 1771.0, 740.0, 420.0, 253.0, 166.0, 107.0, 114.0, 71.0, 55.0, 41.0, 29.0, 18.0, 12.0, 12.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.01374053955078125, -0.013358354568481445, -0.01297616958618164, -0.012593984603881836, -0.012211799621582031, -0.011829614639282227, -0.011447429656982422, -0.011065244674682617, -0.010683059692382812, -0.010300874710083008, -0.009918689727783203, -0.009536504745483398, -0.009154319763183594, -0.008772134780883789, -0.008389949798583984, -0.00800776481628418, -0.007625579833984375, -0.00724339485168457, -0.006861209869384766, -0.006479024887084961, -0.006096839904785156, -0.0057146549224853516, -0.005332469940185547, -0.004950284957885742, -0.0045680999755859375, -0.004185914993286133, -0.003803730010986328, -0.0034215450286865234, -0.0030393600463867188, -0.002657175064086914, -0.0022749900817871094, -0.0018928050994873047, -0.0015106201171875, -0.0011284351348876953, -0.0007462501525878906, -0.00036406517028808594, 1.811981201171875e-05, 0.00040030479431152344, 0.0007824897766113281, 0.0011646747589111328, 0.0015468597412109375, 0.0019290447235107422, 0.002311229705810547, 0.0026934146881103516, 0.0030755996704101562, 0.003457784652709961, 0.0038399696350097656, 0.00422215461730957, 0.004604339599609375, 0.00498652458190918, 0.005368709564208984, 0.005750894546508789, 0.006133079528808594, 0.0065152645111083984, 0.006897449493408203, 0.007279634475708008, 0.0076618194580078125, 0.008044004440307617, 0.008426189422607422, 0.008808374404907227, 0.009190559387207031, 0.009572744369506836, 0.00995492935180664, 0.010337114334106445, 0.01071929931640625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 8.0, 25.0, 56.0, 123.0, 259.0, 267.0, 150.0, 61.0, 30.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022554397583007812, -0.00021928176283836365, -0.00021301954984664917, -0.0002067573368549347, -0.00020049512386322021, -0.00019423291087150574, -0.00018797069787979126, -0.00018170848488807678, -0.0001754462718963623, -0.00016918405890464783, -0.00016292184591293335, -0.00015665963292121887, -0.0001503974199295044, -0.00014413520693778992, -0.00013787299394607544, -0.00013161078095436096, -0.00012534856796264648, -0.00011908635497093201, -0.00011282414197921753, -0.00010656192898750305, -0.00010029971599578857, -9.40375030040741e-05, -8.777529001235962e-05, -8.151307702064514e-05, -7.525086402893066e-05, -6.898865103721619e-05, -6.272643804550171e-05, -5.646422505378723e-05, -5.0202012062072754e-05, -4.3939799070358276e-05, -3.76775860786438e-05, -3.141537308692932e-05, -2.5153160095214844e-05, -1.8890947103500366e-05, -1.2628734111785889e-05, -6.366521120071411e-06, -1.043081283569336e-07, 6.157904863357544e-06, 1.2420117855072021e-05, 1.86823308467865e-05, 2.4944543838500977e-05, 3.1206756830215454e-05, 3.746896982192993e-05, 4.373118281364441e-05, 4.999339580535889e-05, 5.6255608797073364e-05, 6.251782178878784e-05, 6.878003478050232e-05, 7.50422477722168e-05, 8.130446076393127e-05, 8.756667375564575e-05, 9.382888674736023e-05, 0.00010009109973907471, 0.00010635331273078918, 0.00011261552572250366, 0.00011887773871421814, 0.00012513995170593262, 0.0001314021646976471, 0.00013766437768936157, 0.00014392659068107605, 0.00015018880367279053, 0.000156451016664505, 0.00016271322965621948, 0.00016897544264793396, 0.00017523765563964844]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 7.0, 23.0, 37.0, 63.0, 133.0, 270.0, 626.0, 2040.0, 18186.0, 527355.0, 480339.0, 16357.0, 1984.0, 593.0, 255.0, 129.0, 72.0, 25.0, 21.0, 14.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0270843505859375, -0.02645421028137207, -0.02582406997680664, -0.02519392967224121, -0.02456378936767578, -0.02393364906311035, -0.023303508758544922, -0.022673368453979492, -0.022043228149414062, -0.021413087844848633, -0.020782947540283203, -0.020152807235717773, -0.019522666931152344, -0.018892526626586914, -0.018262386322021484, -0.017632246017456055, -0.017002105712890625, -0.016371965408325195, -0.015741825103759766, -0.015111684799194336, -0.014481544494628906, -0.013851404190063477, -0.013221263885498047, -0.012591123580932617, -0.011960983276367188, -0.011330842971801758, -0.010700702667236328, -0.010070562362670898, -0.009440422058105469, -0.008810281753540039, -0.00818014144897461, -0.00755000114440918, -0.00691986083984375, -0.00628972053527832, -0.005659580230712891, -0.005029439926147461, -0.004399299621582031, -0.0037691593170166016, -0.003139019012451172, -0.002508878707885742, -0.0018787384033203125, -0.0012485980987548828, -0.0006184577941894531, 1.1682510375976562e-05, 0.0006418228149414062, 0.001271963119506836, 0.0019021034240722656, 0.0025322437286376953, 0.003162384033203125, 0.0037925243377685547, 0.004422664642333984, 0.005052804946899414, 0.005682945251464844, 0.0063130855560302734, 0.006943225860595703, 0.007573366165161133, 0.008203506469726562, 0.008833646774291992, 0.009463787078857422, 0.010093927383422852, 0.010724067687988281, 0.011354207992553711, 0.01198434829711914, 0.01261448860168457, 0.01324462890625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 10.0, 22.0, 31.0, 58.0, 89.0, 112.0, 130.0, 145.0, 127.0, 98.0, 73.0, 46.0, 23.0, 13.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02392578125, -0.023298263549804688, -0.022670745849609375, -0.022043228149414062, -0.02141571044921875, -0.020788192749023438, -0.020160675048828125, -0.019533157348632812, -0.0189056396484375, -0.018278121948242188, -0.017650604248046875, -0.017023086547851562, -0.01639556884765625, -0.015768051147460938, -0.015140533447265625, -0.014513015747070312, -0.013885498046875, -0.013257980346679688, -0.012630462646484375, -0.012002944946289062, -0.01137542724609375, -0.010747909545898438, -0.010120391845703125, -0.009492874145507812, -0.0088653564453125, -0.008237838745117188, -0.007610321044921875, -0.0069828033447265625, -0.00635528564453125, -0.0057277679443359375, -0.005100250244140625, -0.0044727325439453125, -0.00384521484375, -0.0032176971435546875, -0.002590179443359375, -0.0019626617431640625, -0.00133514404296875, -0.0007076263427734375, -8.0108642578125e-05, 0.0005474090576171875, 0.0011749267578125, 0.0018024444580078125, 0.002429962158203125, 0.0030574798583984375, 0.00368499755859375, 0.0043125152587890625, 0.004940032958984375, 0.0055675506591796875, 0.006195068359375, 0.0068225860595703125, 0.007450103759765625, 0.008077621459960938, 0.00870513916015625, 0.009332656860351562, 0.009960174560546875, 0.010587692260742188, 0.0112152099609375, 0.011842727661132812, 0.012470245361328125, 0.013097763061523438, 0.01372528076171875, 0.014352798461914062, 0.014980316162109375, 0.015607833862304688, 0.0162353515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 143.0, 655.0, 192.0, 10.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7687674760818481, -0.7418866753578186, -0.7150059342384338, -0.6881251335144043, -0.6612443923950195, -0.63436359167099, -0.6074827909469604, -0.5806020498275757, -0.5537213087081909, -0.5268405079841614, -0.4999597668647766, -0.47307896614074707, -0.4461982250213623, -0.41931742429733276, -0.3924366533756256, -0.36555588245391846, -0.3386750817298889, -0.31179431080818176, -0.2849135398864746, -0.25803273916244507, -0.2311519831418991, -0.20427121222019196, -0.1773904263973236, -0.15050965547561646, -0.1236288845539093, -0.09674811363220215, -0.0698673352599144, -0.04298655688762665, -0.016105785965919495, 0.010774984955787659, 0.037655770778656006, 0.06453654170036316, 0.09141731262207031, 0.11829808354377747, 0.14517885446548462, 0.17205964028835297, 0.19894041121006012, 0.22582118213176727, 0.2527019679546356, 0.2795827388763428, 0.3064635097980499, 0.3333442807197571, 0.36022505164146423, 0.3871058225631714, 0.4139866232872009, 0.4408673644065857, 0.46774816513061523, 0.4946289360523224, 0.5215097069740295, 0.5483905076980591, 0.5752712488174438, 0.6021520495414734, 0.6290327906608582, 0.6559135913848877, 0.6827943325042725, 0.709675133228302, 0.7365559339523315, 0.7634367346763611, 0.7903174757957458, 0.8171982765197754, 0.8440790176391602, 0.8709598183631897, 0.8978406190872192, 0.924721360206604, 0.9516021013259888]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 10.0, 12.0, 15.0, 14.0, 15.0, 19.0, 18.0, 19.0, 36.0, 31.0, 43.0, 44.0, 37.0, 36.0, 41.0, 43.0, 47.0, 40.0, 49.0, 40.0, 37.0, 44.0, 51.0, 29.0, 31.0, 35.0, 23.0, 19.0, 14.0, 16.0, 15.0, 9.0, 18.0, 9.0, 11.0, 4.0, 4.0, 10.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16052979230880737, -0.15533432364463806, -0.15013884007930756, -0.14494337141513824, -0.13974788784980774, -0.13455241918563843, -0.12935693562030792, -0.12416146695613861, -0.1189659908413887, -0.1137705147266388, -0.10857503861188889, -0.10337956249713898, -0.09818409383296967, -0.09298861026763916, -0.08779314160346985, -0.08259766548871994, -0.07740218937397003, -0.07220671325922012, -0.06701123714447021, -0.061815764755010605, -0.056620288640260696, -0.05142481252551079, -0.04622934013605118, -0.04103386402130127, -0.03583838790655136, -0.030642911791801453, -0.025447437539696693, -0.020251963287591934, -0.015056487172842026, -0.009861011058092117, -0.004665536805987358, 0.0005299374461174011, 0.00572541356086731, 0.010920888744294643, 0.016116363927721977, 0.021311838179826736, 0.026507314294576645, 0.03170279040932655, 0.03689826279878616, 0.04209373891353607, 0.04728921502828598, 0.05248469114303589, 0.0576801672577858, 0.0628756433725357, 0.06807111203670502, 0.07326659560203552, 0.07846206426620483, 0.08365754038095474, 0.08885301649570465, 0.09404849261045456, 0.09924396872520447, 0.10443944483995438, 0.10963492095470428, 0.1148303896188736, 0.1200258657336235, 0.1252213418483734, 0.13041681051254272, 0.13561227917671204, 0.14080776274204254, 0.14600323140621185, 0.15119871497154236, 0.15639418363571167, 0.16158966720104218, 0.1667851358652115, 0.171980619430542]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 11.0, 22.0, 33.0, 67.0, 127.0, 212.0, 488.0, 1526.0, 7132.0, 101771.0, 4048279.0, 28646.0, 4099.0, 1088.0, 361.0, 183.0, 91.0, 56.0, 23.0, 26.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11083984375, -0.1077871322631836, -0.10473442077636719, -0.10168170928955078, -0.09862899780273438, -0.09557628631591797, -0.09252357482910156, -0.08947086334228516, -0.08641815185546875, -0.08336544036865234, -0.08031272888183594, -0.07726001739501953, -0.07420730590820312, -0.07115459442138672, -0.06810188293457031, -0.0650491714477539, -0.0619964599609375, -0.058943748474121094, -0.05589103698730469, -0.05283832550048828, -0.049785614013671875, -0.04673290252685547, -0.04368019104003906, -0.040627479553222656, -0.03757476806640625, -0.034522056579589844, -0.03146934509277344, -0.02841663360595703, -0.025363922119140625, -0.02231121063232422, -0.019258499145507812, -0.016205787658691406, -0.013153076171875, -0.010100364685058594, -0.0070476531982421875, -0.003994941711425781, -0.000942230224609375, 0.0021104812622070312, 0.0051631927490234375, 0.008215904235839844, 0.01126861572265625, 0.014321327209472656, 0.017374038696289062, 0.02042675018310547, 0.023479461669921875, 0.02653217315673828, 0.029584884643554688, 0.032637596130371094, 0.0356903076171875, 0.038743019104003906, 0.04179573059082031, 0.04484844207763672, 0.047901153564453125, 0.05095386505126953, 0.05400657653808594, 0.057059288024902344, 0.06011199951171875, 0.06316471099853516, 0.06621742248535156, 0.06927013397216797, 0.07232284545898438, 0.07537555694580078, 0.07842826843261719, 0.0814809799194336, 0.08453369140625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 10.0, 15.0, 15.0, 22.0, 37.0, 52.0, 56.0, 64.0, 71.0, 89.0, 84.0, 84.0, 88.0, 69.0, 56.0, 54.0, 30.0, 31.0, 16.0, 14.0, 11.0, 4.0, 4.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0192718505859375, -0.018731236457824707, -0.018190622329711914, -0.01765000820159912, -0.017109394073486328, -0.016568779945373535, -0.016028165817260742, -0.01548755168914795, -0.014946937561035156, -0.014406323432922363, -0.01386570930480957, -0.013325095176696777, -0.012784481048583984, -0.012243866920471191, -0.011703252792358398, -0.011162638664245605, -0.010622024536132812, -0.01008141040802002, -0.009540796279907227, -0.009000182151794434, -0.00845956802368164, -0.007918953895568848, -0.007378339767456055, -0.006837725639343262, -0.006297111511230469, -0.005756497383117676, -0.005215883255004883, -0.00467526912689209, -0.004134654998779297, -0.003594040870666504, -0.003053426742553711, -0.002512812614440918, -0.001972198486328125, -0.001431584358215332, -0.0008909702301025391, -0.0003503561019897461, 0.00019025802612304688, 0.0007308721542358398, 0.0012714862823486328, 0.0018121004104614258, 0.0023527145385742188, 0.0028933286666870117, 0.0034339427947998047, 0.003974556922912598, 0.004515171051025391, 0.005055785179138184, 0.0055963993072509766, 0.0061370134353637695, 0.0066776275634765625, 0.0072182416915893555, 0.0077588558197021484, 0.008299469947814941, 0.008840084075927734, 0.009380698204040527, 0.00992131233215332, 0.010461926460266113, 0.011002540588378906, 0.0115431547164917, 0.012083768844604492, 0.012624382972717285, 0.013164997100830078, 0.013705611228942871, 0.014246225357055664, 0.014786839485168457, 0.01532745361328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 10.0, 11.0, 21.0, 22.0, 46.0, 78.0, 125.0, 218.0, 345.0, 751.0, 1857.0, 6081.0, 29706.0, 767458.0, 3334705.0, 40904.0, 7631.0, 2360.0, 910.0, 420.0, 242.0, 145.0, 88.0, 61.0, 36.0, 20.0, 10.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04779052734375, -0.04642820358276367, -0.045065879821777344, -0.043703556060791016, -0.04234123229980469, -0.04097890853881836, -0.03961658477783203, -0.0382542610168457, -0.036891937255859375, -0.03552961349487305, -0.03416728973388672, -0.03280496597290039, -0.03144264221191406, -0.030080318450927734, -0.028717994689941406, -0.027355670928955078, -0.02599334716796875, -0.024631023406982422, -0.023268699645996094, -0.021906375885009766, -0.020544052124023438, -0.01918172836303711, -0.01781940460205078, -0.016457080841064453, -0.015094757080078125, -0.013732433319091797, -0.012370109558105469, -0.01100778579711914, -0.009645462036132812, -0.008283138275146484, -0.006920814514160156, -0.005558490753173828, -0.0041961669921875, -0.002833843231201172, -0.0014715194702148438, -0.00010919570922851562, 0.0012531280517578125, 0.0026154518127441406, 0.003977775573730469, 0.005340099334716797, 0.006702423095703125, 0.008064746856689453, 0.009427070617675781, 0.01078939437866211, 0.012151718139648438, 0.013514041900634766, 0.014876365661621094, 0.016238689422607422, 0.01760101318359375, 0.018963336944580078, 0.020325660705566406, 0.021687984466552734, 0.023050308227539062, 0.02441263198852539, 0.02577495574951172, 0.027137279510498047, 0.028499603271484375, 0.029861927032470703, 0.03122425079345703, 0.03258657455444336, 0.03394889831542969, 0.035311222076416016, 0.036673545837402344, 0.03803586959838867, 0.039398193359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 9.0, 23.0, 43.0, 62.0, 212.0, 2333.0, 1058.0, 165.0, 65.0, 34.0, 16.0, 16.0, 7.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0221710205078125, -0.02142930030822754, -0.020687580108642578, -0.019945859909057617, -0.019204139709472656, -0.018462419509887695, -0.017720699310302734, -0.016978979110717773, -0.016237258911132812, -0.015495538711547852, -0.01475381851196289, -0.01401209831237793, -0.013270378112792969, -0.012528657913208008, -0.011786937713623047, -0.011045217514038086, -0.010303497314453125, -0.009561777114868164, -0.008820056915283203, -0.008078336715698242, -0.007336616516113281, -0.00659489631652832, -0.005853176116943359, -0.0051114559173583984, -0.0043697357177734375, -0.0036280155181884766, -0.0028862953186035156, -0.0021445751190185547, -0.0014028549194335938, -0.0006611347198486328, 8.058547973632812e-05, 0.0008223056793212891, 0.00156402587890625, 0.002305746078491211, 0.003047466278076172, 0.003789186477661133, 0.004530906677246094, 0.005272626876831055, 0.006014347076416016, 0.0067560672760009766, 0.0074977874755859375, 0.008239507675170898, 0.00898122787475586, 0.00972294807434082, 0.010464668273925781, 0.011206388473510742, 0.011948108673095703, 0.012689828872680664, 0.013431549072265625, 0.014173269271850586, 0.014914989471435547, 0.015656709671020508, 0.01639842987060547, 0.01714015007019043, 0.01788187026977539, 0.01862359046936035, 0.019365310668945312, 0.020107030868530273, 0.020848751068115234, 0.021590471267700195, 0.022332191467285156, 0.023073911666870117, 0.023815631866455078, 0.02455735206604004, 0.025299072265625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 25.0, 185.0, 464.0, 260.0, 39.0, 11.0, 5.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17471513152122498, -0.16899962723255157, -0.16328412294387817, -0.15756861865520477, -0.15185311436653137, -0.14613761007785797, -0.14042210578918457, -0.13470660150051117, -0.12899109721183777, -0.12327559292316437, -0.11756008863449097, -0.11184458434581757, -0.10612908005714417, -0.10041357576847076, -0.09469807147979736, -0.08898256719112396, -0.08326706290245056, -0.07755155861377716, -0.07183605432510376, -0.06612055003643036, -0.06040504574775696, -0.05468954145908356, -0.048974037170410156, -0.043258532881736755, -0.037543028593063354, -0.031827524304389954, -0.026112020015716553, -0.020396515727043152, -0.014681011438369751, -0.00896550714969635, -0.0032500028610229492, 0.0024655014276504517, 0.008180990815162659, 0.01389649510383606, 0.01961199939250946, 0.02532750368118286, 0.031043007969856262, 0.03675851225852966, 0.042474016547203064, 0.048189520835876465, 0.053905025124549866, 0.05962052941322327, 0.06533603370189667, 0.07105153799057007, 0.07676704227924347, 0.08248254656791687, 0.08819805085659027, 0.09391355514526367, 0.09962905943393707, 0.10534456372261047, 0.11106006801128387, 0.11677557229995728, 0.12249107658863068, 0.12820658087730408, 0.13392208516597748, 0.13963758945465088, 0.14535309374332428, 0.15106859803199768, 0.15678410232067108, 0.16249960660934448, 0.16821511089801788, 0.17393061518669128, 0.17964611947536469, 0.18536162376403809, 0.1910771280527115]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 17.0, 15.0, 13.0, 36.0, 41.0, 66.0, 83.0, 91.0, 111.0, 85.0, 84.0, 85.0, 64.0, 55.0, 41.0, 28.0, 20.0, 15.0, 12.0, 4.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06244534254074097, -0.060321059077978134, -0.0581967756152153, -0.05607248842716217, -0.05394820496439934, -0.051823921501636505, -0.049699634313583374, -0.04757535085082054, -0.04545106738805771, -0.043326783925294876, -0.04120250046253204, -0.03907821327447891, -0.03695392981171608, -0.03482964634895325, -0.032705359160900116, -0.030581075698137283, -0.02845679223537445, -0.026332508772611618, -0.024208223447203636, -0.022083938121795654, -0.01995965465903282, -0.01783537119626999, -0.015711085870862007, -0.0135868014767766, -0.011462517082691193, -0.009338232688605785, -0.007213948294520378, -0.005089663900434971, -0.0029653795063495636, -0.0008410951122641563, 0.001283189281821251, 0.003407473675906658, 0.005531758069992065, 0.007656042464077473, 0.00978032685816288, 0.011904611252248287, 0.014028895646333694, 0.016153179109096527, 0.01827746443450451, 0.02040174975991249, 0.022526033222675323, 0.024650316685438156, 0.026774602010846138, 0.02889888733625412, 0.031023170799016953, 0.033147454261779785, 0.035271741449832916, 0.03739602491259575, 0.03952030837535858, 0.041644591838121414, 0.04376887530088425, 0.04589316248893738, 0.04801744595170021, 0.05014172941446304, 0.052266016602516174, 0.05439030006527901, 0.05651458352804184, 0.05863886699080467, 0.060763150453567505, 0.06288743764162064, 0.06501172482967377, 0.0671360045671463, 0.06926029175519943, 0.07138457149267197, 0.0735088586807251]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 4.0, 8.0, 17.0, 18.0, 37.0, 51.0, 55.0, 85.0, 145.0, 246.0, 473.0, 830.0, 1756.0, 4289.0, 14780.0, 87899.0, 565705.0, 317461.0, 40239.0, 8569.0, 2982.0, 1324.0, 647.0, 346.0, 202.0, 105.0, 79.0, 54.0, 32.0, 29.0, 20.0, 17.0, 10.0, 9.0, 3.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04302978515625, -0.0417180061340332, -0.040406227111816406, -0.03909444808959961, -0.03778266906738281, -0.036470890045166016, -0.03515911102294922, -0.03384733200073242, -0.032535552978515625, -0.031223773956298828, -0.02991199493408203, -0.028600215911865234, -0.027288436889648438, -0.02597665786743164, -0.024664878845214844, -0.023353099822998047, -0.02204132080078125, -0.020729541778564453, -0.019417762756347656, -0.01810598373413086, -0.016794204711914062, -0.015482425689697266, -0.014170646667480469, -0.012858867645263672, -0.011547088623046875, -0.010235309600830078, -0.008923530578613281, -0.007611751556396484, -0.0062999725341796875, -0.004988193511962891, -0.0036764144897460938, -0.002364635467529297, -0.0010528564453125, 0.0002589225769042969, 0.0015707015991210938, 0.0028824806213378906, 0.0041942596435546875, 0.005506038665771484, 0.006817817687988281, 0.008129596710205078, 0.009441375732421875, 0.010753154754638672, 0.012064933776855469, 0.013376712799072266, 0.014688491821289062, 0.01600027084350586, 0.017312049865722656, 0.018623828887939453, 0.01993560791015625, 0.021247386932373047, 0.022559165954589844, 0.02387094497680664, 0.025182723999023438, 0.026494503021240234, 0.02780628204345703, 0.029118061065673828, 0.030429840087890625, 0.03174161911010742, 0.03305339813232422, 0.034365177154541016, 0.03567695617675781, 0.03698873519897461, 0.038300514221191406, 0.0396122932434082, 0.040924072265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 13.0, 21.0, 12.0, 27.0, 46.0, 54.0, 62.0, 80.0, 83.0, 72.0, 99.0, 88.0, 82.0, 71.0, 43.0, 40.0, 30.0, 20.0, 11.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.019730091094970703, -0.019165992736816406, -0.01860189437866211, -0.018037796020507812, -0.017473697662353516, -0.01690959930419922, -0.016345500946044922, -0.015781402587890625, -0.015217304229736328, -0.014653205871582031, -0.014089107513427734, -0.013525009155273438, -0.01296091079711914, -0.012396812438964844, -0.011832714080810547, -0.01126861572265625, -0.010704517364501953, -0.010140419006347656, -0.00957632064819336, -0.009012222290039062, -0.008448123931884766, -0.007884025573730469, -0.007319927215576172, -0.006755828857421875, -0.006191730499267578, -0.005627632141113281, -0.005063533782958984, -0.0044994354248046875, -0.003935337066650391, -0.0033712387084960938, -0.002807140350341797, -0.0022430419921875, -0.0016789436340332031, -0.0011148452758789062, -0.0005507469177246094, 1.33514404296875e-05, 0.0005774497985839844, 0.0011415481567382812, 0.0017056465148925781, 0.002269744873046875, 0.002833843231201172, 0.0033979415893554688, 0.003962039947509766, 0.0045261383056640625, 0.005090236663818359, 0.005654335021972656, 0.006218433380126953, 0.00678253173828125, 0.007346630096435547, 0.007910728454589844, 0.00847482681274414, 0.009038925170898438, 0.009603023529052734, 0.010167121887207031, 0.010731220245361328, 0.011295318603515625, 0.011859416961669922, 0.012423515319824219, 0.012987613677978516, 0.013551712036132812, 0.01411581039428711, 0.014679908752441406, 0.015244007110595703, 0.01580810546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 8.0, 5.0, 12.0, 20.0, 23.0, 23.0, 43.0, 47.0, 55.0, 85.0, 113.0, 139.0, 230.0, 347.0, 471.0, 903.0, 1795.0, 4911.0, 17593.0, 86502.0, 436556.0, 398730.0, 75509.0, 15829.0, 4442.0, 1694.0, 908.0, 461.0, 331.0, 205.0, 136.0, 109.0, 74.0, 58.0, 42.0, 37.0, 27.0, 20.0, 18.0, 10.0, 10.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.027496337890625, -0.02673172950744629, -0.025967121124267578, -0.025202512741088867, -0.024437904357910156, -0.023673295974731445, -0.022908687591552734, -0.022144079208374023, -0.021379470825195312, -0.0206148624420166, -0.01985025405883789, -0.01908564567565918, -0.01832103729248047, -0.017556428909301758, -0.016791820526123047, -0.016027212142944336, -0.015262603759765625, -0.014497995376586914, -0.013733386993408203, -0.012968778610229492, -0.012204170227050781, -0.01143956184387207, -0.01067495346069336, -0.009910345077514648, -0.009145736694335938, -0.008381128311157227, -0.007616519927978516, -0.006851911544799805, -0.006087303161621094, -0.005322694778442383, -0.004558086395263672, -0.003793478012084961, -0.00302886962890625, -0.002264261245727539, -0.0014996528625488281, -0.0007350444793701172, 2.956390380859375e-05, 0.0007941722869873047, 0.0015587806701660156, 0.0023233890533447266, 0.0030879974365234375, 0.0038526058197021484, 0.004617214202880859, 0.00538182258605957, 0.006146430969238281, 0.006911039352416992, 0.007675647735595703, 0.008440256118774414, 0.009204864501953125, 0.009969472885131836, 0.010734081268310547, 0.011498689651489258, 0.012263298034667969, 0.01302790641784668, 0.01379251480102539, 0.014557123184204102, 0.015321731567382812, 0.016086339950561523, 0.016850948333740234, 0.017615556716918945, 0.018380165100097656, 0.019144773483276367, 0.019909381866455078, 0.02067399024963379, 0.0214385986328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 4.0, 7.0, 11.0, 4.0, 9.0, 18.0, 11.0, 17.0, 17.0, 28.0, 20.0, 27.0, 30.0, 38.0, 36.0, 43.0, 40.0, 39.0, 48.0, 41.0, 45.0, 42.0, 27.0, 43.0, 35.0, 35.0, 40.0, 27.0, 23.0, 33.0, 28.0, 19.0, 25.0, 17.0, 13.0, 10.0, 6.0, 7.0, 6.0, 1.0, 6.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.03436279296875, -0.03330183029174805, -0.032240867614746094, -0.03117990493774414, -0.030118942260742188, -0.029057979583740234, -0.02799701690673828, -0.026936054229736328, -0.025875091552734375, -0.024814128875732422, -0.02375316619873047, -0.022692203521728516, -0.021631240844726562, -0.02057027816772461, -0.019509315490722656, -0.018448352813720703, -0.01738739013671875, -0.016326427459716797, -0.015265464782714844, -0.01420450210571289, -0.013143539428710938, -0.012082576751708984, -0.011021614074707031, -0.009960651397705078, -0.008899688720703125, -0.007838726043701172, -0.006777763366699219, -0.005716800689697266, -0.0046558380126953125, -0.0035948753356933594, -0.0025339126586914062, -0.0014729499816894531, -0.0004119873046875, 0.0006489753723144531, 0.0017099380493164062, 0.0027709007263183594, 0.0038318634033203125, 0.004892826080322266, 0.005953788757324219, 0.007014751434326172, 0.008075714111328125, 0.009136676788330078, 0.010197639465332031, 0.011258602142333984, 0.012319564819335938, 0.01338052749633789, 0.014441490173339844, 0.015502452850341797, 0.01656341552734375, 0.017624378204345703, 0.018685340881347656, 0.01974630355834961, 0.020807266235351562, 0.021868228912353516, 0.02292919158935547, 0.023990154266357422, 0.025051116943359375, 0.026112079620361328, 0.02717304229736328, 0.028234004974365234, 0.029294967651367188, 0.03035593032836914, 0.031416893005371094, 0.03247785568237305, 0.033538818359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 13.0, 13.0, 26.0, 45.0, 55.0, 127.0, 256.0, 472.0, 1133.0, 4397.0, 42702.0, 726529.0, 255792.0, 13295.0, 2228.0, 753.0, 312.0, 160.0, 89.0, 50.0, 29.0, 23.0, 22.0, 10.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02117919921875, -0.02058720588684082, -0.01999521255493164, -0.01940321922302246, -0.01881122589111328, -0.0182192325592041, -0.017627239227294922, -0.017035245895385742, -0.016443252563476562, -0.015851259231567383, -0.015259265899658203, -0.014667272567749023, -0.014075279235839844, -0.013483285903930664, -0.012891292572021484, -0.012299299240112305, -0.011707305908203125, -0.011115312576293945, -0.010523319244384766, -0.009931325912475586, -0.009339332580566406, -0.008747339248657227, -0.008155345916748047, -0.007563352584838867, -0.0069713592529296875, -0.006379365921020508, -0.005787372589111328, -0.0051953792572021484, -0.004603385925292969, -0.004011392593383789, -0.0034193992614746094, -0.0028274059295654297, -0.00223541259765625, -0.0016434192657470703, -0.0010514259338378906, -0.00045943260192871094, 0.00013256072998046875, 0.0007245540618896484, 0.0013165473937988281, 0.0019085407257080078, 0.0025005340576171875, 0.003092527389526367, 0.003684520721435547, 0.0042765140533447266, 0.004868507385253906, 0.005460500717163086, 0.006052494049072266, 0.006644487380981445, 0.007236480712890625, 0.007828474044799805, 0.008420467376708984, 0.009012460708618164, 0.009604454040527344, 0.010196447372436523, 0.010788440704345703, 0.011380434036254883, 0.011972427368164062, 0.012564420700073242, 0.013156414031982422, 0.013748407363891602, 0.014340400695800781, 0.014932394027709961, 0.01552438735961914, 0.01611638069152832, 0.0167083740234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 13.0, 27.0, 62.0, 111.0, 212.0, 229.0, 174.0, 100.0, 38.0, 20.0, 9.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.0001186951994895935, -0.00011436641216278076, -0.00011003762483596802, -0.00010570883750915527, -0.00010138005018234253, -9.705126285552979e-05, -9.272247552871704e-05, -8.83936882019043e-05, -8.406490087509155e-05, -7.973611354827881e-05, -7.540732622146606e-05, -7.107853889465332e-05, -6.674975156784058e-05, -6.242096424102783e-05, -5.809217691421509e-05, -5.3763389587402344e-05, -4.94346022605896e-05, -4.5105814933776855e-05, -4.077702760696411e-05, -3.644824028015137e-05, -3.211945295333862e-05, -2.779066562652588e-05, -2.3461878299713135e-05, -1.913309097290039e-05, -1.4804303646087646e-05, -1.0475516319274902e-05, -6.146728992462158e-06, -1.817941665649414e-06, 2.51084566116333e-06, 6.839632987976074e-06, 1.1168420314788818e-05, 1.5497207641601562e-05, 1.9825994968414307e-05, 2.415478229522705e-05, 2.8483569622039795e-05, 3.281235694885254e-05, 3.714114427566528e-05, 4.146993160247803e-05, 4.579871892929077e-05, 5.0127506256103516e-05, 5.445629358291626e-05, 5.8785080909729004e-05, 6.311386823654175e-05, 6.744265556335449e-05, 7.177144289016724e-05, 7.610023021697998e-05, 8.042901754379272e-05, 8.475780487060547e-05, 8.908659219741821e-05, 9.341537952423096e-05, 9.77441668510437e-05, 0.00010207295417785645, 0.00010640174150466919, 0.00011073052883148193, 0.00011505931615829468, 0.00011938810348510742, 0.00012371689081192017, 0.0001280456781387329, 0.00013237446546554565, 0.0001367032527923584, 0.00014103204011917114, 0.0001453608274459839, 0.00014968961477279663, 0.00015401840209960938]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 15.0, 34.0, 66.0, 174.0, 385.0, 1318.0, 12544.0, 747650.0, 279744.0, 5214.0, 843.0, 328.0, 120.0, 63.0, 17.0, 8.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0162200927734375, -0.015359640121459961, -0.014499187469482422, -0.013638734817504883, -0.012778282165527344, -0.011917829513549805, -0.011057376861572266, -0.010196924209594727, -0.009336471557617188, -0.008476018905639648, -0.007615566253662109, -0.00675511360168457, -0.005894660949707031, -0.005034208297729492, -0.004173755645751953, -0.003313302993774414, -0.002452850341796875, -0.001592397689819336, -0.0007319450378417969, 0.0001285076141357422, 0.0009889602661132812, 0.0018494129180908203, 0.0027098655700683594, 0.0035703182220458984, 0.0044307708740234375, 0.0052912235260009766, 0.006151676177978516, 0.007012128829956055, 0.007872581481933594, 0.008733034133911133, 0.009593486785888672, 0.010453939437866211, 0.01131439208984375, 0.012174844741821289, 0.013035297393798828, 0.013895750045776367, 0.014756202697753906, 0.015616655349731445, 0.016477108001708984, 0.017337560653686523, 0.018198013305664062, 0.0190584659576416, 0.01991891860961914, 0.02077937126159668, 0.02163982391357422, 0.022500276565551758, 0.023360729217529297, 0.024221181869506836, 0.025081634521484375, 0.025942087173461914, 0.026802539825439453, 0.027662992477416992, 0.02852344512939453, 0.02938389778137207, 0.03024435043334961, 0.03110480308532715, 0.03196525573730469, 0.03282570838928223, 0.033686161041259766, 0.034546613693237305, 0.035407066345214844, 0.03626751899719238, 0.03712797164916992, 0.03798842430114746, 0.038848876953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 19.0, 49.0, 74.0, 142.0, 193.0, 221.0, 161.0, 79.0, 28.0, 16.0, 14.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0161285400390625, -0.01517796516418457, -0.01422739028930664, -0.013276815414428711, -0.012326240539550781, -0.011375665664672852, -0.010425090789794922, -0.009474515914916992, -0.008523941040039062, -0.007573366165161133, -0.006622791290283203, -0.0056722164154052734, -0.004721641540527344, -0.003771066665649414, -0.0028204917907714844, -0.0018699169158935547, -0.000919342041015625, 3.123283386230469e-05, 0.0009818077087402344, 0.001932382583618164, 0.0028829574584960938, 0.0038335323333740234, 0.004784107208251953, 0.005734682083129883, 0.0066852569580078125, 0.007635831832885742, 0.008586406707763672, 0.009536981582641602, 0.010487556457519531, 0.011438131332397461, 0.01238870620727539, 0.01333928108215332, 0.01428985595703125, 0.01524043083190918, 0.01619100570678711, 0.01714158058166504, 0.01809215545654297, 0.0190427303314209, 0.019993305206298828, 0.020943880081176758, 0.021894454956054688, 0.022845029830932617, 0.023795604705810547, 0.024746179580688477, 0.025696754455566406, 0.026647329330444336, 0.027597904205322266, 0.028548479080200195, 0.029499053955078125, 0.030449628829956055, 0.031400203704833984, 0.032350778579711914, 0.033301353454589844, 0.03425192832946777, 0.0352025032043457, 0.03615307807922363, 0.03710365295410156, 0.03805422782897949, 0.03900480270385742, 0.03995537757873535, 0.04090595245361328, 0.04185652732849121, 0.04280710220336914, 0.04375767707824707, 0.044708251953125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 57.0, 179.0, 301.0, 238.0, 142.0, 46.0, 18.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17521151900291443, -0.16320161521434784, -0.15119171142578125, -0.13918179273605347, -0.12717190384864807, -0.11516199260950089, -0.1031520813703537, -0.09114217758178711, -0.07913227379322052, -0.06712237000465393, -0.05511246249079704, -0.043102554976940155, -0.031092651188373566, -0.019082747399806976, -0.00707283616065979, 0.004937067627906799, 0.01694697141647339, 0.028956877067685127, 0.040966782718896866, 0.052976690232753754, 0.06498659402132034, 0.07699649780988693, 0.08900640904903412, 0.10101631283760071, 0.1130262166261673, 0.1250361204147339, 0.13704602420330048, 0.14905592799186707, 0.16106584668159485, 0.17307573556900024, 0.18508565425872803, 0.19709555804729462, 0.20910543203353882, 0.2211153358221054, 0.233125239610672, 0.24513515830039978, 0.2571450471878052, 0.26915496587753296, 0.28116488456726074, 0.29317477345466614, 0.30518466234207153, 0.3171945810317993, 0.3292044699192047, 0.3412143886089325, 0.3532242774963379, 0.3652341961860657, 0.37724411487579346, 0.38925400376319885, 0.40126392245292664, 0.4132738411426544, 0.4252837300300598, 0.4372936487197876, 0.449303537607193, 0.4613134562969208, 0.47332334518432617, 0.48533326387405396, 0.49734318256378174, 0.5093531012535095, 0.5213630199432373, 0.5333728790283203, 0.5453827977180481, 0.5573927164077759, 0.5694026350975037, 0.5814125537872314, 0.5934224128723145]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 1.0, 3.0, 5.0, 8.0, 14.0, 15.0, 14.0, 14.0, 14.0, 27.0, 22.0, 22.0, 34.0, 37.0, 33.0, 41.0, 40.0, 41.0, 42.0, 44.0, 50.0, 42.0, 44.0, 54.0, 36.0, 34.0, 30.0, 27.0, 34.0, 23.0, 21.0, 23.0, 20.0, 22.0, 12.0, 17.0, 9.0, 2.0, 6.0, 4.0, 3.0, 2.0, 8.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15338724851608276, -0.14796870946884155, -0.14255017042160034, -0.13713164627552032, -0.1317131072282791, -0.1262945681810379, -0.12087603658437729, -0.11545750498771667, -0.11003896594047546, -0.10462042689323425, -0.09920189529657364, -0.09378336369991302, -0.08836482465267181, -0.0829462856054306, -0.07752775400876999, -0.07210922241210938, -0.06669068336486816, -0.06127214804291725, -0.05585361272096634, -0.05043507739901543, -0.045016542077064514, -0.0395980067551136, -0.03417947143316269, -0.028760936111211777, -0.023342400789260864, -0.017923865467309952, -0.01250533014535904, -0.007086794823408127, -0.0016682595014572144, 0.003750275820493698, 0.00916881114244461, 0.014587346464395523, 0.020005881786346436, 0.025424417108297348, 0.03084295243024826, 0.03626148775219917, 0.041680023074150085, 0.047098558396101, 0.05251709371805191, 0.05793562904000282, 0.06335416436195374, 0.06877270340919495, 0.07419123500585556, 0.07960976660251617, 0.08502830564975739, 0.0904468446969986, 0.09586537629365921, 0.10128390789031982, 0.10670244693756104, 0.11212098598480225, 0.11753951758146286, 0.12295804917812347, 0.12837658822536469, 0.1337951272726059, 0.1392136514186859, 0.14463219046592712, 0.15005072951316833, 0.15546926856040955, 0.16088780760765076, 0.16630633175373077, 0.17172487080097198, 0.1771434098482132, 0.1825619339942932, 0.18798047304153442, 0.19339901208877563]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 9.0, 14.0, 23.0, 23.0, 25.0, 32.0, 55.0, 83.0, 134.0, 237.0, 378.0, 694.0, 1330.0, 2911.0, 7288.0, 24710.0, 253671.0, 3828491.0, 52988.0, 12237.0, 4332.0, 1963.0, 997.0, 573.0, 358.0, 213.0, 150.0, 104.0, 69.0, 57.0, 33.0, 26.0, 14.0, 15.0, 11.0, 7.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044464111328125, -0.04308462142944336, -0.04170513153076172, -0.04032564163208008, -0.03894615173339844, -0.0375666618347168, -0.036187171936035156, -0.034807682037353516, -0.033428192138671875, -0.032048702239990234, -0.030669212341308594, -0.029289722442626953, -0.027910232543945312, -0.026530742645263672, -0.02515125274658203, -0.02377176284790039, -0.02239227294921875, -0.02101278305053711, -0.01963329315185547, -0.018253803253173828, -0.016874313354492188, -0.015494823455810547, -0.014115333557128906, -0.012735843658447266, -0.011356353759765625, -0.009976863861083984, -0.008597373962402344, -0.007217884063720703, -0.0058383941650390625, -0.004458904266357422, -0.0030794143676757812, -0.0016999244689941406, -0.0003204345703125, 0.0010590553283691406, 0.0024385452270507812, 0.003818035125732422, 0.0051975250244140625, 0.006577014923095703, 0.007956504821777344, 0.009335994720458984, 0.010715484619140625, 0.012094974517822266, 0.013474464416503906, 0.014853954315185547, 0.016233444213867188, 0.017612934112548828, 0.01899242401123047, 0.02037191390991211, 0.02175140380859375, 0.02313089370727539, 0.02451038360595703, 0.025889873504638672, 0.027269363403320312, 0.028648853302001953, 0.030028343200683594, 0.031407833099365234, 0.032787322998046875, 0.034166812896728516, 0.035546302795410156, 0.0369257926940918, 0.03830528259277344, 0.03968477249145508, 0.04106426239013672, 0.04244375228881836, 0.0438232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 12.0, 10.0, 23.0, 28.0, 49.0, 46.0, 70.0, 65.0, 76.0, 87.0, 102.0, 88.0, 72.0, 74.0, 58.0, 37.0, 23.0, 19.0, 11.0, 14.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203399658203125, -0.019743680953979492, -0.019147396087646484, -0.018551111221313477, -0.01795482635498047, -0.01735854148864746, -0.016762256622314453, -0.016165971755981445, -0.015569686889648438, -0.01497340202331543, -0.014377117156982422, -0.013780832290649414, -0.013184547424316406, -0.012588262557983398, -0.01199197769165039, -0.011395692825317383, -0.010799407958984375, -0.010203123092651367, -0.00960683822631836, -0.009010553359985352, -0.008414268493652344, -0.007817983627319336, -0.007221698760986328, -0.00662541389465332, -0.0060291290283203125, -0.005432844161987305, -0.004836559295654297, -0.004240274429321289, -0.0036439895629882812, -0.0030477046966552734, -0.0024514198303222656, -0.0018551349639892578, -0.00125885009765625, -0.0006625652313232422, -6.628036499023438e-05, 0.0005300045013427734, 0.0011262893676757812, 0.001722574234008789, 0.002318859100341797, 0.0029151439666748047, 0.0035114288330078125, 0.00410771369934082, 0.004703998565673828, 0.005300283432006836, 0.005896568298339844, 0.0064928531646728516, 0.007089138031005859, 0.007685422897338867, 0.008281707763671875, 0.008877992630004883, 0.00947427749633789, 0.010070562362670898, 0.010666847229003906, 0.011263132095336914, 0.011859416961669922, 0.01245570182800293, 0.013051986694335938, 0.013648271560668945, 0.014244556427001953, 0.014840841293334961, 0.015437126159667969, 0.016033411026000977, 0.016629695892333984, 0.017225980758666992, 0.017822265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 5.0, 12.0, 25.0, 42.0, 62.0, 108.0, 198.0, 389.0, 789.0, 2125.0, 8153.0, 68797.0, 4033029.0, 68810.0, 8025.0, 2091.0, 806.0, 394.0, 187.0, 91.0, 68.0, 29.0, 14.0, 12.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048828125, -0.04727792739868164, -0.04572772979736328, -0.04417753219604492, -0.04262733459472656, -0.0410771369934082, -0.039526939392089844, -0.037976741790771484, -0.036426544189453125, -0.034876346588134766, -0.033326148986816406, -0.03177595138549805, -0.030225753784179688, -0.028675556182861328, -0.02712535858154297, -0.02557516098022461, -0.02402496337890625, -0.02247476577758789, -0.02092456817626953, -0.019374370574951172, -0.017824172973632812, -0.016273975372314453, -0.014723777770996094, -0.013173580169677734, -0.011623382568359375, -0.010073184967041016, -0.008522987365722656, -0.006972789764404297, -0.0054225921630859375, -0.003872394561767578, -0.0023221969604492188, -0.0007719993591308594, 0.0007781982421875, 0.0023283958435058594, 0.0038785934448242188, 0.005428791046142578, 0.0069789886474609375, 0.008529186248779297, 0.010079383850097656, 0.011629581451416016, 0.013179779052734375, 0.014729976654052734, 0.016280174255371094, 0.017830371856689453, 0.019380569458007812, 0.020930767059326172, 0.02248096466064453, 0.02403116226196289, 0.02558135986328125, 0.02713155746459961, 0.02868175506591797, 0.030231952667236328, 0.03178215026855469, 0.03333234786987305, 0.034882545471191406, 0.036432743072509766, 0.037982940673828125, 0.039533138275146484, 0.041083335876464844, 0.0426335334777832, 0.04418373107910156, 0.04573392868041992, 0.04728412628173828, 0.04883432388305664, 0.050384521484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 10.0, 17.0, 40.0, 39.0, 152.0, 2322.0, 1246.0, 126.0, 48.0, 25.0, 13.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019561767578125, -0.018626689910888672, -0.017691612243652344, -0.016756534576416016, -0.015821456909179688, -0.01488637924194336, -0.013951301574707031, -0.013016223907470703, -0.012081146240234375, -0.011146068572998047, -0.010210990905761719, -0.00927591323852539, -0.008340835571289062, -0.007405757904052734, -0.006470680236816406, -0.005535602569580078, -0.00460052490234375, -0.003665447235107422, -0.0027303695678710938, -0.0017952919006347656, -0.0008602142333984375, 7.486343383789062e-05, 0.0010099411010742188, 0.0019450187683105469, 0.002880096435546875, 0.003815174102783203, 0.004750251770019531, 0.005685329437255859, 0.0066204071044921875, 0.007555484771728516, 0.008490562438964844, 0.009425640106201172, 0.0103607177734375, 0.011295795440673828, 0.012230873107910156, 0.013165950775146484, 0.014101028442382812, 0.01503610610961914, 0.01597118377685547, 0.016906261444091797, 0.017841339111328125, 0.018776416778564453, 0.01971149444580078, 0.02064657211303711, 0.021581649780273438, 0.022516727447509766, 0.023451805114746094, 0.024386882781982422, 0.02532196044921875, 0.026257038116455078, 0.027192115783691406, 0.028127193450927734, 0.029062271118164062, 0.02999734878540039, 0.03093242645263672, 0.03186750411987305, 0.032802581787109375, 0.0337376594543457, 0.03467273712158203, 0.03560781478881836, 0.03654289245605469, 0.037477970123291016, 0.038413047790527344, 0.03934812545776367, 0.040283203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 49.0, 731.0, 196.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08888839185237885, -0.07727264612913132, -0.06565690040588379, -0.05404115468263626, -0.04242540895938873, -0.030809663236141205, -0.019193917512893677, -0.007578171789646149, 0.004037573933601379, 0.015653319656848907, 0.027269065380096436, 0.038884811103343964, 0.05050055682659149, 0.06211630254983902, 0.07373204827308655, 0.08534779399633408, 0.0969635397195816, 0.10857928544282913, 0.12019503116607666, 0.13181078433990479, 0.14342652261257172, 0.15504226088523865, 0.16665801405906677, 0.1782737672328949, 0.18988950550556183, 0.20150524377822876, 0.21312099695205688, 0.224736750125885, 0.23635248839855194, 0.24796822667121887, 0.259583979845047, 0.2711997330188751, 0.28281545639038086, 0.294431209564209, 0.3060469627380371, 0.31766268610954285, 0.32927843928337097, 0.3408941924571991, 0.35250991582870483, 0.36412566900253296, 0.3757414221763611, 0.3873571753501892, 0.39897292852401733, 0.41058865189552307, 0.4222044050693512, 0.4338201582431793, 0.44543588161468506, 0.4570516347885132, 0.4686673879623413, 0.48028314113616943, 0.49189889430999756, 0.5035146474838257, 0.5151304006576538, 0.5267460942268372, 0.5383618474006653, 0.5499776005744934, 0.5615933537483215, 0.5732091069221497, 0.5848248600959778, 0.5964406132698059, 0.6080563068389893, 0.6196720600128174, 0.6312878131866455, 0.6429035663604736, 0.6545193195343018]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 14.0, 11.0, 26.0, 32.0, 31.0, 61.0, 63.0, 64.0, 84.0, 96.0, 86.0, 73.0, 81.0, 75.0, 49.0, 45.0, 28.0, 18.0, 19.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07468616962432861, -0.0723508894443512, -0.07001560926437378, -0.06768032908439636, -0.06534504890441895, -0.06300976127386093, -0.060674481093883514, -0.0583392009139061, -0.05600392073392868, -0.05366864055395126, -0.051333360373973846, -0.04899807646870613, -0.046662796288728714, -0.0443275161087513, -0.04199223220348358, -0.039656952023506165, -0.03732167184352875, -0.03498639166355133, -0.032651111483573914, -0.030315827578306198, -0.02798054739832878, -0.025645267218351364, -0.023309985175728798, -0.02097470313310623, -0.018639422953128815, -0.016304142773151398, -0.013968860730528831, -0.01163357961922884, -0.009298298507928848, -0.006963017396628857, -0.004627736285328865, -0.002292454242706299, 4.2825937271118164e-05, 0.0023781070485711098, 0.004713388159871101, 0.007048669271171093, 0.009383950382471085, 0.011719231493771076, 0.014054512605071068, 0.016389794647693634, 0.01872507482767105, 0.021060355007648468, 0.023395637050271034, 0.0257309190928936, 0.028066199272871017, 0.030401479452848434, 0.03273676335811615, 0.03507204353809357, 0.037407323718070984, 0.0397426038980484, 0.04207788407802582, 0.04441316798329353, 0.04674844816327095, 0.04908372834324837, 0.05141901224851608, 0.0537542924284935, 0.05608957260847092, 0.058424852788448334, 0.06076013296842575, 0.06309541314840317, 0.06543070077896118, 0.0677659809589386, 0.07010126113891602, 0.07243654131889343, 0.07477182149887085]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 17.0, 25.0, 44.0, 74.0, 132.0, 253.0, 611.0, 1910.0, 8288.0, 83529.0, 743592.0, 190995.0, 14809.0, 2800.0, 809.0, 325.0, 135.0, 77.0, 35.0, 25.0, 14.0, 11.0, 5.0, 3.0, 4.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05474853515625, -0.053212642669677734, -0.05167675018310547, -0.0501408576965332, -0.04860496520996094, -0.04706907272338867, -0.045533180236816406, -0.04399728775024414, -0.042461395263671875, -0.04092550277709961, -0.039389610290527344, -0.03785371780395508, -0.03631782531738281, -0.03478193283081055, -0.03324604034423828, -0.031710147857666016, -0.03017425537109375, -0.028638362884521484, -0.02710247039794922, -0.025566577911376953, -0.024030685424804688, -0.022494792938232422, -0.020958900451660156, -0.01942300796508789, -0.017887115478515625, -0.01635122299194336, -0.014815330505371094, -0.013279438018798828, -0.011743545532226562, -0.010207653045654297, -0.008671760559082031, -0.007135868072509766, -0.0055999755859375, -0.004064083099365234, -0.0025281906127929688, -0.0009922981262207031, 0.0005435943603515625, 0.002079486846923828, 0.0036153793334960938, 0.005151271820068359, 0.006687164306640625, 0.00822305679321289, 0.009758949279785156, 0.011294841766357422, 0.012830734252929688, 0.014366626739501953, 0.01590251922607422, 0.017438411712646484, 0.01897430419921875, 0.020510196685791016, 0.02204608917236328, 0.023581981658935547, 0.025117874145507812, 0.026653766632080078, 0.028189659118652344, 0.02972555160522461, 0.031261444091796875, 0.03279733657836914, 0.034333229064941406, 0.03586912155151367, 0.03740501403808594, 0.0389409065246582, 0.04047679901123047, 0.042012691497802734, 0.043548583984375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 12.0, 13.0, 14.0, 29.0, 41.0, 43.0, 55.0, 82.0, 70.0, 76.0, 104.0, 85.0, 73.0, 69.0, 61.0, 53.0, 40.0, 21.0, 14.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205535888671875, -0.019941091537475586, -0.019328594207763672, -0.018716096878051758, -0.018103599548339844, -0.01749110221862793, -0.016878604888916016, -0.0162661075592041, -0.015653610229492188, -0.015041112899780273, -0.01442861557006836, -0.013816118240356445, -0.013203620910644531, -0.012591123580932617, -0.011978626251220703, -0.011366128921508789, -0.010753631591796875, -0.010141134262084961, -0.009528636932373047, -0.008916139602661133, -0.008303642272949219, -0.007691144943237305, -0.007078647613525391, -0.0064661502838134766, -0.0058536529541015625, -0.0052411556243896484, -0.004628658294677734, -0.00401616096496582, -0.0034036636352539062, -0.002791166305541992, -0.002178668975830078, -0.001566171646118164, -0.00095367431640625, -0.00034117698669433594, 0.0002713203430175781, 0.0008838176727294922, 0.0014963150024414062, 0.0021088123321533203, 0.0027213096618652344, 0.0033338069915771484, 0.0039463043212890625, 0.0045588016510009766, 0.005171298980712891, 0.005783796310424805, 0.006396293640136719, 0.007008790969848633, 0.007621288299560547, 0.008233785629272461, 0.008846282958984375, 0.009458780288696289, 0.010071277618408203, 0.010683774948120117, 0.011296272277832031, 0.011908769607543945, 0.01252126693725586, 0.013133764266967773, 0.013746261596679688, 0.014358758926391602, 0.014971256256103516, 0.01558375358581543, 0.016196250915527344, 0.016808748245239258, 0.017421245574951172, 0.018033742904663086, 0.018646240234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 7.0, 3.0, 4.0, 9.0, 9.0, 11.0, 20.0, 24.0, 46.0, 58.0, 79.0, 110.0, 160.0, 236.0, 387.0, 739.0, 1846.0, 8723.0, 85938.0, 781398.0, 151308.0, 12966.0, 2407.0, 834.0, 375.0, 274.0, 197.0, 120.0, 71.0, 56.0, 43.0, 33.0, 21.0, 10.0, 10.0, 8.0, 10.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.03493022918701172, -0.03378868103027344, -0.032647132873535156, -0.031505584716796875, -0.030364036560058594, -0.029222488403320312, -0.02808094024658203, -0.02693939208984375, -0.02579784393310547, -0.024656295776367188, -0.023514747619628906, -0.022373199462890625, -0.021231651306152344, -0.020090103149414062, -0.01894855499267578, -0.0178070068359375, -0.01666545867919922, -0.015523910522460938, -0.014382362365722656, -0.013240814208984375, -0.012099266052246094, -0.010957717895507812, -0.009816169738769531, -0.00867462158203125, -0.007533073425292969, -0.0063915252685546875, -0.005249977111816406, -0.004108428955078125, -0.0029668807983398438, -0.0018253326416015625, -0.0006837844848632812, 0.000457763671875, 0.0015993118286132812, 0.0027408599853515625, 0.0038824081420898438, 0.005023956298828125, 0.006165504455566406, 0.0073070526123046875, 0.008448600769042969, 0.00959014892578125, 0.010731697082519531, 0.011873245239257812, 0.013014793395996094, 0.014156341552734375, 0.015297889709472656, 0.016439437866210938, 0.01758098602294922, 0.0187225341796875, 0.01986408233642578, 0.021005630493164062, 0.022147178649902344, 0.023288726806640625, 0.024430274963378906, 0.025571823120117188, 0.02671337127685547, 0.02785491943359375, 0.02899646759033203, 0.030138015747070312, 0.031279563903808594, 0.032421112060546875, 0.033562660217285156, 0.03470420837402344, 0.03584575653076172, 0.0369873046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 14.0, 9.0, 14.0, 16.0, 24.0, 27.0, 21.0, 35.0, 36.0, 37.0, 47.0, 40.0, 49.0, 42.0, 58.0, 51.0, 52.0, 48.0, 39.0, 52.0, 25.0, 38.0, 40.0, 31.0, 23.0, 21.0, 19.0, 11.0, 9.0, 8.0, 10.0, 4.0, 2.0, 10.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04486083984375, -0.04352569580078125, -0.0421905517578125, -0.04085540771484375, -0.039520263671875, -0.03818511962890625, -0.0368499755859375, -0.03551483154296875, -0.0341796875, -0.03284454345703125, -0.0315093994140625, -0.03017425537109375, -0.028839111328125, -0.02750396728515625, -0.0261688232421875, -0.02483367919921875, -0.02349853515625, -0.02216339111328125, -0.0208282470703125, -0.01949310302734375, -0.018157958984375, -0.01682281494140625, -0.0154876708984375, -0.01415252685546875, -0.0128173828125, -0.01148223876953125, -0.0101470947265625, -0.00881195068359375, -0.007476806640625, -0.00614166259765625, -0.0048065185546875, -0.00347137451171875, -0.00213623046875, -0.00080108642578125, 0.0005340576171875, 0.00186920166015625, 0.003204345703125, 0.00453948974609375, 0.0058746337890625, 0.00720977783203125, 0.008544921875, 0.00988006591796875, 0.0112152099609375, 0.01255035400390625, 0.013885498046875, 0.01522064208984375, 0.0165557861328125, 0.01789093017578125, 0.01922607421875, 0.02056121826171875, 0.0218963623046875, 0.02323150634765625, 0.024566650390625, 0.02590179443359375, 0.0272369384765625, 0.02857208251953125, 0.0299072265625, 0.03124237060546875, 0.0325775146484375, 0.03391265869140625, 0.035247802734375, 0.03658294677734375, 0.0379180908203125, 0.03925323486328125, 0.04058837890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 14.0, 18.0, 29.0, 70.0, 125.0, 248.0, 505.0, 1204.0, 3420.0, 13673.0, 89159.0, 744466.0, 168023.0, 20061.0, 4730.0, 1557.0, 618.0, 281.0, 158.0, 74.0, 40.0, 28.0, 13.0, 10.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01313018798828125, -0.012714982032775879, -0.012299776077270508, -0.011884570121765137, -0.011469364166259766, -0.011054158210754395, -0.010638952255249023, -0.010223746299743652, -0.009808540344238281, -0.00939333438873291, -0.008978128433227539, -0.008562922477722168, -0.008147716522216797, -0.007732510566711426, -0.007317304611206055, -0.006902098655700684, -0.0064868927001953125, -0.006071686744689941, -0.00565648078918457, -0.005241274833679199, -0.004826068878173828, -0.004410862922668457, -0.003995656967163086, -0.003580451011657715, -0.0031652450561523438, -0.0027500391006469727, -0.0023348331451416016, -0.0019196271896362305, -0.0015044212341308594, -0.0010892152786254883, -0.0006740093231201172, -0.0002588033676147461, 0.000156402587890625, 0.0005716085433959961, 0.0009868144989013672, 0.0014020204544067383, 0.0018172264099121094, 0.0022324323654174805, 0.0026476383209228516, 0.0030628442764282227, 0.0034780502319335938, 0.003893256187438965, 0.004308462142944336, 0.004723668098449707, 0.005138874053955078, 0.005554080009460449, 0.00596928596496582, 0.006384491920471191, 0.0067996978759765625, 0.007214903831481934, 0.007630109786987305, 0.008045315742492676, 0.008460521697998047, 0.008875727653503418, 0.009290933609008789, 0.00970613956451416, 0.010121345520019531, 0.010536551475524902, 0.010951757431030273, 0.011366963386535645, 0.011782169342041016, 0.012197375297546387, 0.012612581253051758, 0.013027787208557129, 0.0134429931640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 11.0, 12.0, 26.0, 24.0, 70.0, 105.0, 136.0, 157.0, 163.0, 118.0, 61.0, 39.0, 30.0, 18.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.890296936035156e-05, -6.598234176635742e-05, -6.306171417236328e-05, -6.014108657836914e-05, -5.7220458984375e-05, -5.429983139038086e-05, -5.137920379638672e-05, -4.845857620239258e-05, -4.553794860839844e-05, -4.26173210144043e-05, -3.9696693420410156e-05, -3.6776065826416016e-05, -3.3855438232421875e-05, -3.0934810638427734e-05, -2.8014183044433594e-05, -2.5093555450439453e-05, -2.2172927856445312e-05, -1.9252300262451172e-05, -1.633167266845703e-05, -1.341104507446289e-05, -1.049041748046875e-05, -7.569789886474609e-06, -4.649162292480469e-06, -1.7285346984863281e-06, 1.1920928955078125e-06, 4.112720489501953e-06, 7.033348083496094e-06, 9.953975677490234e-06, 1.2874603271484375e-05, 1.5795230865478516e-05, 1.8715858459472656e-05, 2.1636486053466797e-05, 2.4557113647460938e-05, 2.7477741241455078e-05, 3.039836883544922e-05, 3.331899642944336e-05, 3.62396240234375e-05, 3.916025161743164e-05, 4.208087921142578e-05, 4.500150680541992e-05, 4.792213439941406e-05, 5.08427619934082e-05, 5.3763389587402344e-05, 5.6684017181396484e-05, 5.9604644775390625e-05, 6.252527236938477e-05, 6.54458999633789e-05, 6.836652755737305e-05, 7.128715515136719e-05, 7.420778274536133e-05, 7.712841033935547e-05, 8.004903793334961e-05, 8.296966552734375e-05, 8.589029312133789e-05, 8.881092071533203e-05, 9.173154830932617e-05, 9.465217590332031e-05, 9.757280349731445e-05, 0.0001004934310913086, 0.00010341405868530273, 0.00010633468627929688, 0.00010925531387329102, 0.00011217594146728516, 0.0001150965690612793]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 2.0, 6.0, 14.0, 15.0, 17.0, 37.0, 47.0, 71.0, 120.0, 169.0, 284.0, 487.0, 1025.0, 1938.0, 5067.0, 14481.0, 57215.0, 306557.0, 514346.0, 108699.0, 24721.0, 7619.0, 2759.0, 1265.0, 645.0, 358.0, 203.0, 134.0, 81.0, 55.0, 35.0, 21.0, 13.0, 11.0, 12.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00905609130859375, -0.008791327476501465, -0.00852656364440918, -0.008261799812316895, -0.00799703598022461, -0.007732272148132324, -0.007467508316040039, -0.007202744483947754, -0.006937980651855469, -0.006673216819763184, -0.0064084529876708984, -0.006143689155578613, -0.005878925323486328, -0.005614161491394043, -0.005349397659301758, -0.005084633827209473, -0.0048198699951171875, -0.004555106163024902, -0.004290342330932617, -0.004025578498840332, -0.003760814666748047, -0.0034960508346557617, -0.0032312870025634766, -0.0029665231704711914, -0.0027017593383789062, -0.002436995506286621, -0.002172231674194336, -0.0019074678421020508, -0.0016427040100097656, -0.0013779401779174805, -0.0011131763458251953, -0.0008484125137329102, -0.000583648681640625, -0.00031888484954833984, -5.412101745605469e-05, 0.00021064281463623047, 0.0004754066467285156, 0.0007401704788208008, 0.001004934310913086, 0.001269698143005371, 0.0015344619750976562, 0.0017992258071899414, 0.0020639896392822266, 0.0023287534713745117, 0.002593517303466797, 0.002858281135559082, 0.003123044967651367, 0.0033878087997436523, 0.0036525726318359375, 0.003917336463928223, 0.004182100296020508, 0.004446864128112793, 0.004711627960205078, 0.004976391792297363, 0.0052411556243896484, 0.005505919456481934, 0.005770683288574219, 0.006035447120666504, 0.006300210952758789, 0.006564974784851074, 0.006829738616943359, 0.0070945024490356445, 0.00735926628112793, 0.007624030113220215, 0.0078887939453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 10.0, 10.0, 21.0, 26.0, 59.0, 75.0, 82.0, 98.0, 106.0, 121.0, 89.0, 93.0, 67.0, 39.0, 29.0, 24.0, 10.0, 11.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016387939453125, -0.015978693962097168, -0.015569448471069336, -0.015160202980041504, -0.014750957489013672, -0.01434171199798584, -0.013932466506958008, -0.013523221015930176, -0.013113975524902344, -0.012704730033874512, -0.01229548454284668, -0.011886239051818848, -0.011476993560791016, -0.011067748069763184, -0.010658502578735352, -0.01024925708770752, -0.009840011596679688, -0.009430766105651855, -0.009021520614624023, -0.008612275123596191, -0.00820302963256836, -0.007793784141540527, -0.007384538650512695, -0.006975293159484863, -0.006566047668457031, -0.006156802177429199, -0.005747556686401367, -0.005338311195373535, -0.004929065704345703, -0.004519820213317871, -0.004110574722290039, -0.003701329231262207, -0.003292083740234375, -0.002882838249206543, -0.002473592758178711, -0.002064347267150879, -0.0016551017761230469, -0.0012458562850952148, -0.0008366107940673828, -0.0004273653030395508, -1.811981201171875e-05, 0.0003911256790161133, 0.0008003711700439453, 0.0012096166610717773, 0.0016188621520996094, 0.0020281076431274414, 0.0024373531341552734, 0.0028465986251831055, 0.0032558441162109375, 0.0036650896072387695, 0.0040743350982666016, 0.004483580589294434, 0.004892826080322266, 0.005302071571350098, 0.00571131706237793, 0.006120562553405762, 0.006529808044433594, 0.006939053535461426, 0.007348299026489258, 0.00775754451751709, 0.008166790008544922, 0.008576035499572754, 0.008985280990600586, 0.009394526481628418, 0.00980377197265625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 13.0, 42.0, 153.0, 286.0, 297.0, 144.0, 43.0, 18.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31041884422302246, -0.2979366183280945, -0.2854543924331665, -0.2729721665382385, -0.26048994064331055, -0.24800771474838257, -0.2355254888534546, -0.2230432629585266, -0.21056103706359863, -0.19807881116867065, -0.18559658527374268, -0.1731143593788147, -0.16063213348388672, -0.14814990758895874, -0.13566768169403076, -0.12318544834852219, -0.11070321500301361, -0.09822098910808563, -0.08573876321315765, -0.07325653731822968, -0.0607743076980114, -0.04829208180308342, -0.03580985218286514, -0.023327626287937164, -0.010845400393009186, 0.0016368264332413673, 0.01411905325949192, 0.026601281017065048, 0.03908350691199303, 0.051565732806921005, 0.06404796242713928, 0.07653018832206726, 0.08901241421699524, 0.10149464011192322, 0.1139768660068512, 0.12645909190177917, 0.13894131779670715, 0.15142354369163513, 0.1639057695865631, 0.1763879954814911, 0.18887022137641907, 0.20135244727134705, 0.21383467316627502, 0.226316899061203, 0.23879912495613098, 0.25128135085105896, 0.26376357674598694, 0.2762458026409149, 0.2887280583381653, 0.30121028423309326, 0.31369251012802124, 0.3261747360229492, 0.3386569619178772, 0.3511391878128052, 0.36362141370773315, 0.37610363960266113, 0.3885858654975891, 0.4010680913925171, 0.41355031728744507, 0.42603254318237305, 0.438514769077301, 0.450996994972229, 0.463479220867157, 0.47596144676208496, 0.48844367265701294]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 8.0, 11.0, 13.0, 12.0, 15.0, 19.0, 20.0, 18.0, 22.0, 17.0, 25.0, 28.0, 29.0, 25.0, 20.0, 44.0, 41.0, 32.0, 43.0, 36.0, 40.0, 42.0, 39.0, 36.0, 46.0, 43.0, 33.0, 30.0, 19.0, 19.0, 22.0, 19.0, 21.0, 15.0, 11.0, 13.0, 14.0, 7.0, 9.0, 9.0, 6.0, 6.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.17645269632339478, -0.1709679812192917, -0.1654832810163498, -0.1599985659122467, -0.1545138657093048, -0.14902915060520172, -0.14354443550109863, -0.13805973529815674, -0.13257502019405365, -0.12709030508995056, -0.12160560488700867, -0.11612088978290558, -0.11063618212938309, -0.1051514744758606, -0.09966675937175751, -0.09418205171823502, -0.08869734406471252, -0.08321263641119003, -0.07772792875766754, -0.07224321365356445, -0.06675850600004196, -0.06127379834651947, -0.05578908696770668, -0.05030437558889389, -0.0448196679353714, -0.03933496028184891, -0.03385024890303612, -0.028365539386868477, -0.022880829870700836, -0.017396120354533195, -0.011911410838365555, -0.006426699459552765, -0.0009419918060302734, 0.004542717710137367, 0.010027427226305008, 0.015512136742472649, 0.02099684625864029, 0.02648155577480793, 0.03196626529097557, 0.03745097666978836, 0.04293568432331085, 0.048420391976833344, 0.05390510335564613, 0.05938981473445892, 0.06487452238798141, 0.0703592300415039, 0.075843945145607, 0.08132865279912949, 0.08681336045265198, 0.09229806810617447, 0.09778277575969696, 0.10326749086380005, 0.10875219851732254, 0.11423690617084503, 0.11972162127494812, 0.12520632147789001, 0.1306910365819931, 0.1361757516860962, 0.14166045188903809, 0.14714516699314117, 0.15262988209724426, 0.15811458230018616, 0.16359929740428925, 0.16908401250839233, 0.17456871271133423]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 3.0, 13.0, 18.0, 31.0, 39.0, 78.0, 148.0, 302.0, 567.0, 1443.0, 5075.0, 60219.0, 4101364.0, 19740.0, 3174.0, 1030.0, 417.0, 221.0, 125.0, 90.0, 39.0, 31.0, 15.0, 19.0, 8.0, 10.0, 5.0, 5.0, 7.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04119873046875, -0.0397944450378418, -0.038390159606933594, -0.03698587417602539, -0.03558158874511719, -0.034177303314208984, -0.03277301788330078, -0.03136873245239258, -0.029964447021484375, -0.028560161590576172, -0.02715587615966797, -0.025751590728759766, -0.024347305297851562, -0.02294301986694336, -0.021538734436035156, -0.020134449005126953, -0.01873016357421875, -0.017325878143310547, -0.015921592712402344, -0.01451730728149414, -0.013113021850585938, -0.011708736419677734, -0.010304450988769531, -0.008900165557861328, -0.007495880126953125, -0.006091594696044922, -0.004687309265136719, -0.0032830238342285156, -0.0018787384033203125, -0.0004744529724121094, 0.0009298324584960938, 0.002334117889404297, 0.0037384033203125, 0.005142688751220703, 0.006546974182128906, 0.00795125961303711, 0.009355545043945312, 0.010759830474853516, 0.012164115905761719, 0.013568401336669922, 0.014972686767578125, 0.016376972198486328, 0.01778125762939453, 0.019185543060302734, 0.020589828491210938, 0.02199411392211914, 0.023398399353027344, 0.024802684783935547, 0.02620697021484375, 0.027611255645751953, 0.029015541076660156, 0.03041982650756836, 0.03182411193847656, 0.033228397369384766, 0.03463268280029297, 0.03603696823120117, 0.037441253662109375, 0.03884553909301758, 0.04024982452392578, 0.041654109954833984, 0.04305839538574219, 0.04446268081665039, 0.045866966247558594, 0.0472712516784668, 0.048675537109375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 8.0, 7.0, 11.0, 19.0, 26.0, 35.0, 60.0, 59.0, 71.0, 87.0, 74.0, 89.0, 86.0, 72.0, 72.0, 54.0, 44.0, 30.0, 31.0, 15.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021148681640625, -0.02051544189453125, -0.0198822021484375, -0.01924896240234375, -0.01861572265625, -0.01798248291015625, -0.0173492431640625, -0.01671600341796875, -0.016082763671875, -0.01544952392578125, -0.0148162841796875, -0.01418304443359375, -0.0135498046875, -0.01291656494140625, -0.0122833251953125, -0.01165008544921875, -0.011016845703125, -0.01038360595703125, -0.0097503662109375, -0.00911712646484375, -0.00848388671875, -0.00785064697265625, -0.0072174072265625, -0.00658416748046875, -0.005950927734375, -0.00531768798828125, -0.0046844482421875, -0.00405120849609375, -0.00341796875, -0.00278472900390625, -0.0021514892578125, -0.00151824951171875, -0.000885009765625, -0.00025177001953125, 0.0003814697265625, 0.00101470947265625, 0.00164794921875, 0.00228118896484375, 0.0029144287109375, 0.00354766845703125, 0.004180908203125, 0.00481414794921875, 0.0054473876953125, 0.00608062744140625, 0.0067138671875, 0.00734710693359375, 0.0079803466796875, 0.00861358642578125, 0.009246826171875, 0.00988006591796875, 0.0105133056640625, 0.01114654541015625, 0.01177978515625, 0.01241302490234375, 0.0130462646484375, 0.01367950439453125, 0.014312744140625, 0.01494598388671875, 0.0155792236328125, 0.01621246337890625, 0.016845703125, 0.01747894287109375, 0.0181121826171875, 0.01874542236328125, 0.019378662109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 4.0, 7.0, 14.0, 19.0, 32.0, 31.0, 46.0, 70.0, 93.0, 125.0, 187.0, 282.0, 443.0, 740.0, 1387.0, 2849.0, 6785.0, 22561.0, 384559.0, 3726938.0, 31604.0, 8230.0, 3357.0, 1548.0, 860.0, 475.0, 307.0, 181.0, 146.0, 111.0, 71.0, 54.0, 44.0, 23.0, 30.0, 12.0, 9.0, 14.0, 7.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0162811279296875, -0.01575756072998047, -0.015233993530273438, -0.014710426330566406, -0.014186859130859375, -0.013663291931152344, -0.013139724731445312, -0.012616157531738281, -0.01209259033203125, -0.011569023132324219, -0.011045455932617188, -0.010521888732910156, -0.009998321533203125, -0.009474754333496094, -0.008951187133789062, -0.008427619934082031, -0.007904052734375, -0.007380485534667969, -0.0068569183349609375, -0.006333351135253906, -0.005809783935546875, -0.005286216735839844, -0.0047626495361328125, -0.004239082336425781, -0.00371551513671875, -0.0031919479370117188, -0.0026683807373046875, -0.0021448135375976562, -0.001621246337890625, -0.0010976791381835938, -0.0005741119384765625, -5.054473876953125e-05, 0.0004730224609375, 0.0009965896606445312, 0.0015201568603515625, 0.0020437240600585938, 0.002567291259765625, 0.0030908584594726562, 0.0036144256591796875, 0.004137992858886719, 0.00466156005859375, 0.005185127258300781, 0.0057086944580078125, 0.006232261657714844, 0.006755828857421875, 0.007279396057128906, 0.0078029632568359375, 0.008326530456542969, 0.00885009765625, 0.009373664855957031, 0.009897232055664062, 0.010420799255371094, 0.010944366455078125, 0.011467933654785156, 0.011991500854492188, 0.012515068054199219, 0.01303863525390625, 0.013562202453613281, 0.014085769653320312, 0.014609336853027344, 0.015132904052734375, 0.015656471252441406, 0.016180038452148438, 0.01670360565185547, 0.0172271728515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 6.0, 5.0, 8.0, 14.0, 23.0, 54.0, 155.0, 3149.0, 457.0, 105.0, 37.0, 14.0, 7.0, 12.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00331878662109375, -0.003185272216796875, -0.0030517578125, -0.002918243408203125, -0.00278472900390625, -0.002651214599609375, -0.0025177001953125, -0.002384185791015625, -0.00225067138671875, -0.002117156982421875, -0.001983642578125, -0.001850128173828125, -0.00171661376953125, -0.001583099365234375, -0.0014495849609375, -0.001316070556640625, -0.00118255615234375, -0.001049041748046875, -0.00091552734375, -0.000782012939453125, -0.00064849853515625, -0.000514984130859375, -0.0003814697265625, -0.000247955322265625, -0.00011444091796875, 1.9073486328125e-05, 0.000152587890625, 0.000286102294921875, 0.00041961669921875, 0.000553131103515625, 0.0006866455078125, 0.000820159912109375, 0.00095367431640625, 0.001087188720703125, 0.001220703125, 0.001354217529296875, 0.00148773193359375, 0.001621246337890625, 0.0017547607421875, 0.001888275146484375, 0.00202178955078125, 0.002155303955078125, 0.002288818359375, 0.002422332763671875, 0.00255584716796875, 0.002689361572265625, 0.0028228759765625, 0.002956390380859375, 0.00308990478515625, 0.003223419189453125, 0.00335693359375, 0.003490447998046875, 0.00362396240234375, 0.003757476806640625, 0.0038909912109375, 0.004024505615234375, 0.00415802001953125, 0.004291534423828125, 0.004425048828125, 0.004558563232421875, 0.00469207763671875, 0.004825592041015625, 0.0049591064453125, 0.005092620849609375, 0.00522613525390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 10.0, 16.0, 53.0, 95.0, 149.0, 191.0, 189.0, 139.0, 67.0, 46.0, 14.0, 15.0, 8.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020072799175977707, -0.019483080133795738, -0.01889336109161377, -0.0183036420494318, -0.017713923007249832, -0.017124203965067863, -0.016534484922885895, -0.015944765880703926, -0.015355046838521957, -0.014765327796339989, -0.01417560875415802, -0.013585889711976051, -0.012996170669794083, -0.012406451627612114, -0.011816732585430145, -0.011227013543248177, -0.010637293569743633, -0.010047574527561665, -0.009457855485379696, -0.008868136443197727, -0.008278417401015759, -0.00768869835883379, -0.007098978850990534, -0.006509259808808565, -0.0059195407666265965, -0.005329821724444628, -0.004740102682262659, -0.004150383174419403, -0.003560664365068078, -0.0029709453228861094, -0.002381226047873497, -0.0017915070056915283, -0.0012017879635095596, -0.00061206886311993, -2.2349762730300426e-05, 0.0005673693958669901, 0.0011570884380489588, 0.0017468074802309275, 0.00233652675524354, 0.0029262457974255085, 0.003515964839607477, 0.004105683881789446, 0.0046954029239714146, 0.0052851224318146706, 0.005874841473996639, 0.006464560516178608, 0.007054279558360577, 0.007643998600542545, 0.008233717642724514, 0.008823436684906483, 0.009413155727088451, 0.01000287476927042, 0.010592593811452389, 0.011182312853634357, 0.0117720328271389, 0.01236175186932087, 0.012951470911502838, 0.013541189953684807, 0.014130908995866776, 0.014720628038048744, 0.015310347080230713, 0.01590006612241268, 0.01648978516459465, 0.01707950420677662, 0.017669223248958588]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 8.0, 4.0, 13.0, 8.0, 15.0, 12.0, 14.0, 22.0, 23.0, 26.0, 33.0, 40.0, 42.0, 40.0, 40.0, 41.0, 46.0, 37.0, 44.0, 48.0, 37.0, 50.0, 38.0, 58.0, 31.0, 34.0, 27.0, 18.0, 30.0, 23.0, 20.0, 20.0, 14.0, 8.0, 7.0, 5.0, 3.0, 10.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.007131099700927734, -0.006917395628988743, -0.006703691557049751, -0.00648998748511076, -0.006276283413171768, -0.006062579341232777, -0.005848875269293785, -0.0056351711973547935, -0.005421467125415802, -0.0052077630534768105, -0.004994058981537819, -0.004780354909598827, -0.004566650837659836, -0.004352946765720844, -0.004139242693781853, -0.003925538621842861, -0.0037118345499038696, -0.003498130477964878, -0.0032844264060258865, -0.003070722334086895, -0.0028570182621479034, -0.002643314190208912, -0.0024296101182699203, -0.002215906046330929, -0.0020022019743919373, -0.0017884979024529457, -0.0015747938305139542, -0.0013610897585749626, -0.001147385686635971, -0.0009336816146969795, -0.000719977542757988, -0.0005062734708189964, -0.0002925693988800049, -7.886532694101334e-05, 0.0001348387449979782, 0.00034854281693696976, 0.0005622468888759613, 0.0007759509608149529, 0.0009896550327539444, 0.001203359104692936, 0.0014170631766319275, 0.001630767248570919, 0.0018444713205099106, 0.002058175392448902, 0.0022718794643878937, 0.0024855835363268852, 0.0026992876082658768, 0.0029129916802048683, 0.00312669575214386, 0.0033403998240828514, 0.003554103896021843, 0.0037678079679608345, 0.003981512039899826, 0.004195216111838818, 0.004408920183777809, 0.004622624255716801, 0.004836328327655792, 0.005050032399594784, 0.005263736471533775, 0.005477440543472767, 0.005691144615411758, 0.00590484868735075, 0.0061185527592897415, 0.006332256831228733, 0.006545960903167725]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 3.0, 9.0, 16.0, 19.0, 36.0, 42.0, 100.0, 169.0, 416.0, 953.0, 3070.0, 14543.0, 114880.0, 635166.0, 244675.0, 27205.0, 4820.0, 1346.0, 559.0, 232.0, 108.0, 61.0, 42.0, 25.0, 9.0, 9.0, 9.0, 0.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.033294677734375, -0.03224325180053711, -0.03119182586669922, -0.030140399932861328, -0.029088973999023438, -0.028037548065185547, -0.026986122131347656, -0.025934696197509766, -0.024883270263671875, -0.023831844329833984, -0.022780418395996094, -0.021728992462158203, -0.020677566528320312, -0.019626140594482422, -0.01857471466064453, -0.01752328872680664, -0.01647186279296875, -0.01542043685913086, -0.014369010925292969, -0.013317584991455078, -0.012266159057617188, -0.011214733123779297, -0.010163307189941406, -0.009111881256103516, -0.008060455322265625, -0.007009029388427734, -0.005957603454589844, -0.004906177520751953, -0.0038547515869140625, -0.002803325653076172, -0.0017518997192382812, -0.0007004737854003906, 0.0003509521484375, 0.0014023780822753906, 0.0024538040161132812, 0.003505229949951172, 0.0045566558837890625, 0.005608081817626953, 0.006659507751464844, 0.007710933685302734, 0.008762359619140625, 0.009813785552978516, 0.010865211486816406, 0.011916637420654297, 0.012968063354492188, 0.014019489288330078, 0.015070915222167969, 0.01612234115600586, 0.01717376708984375, 0.01822519302368164, 0.01927661895751953, 0.020328044891357422, 0.021379470825195312, 0.022430896759033203, 0.023482322692871094, 0.024533748626708984, 0.025585174560546875, 0.026636600494384766, 0.027688026428222656, 0.028739452362060547, 0.029790878295898438, 0.030842304229736328, 0.03189373016357422, 0.03294515609741211, 0.03399658203125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 11.0, 5.0, 12.0, 17.0, 26.0, 47.0, 42.0, 63.0, 72.0, 80.0, 78.0, 86.0, 93.0, 79.0, 58.0, 52.0, 48.0, 29.0, 36.0, 18.0, 9.0, 5.0, 9.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02117919921875, -0.020545482635498047, -0.019911766052246094, -0.01927804946899414, -0.018644332885742188, -0.018010616302490234, -0.01737689971923828, -0.016743183135986328, -0.016109466552734375, -0.015475749969482422, -0.014842033386230469, -0.014208316802978516, -0.013574600219726562, -0.01294088363647461, -0.012307167053222656, -0.011673450469970703, -0.01103973388671875, -0.010406017303466797, -0.009772300720214844, -0.00913858413696289, -0.008504867553710938, -0.007871150970458984, -0.007237434387207031, -0.006603717803955078, -0.005970001220703125, -0.005336284637451172, -0.004702568054199219, -0.004068851470947266, -0.0034351348876953125, -0.0028014183044433594, -0.0021677017211914062, -0.0015339851379394531, -0.0009002685546875, -0.0002665519714355469, 0.00036716461181640625, 0.0010008811950683594, 0.0016345977783203125, 0.0022683143615722656, 0.0029020309448242188, 0.003535747528076172, 0.004169464111328125, 0.004803180694580078, 0.005436897277832031, 0.006070613861083984, 0.0067043304443359375, 0.007338047027587891, 0.007971763610839844, 0.008605480194091797, 0.00923919677734375, 0.009872913360595703, 0.010506629943847656, 0.01114034652709961, 0.011774063110351562, 0.012407779693603516, 0.013041496276855469, 0.013675212860107422, 0.014308929443359375, 0.014942646026611328, 0.015576362609863281, 0.016210079193115234, 0.016843795776367188, 0.01747751235961914, 0.018111228942871094, 0.018744945526123047, 0.019378662109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 7.0, 9.0, 14.0, 22.0, 20.0, 33.0, 45.0, 60.0, 76.0, 108.0, 167.0, 200.0, 315.0, 556.0, 1150.0, 4610.0, 33096.0, 424499.0, 532840.0, 42400.0, 5430.0, 1231.0, 580.0, 302.0, 210.0, 148.0, 114.0, 75.0, 60.0, 44.0, 36.0, 24.0, 19.0, 15.0, 8.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02801513671875, -0.02708292007446289, -0.02615070343017578, -0.025218486785888672, -0.024286270141601562, -0.023354053497314453, -0.022421836853027344, -0.021489620208740234, -0.020557403564453125, -0.019625186920166016, -0.018692970275878906, -0.017760753631591797, -0.016828536987304688, -0.015896320343017578, -0.014964103698730469, -0.01403188705444336, -0.01309967041015625, -0.01216745376586914, -0.011235237121582031, -0.010303020477294922, -0.009370803833007812, -0.008438587188720703, -0.007506370544433594, -0.006574153900146484, -0.005641937255859375, -0.004709720611572266, -0.0037775039672851562, -0.002845287322998047, -0.0019130706787109375, -0.0009808540344238281, -4.863739013671875e-05, 0.0008835792541503906, 0.0018157958984375, 0.0027480125427246094, 0.0036802291870117188, 0.004612445831298828, 0.0055446624755859375, 0.006476879119873047, 0.007409095764160156, 0.008341312408447266, 0.009273529052734375, 0.010205745697021484, 0.011137962341308594, 0.012070178985595703, 0.013002395629882812, 0.013934612274169922, 0.014866828918457031, 0.01579904556274414, 0.01673126220703125, 0.01766347885131836, 0.01859569549560547, 0.019527912139892578, 0.020460128784179688, 0.021392345428466797, 0.022324562072753906, 0.023256778717041016, 0.024188995361328125, 0.025121212005615234, 0.026053428649902344, 0.026985645294189453, 0.027917861938476562, 0.028850078582763672, 0.02978229522705078, 0.03071451187133789, 0.031646728515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 13.0, 8.0, 7.0, 14.0, 20.0, 17.0, 24.0, 27.0, 23.0, 39.0, 38.0, 37.0, 43.0, 50.0, 41.0, 41.0, 54.0, 51.0, 50.0, 50.0, 44.0, 47.0, 26.0, 41.0, 27.0, 24.0, 24.0, 22.0, 22.0, 17.0, 11.0, 6.0, 6.0, 6.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.038254737854003906, -0.03689765930175781, -0.03554058074951172, -0.034183502197265625, -0.03282642364501953, -0.03146934509277344, -0.030112266540527344, -0.02875518798828125, -0.027398109436035156, -0.026041030883789062, -0.02468395233154297, -0.023326873779296875, -0.02196979522705078, -0.020612716674804688, -0.019255638122558594, -0.0178985595703125, -0.016541481018066406, -0.015184402465820312, -0.013827323913574219, -0.012470245361328125, -0.011113166809082031, -0.009756088256835938, -0.008399009704589844, -0.00704193115234375, -0.005684852600097656, -0.0043277740478515625, -0.0029706954956054688, -0.001613616943359375, -0.00025653839111328125, 0.0011005401611328125, 0.0024576187133789062, 0.003814697265625, 0.005171775817871094, 0.0065288543701171875, 0.007885932922363281, 0.009243011474609375, 0.010600090026855469, 0.011957168579101562, 0.013314247131347656, 0.01467132568359375, 0.016028404235839844, 0.017385482788085938, 0.01874256134033203, 0.020099639892578125, 0.02145671844482422, 0.022813796997070312, 0.024170875549316406, 0.0255279541015625, 0.026885032653808594, 0.028242111206054688, 0.02959918975830078, 0.030956268310546875, 0.03231334686279297, 0.03367042541503906, 0.035027503967285156, 0.03638458251953125, 0.037741661071777344, 0.03909873962402344, 0.04045581817626953, 0.041812896728515625, 0.04316997528076172, 0.04452705383300781, 0.045884132385253906, 0.0472412109375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 11.0, 12.0, 30.0, 32.0, 54.0, 86.0, 127.0, 201.0, 342.0, 585.0, 1213.0, 2604.0, 6052.0, 16451.0, 55734.0, 238227.0, 504363.0, 161380.0, 39293.0, 12430.0, 4813.0, 2133.0, 1022.0, 526.0, 309.0, 184.0, 105.0, 76.0, 39.0, 37.0, 19.0, 12.0, 9.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0066986083984375, -0.006491661071777344, -0.0062847137451171875, -0.006077766418457031, -0.005870819091796875, -0.005663871765136719, -0.0054569244384765625, -0.005249977111816406, -0.00504302978515625, -0.004836082458496094, -0.0046291351318359375, -0.004422187805175781, -0.004215240478515625, -0.004008293151855469, -0.0038013458251953125, -0.0035943984985351562, -0.003387451171875, -0.0031805038452148438, -0.0029735565185546875, -0.0027666091918945312, -0.002559661865234375, -0.0023527145385742188, -0.0021457672119140625, -0.0019388198852539062, -0.00173187255859375, -0.0015249252319335938, -0.0013179779052734375, -0.0011110305786132812, -0.000904083251953125, -0.0006971359252929688, -0.0004901885986328125, -0.00028324127197265625, -7.62939453125e-05, 0.00013065338134765625, 0.0003376007080078125, 0.0005445480346679688, 0.000751495361328125, 0.0009584426879882812, 0.0011653900146484375, 0.0013723373413085938, 0.00157928466796875, 0.0017862319946289062, 0.0019931793212890625, 0.0022001266479492188, 0.002407073974609375, 0.0026140213012695312, 0.0028209686279296875, 0.0030279159545898438, 0.00323486328125, 0.0034418106079101562, 0.0036487579345703125, 0.0038557052612304688, 0.004062652587890625, 0.004269599914550781, 0.0044765472412109375, 0.004683494567871094, 0.00489044189453125, 0.005097389221191406, 0.0053043365478515625, 0.005511283874511719, 0.005718231201171875, 0.005925178527832031, 0.0061321258544921875, 0.006339073181152344, 0.0065460205078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 9.0, 5.0, 5.0, 8.0, 15.0, 17.0, 19.0, 21.0, 22.0, 36.0, 37.0, 49.0, 47.0, 68.0, 73.0, 89.0, 81.0, 90.0, 54.0, 51.0, 42.0, 42.0, 28.0, 18.0, 19.0, 17.0, 10.0, 7.0, 5.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.167722702026367e-05, -5.034264177083969e-05, -4.900805652141571e-05, -4.767347127199173e-05, -4.633888602256775e-05, -4.500430077314377e-05, -4.366971552371979e-05, -4.233513027429581e-05, -4.1000545024871826e-05, -3.9665959775447845e-05, -3.8331374526023865e-05, -3.6996789276599884e-05, -3.56622040271759e-05, -3.432761877775192e-05, -3.299303352832794e-05, -3.165844827890396e-05, -3.032386302947998e-05, -2.8989277780056e-05, -2.765469253063202e-05, -2.632010728120804e-05, -2.4985522031784058e-05, -2.3650936782360077e-05, -2.2316351532936096e-05, -2.0981766283512115e-05, -1.9647181034088135e-05, -1.8312595784664154e-05, -1.6978010535240173e-05, -1.5643425285816193e-05, -1.4308840036392212e-05, -1.2974254786968231e-05, -1.163966953754425e-05, -1.030508428812027e-05, -8.970499038696289e-06, -7.635913789272308e-06, -6.301328539848328e-06, -4.966743290424347e-06, -3.632158041000366e-06, -2.2975727915763855e-06, -9.629875421524048e-07, 3.7159770727157593e-07, 1.7061829566955566e-06, 3.0407682061195374e-06, 4.375353455543518e-06, 5.709938704967499e-06, 7.0445239543914795e-06, 8.37910920381546e-06, 9.713694453239441e-06, 1.1048279702663422e-05, 1.2382864952087402e-05, 1.3717450201511383e-05, 1.5052035450935364e-05, 1.6386620700359344e-05, 1.7721205949783325e-05, 1.9055791199207306e-05, 2.0390376448631287e-05, 2.1724961698055267e-05, 2.3059546947479248e-05, 2.439413219690323e-05, 2.572871744632721e-05, 2.706330269575119e-05, 2.839788794517517e-05, 2.973247319459915e-05, 3.106705844402313e-05, 3.240164369344711e-05, 3.3736228942871094e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 13.0, 26.0, 40.0, 42.0, 62.0, 141.0, 236.0, 333.0, 617.0, 1436.0, 3481.0, 9610.0, 35869.0, 176324.0, 549689.0, 210410.0, 42019.0, 10934.0, 3853.0, 1630.0, 755.0, 407.0, 225.0, 129.0, 71.0, 55.0, 39.0, 19.0, 20.0, 11.0, 10.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00632476806640625, -0.006086587905883789, -0.005848407745361328, -0.005610227584838867, -0.005372047424316406, -0.005133867263793945, -0.004895687103271484, -0.0046575069427490234, -0.0044193267822265625, -0.0041811466217041016, -0.003942966461181641, -0.0037047863006591797, -0.0034666061401367188, -0.003228425979614258, -0.002990245819091797, -0.002752065658569336, -0.002513885498046875, -0.002275705337524414, -0.002037525177001953, -0.0017993450164794922, -0.0015611648559570312, -0.0013229846954345703, -0.0010848045349121094, -0.0008466243743896484, -0.0006084442138671875, -0.00037026405334472656, -0.00013208389282226562, 0.00010609626770019531, 0.00034427642822265625, 0.0005824565887451172, 0.0008206367492675781, 0.001058816909790039, 0.0012969970703125, 0.001535177230834961, 0.0017733573913574219, 0.002011537551879883, 0.0022497177124023438, 0.0024878978729248047, 0.0027260780334472656, 0.0029642581939697266, 0.0032024383544921875, 0.0034406185150146484, 0.0036787986755371094, 0.00391697883605957, 0.004155158996582031, 0.004393339157104492, 0.004631519317626953, 0.004869699478149414, 0.005107879638671875, 0.005346059799194336, 0.005584239959716797, 0.005822420120239258, 0.006060600280761719, 0.00629878044128418, 0.006536960601806641, 0.0067751407623291016, 0.0070133209228515625, 0.0072515010833740234, 0.007489681243896484, 0.007727861404418945, 0.007966041564941406, 0.008204221725463867, 0.008442401885986328, 0.008680582046508789, 0.00891876220703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 8.0, 10.0, 16.0, 24.0, 22.0, 40.0, 36.0, 46.0, 57.0, 64.0, 76.0, 86.0, 98.0, 59.0, 71.0, 55.0, 44.0, 43.0, 41.0, 18.0, 16.0, 16.0, 16.0, 7.0, 5.0, 10.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00841522216796875, -0.008103728294372559, -0.007792234420776367, -0.007480740547180176, -0.007169246673583984, -0.006857752799987793, -0.0065462589263916016, -0.00623476505279541, -0.005923271179199219, -0.005611777305603027, -0.005300283432006836, -0.0049887895584106445, -0.004677295684814453, -0.004365801811218262, -0.00405430793762207, -0.003742814064025879, -0.0034313201904296875, -0.003119826316833496, -0.0028083324432373047, -0.0024968385696411133, -0.002185344696044922, -0.0018738508224487305, -0.001562356948852539, -0.0012508630752563477, -0.0009393692016601562, -0.0006278753280639648, -0.00031638145446777344, -4.887580871582031e-06, 0.0003066062927246094, 0.0006181001663208008, 0.0009295940399169922, 0.0012410879135131836, 0.001552581787109375, 0.0018640756607055664, 0.002175569534301758, 0.0024870634078979492, 0.0027985572814941406, 0.003110051155090332, 0.0034215450286865234, 0.003733038902282715, 0.004044532775878906, 0.004356026649475098, 0.004667520523071289, 0.0049790143966674805, 0.005290508270263672, 0.005602002143859863, 0.005913496017456055, 0.006224989891052246, 0.0065364837646484375, 0.006847977638244629, 0.00715947151184082, 0.007470965385437012, 0.007782459259033203, 0.008093953132629395, 0.008405447006225586, 0.008716940879821777, 0.009028434753417969, 0.00933992862701416, 0.009651422500610352, 0.009962916374206543, 0.010274410247802734, 0.010585904121398926, 0.010897397994995117, 0.011208891868591309, 0.0115203857421875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 60.0, 316.0, 451.0, 150.0, 21.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.518557071685791, -0.4995139539241791, -0.48047083616256714, -0.4614277482032776, -0.44238463044166565, -0.4233415126800537, -0.40429842472076416, -0.3852553069591522, -0.3662121891975403, -0.34716907143592834, -0.3281259536743164, -0.30908286571502686, -0.2900397479534149, -0.270996630191803, -0.2519535422325134, -0.2329104244709015, -0.21386730670928955, -0.1948241889476776, -0.17578108608722687, -0.15673798322677612, -0.13769486546516418, -0.11865175515413284, -0.0996086448431015, -0.08056554198265076, -0.06152242422103882, -0.04247931391000748, -0.023436203598976135, -0.004393093287944794, 0.014650017023086548, 0.03369312733411789, 0.05273623764514923, 0.07177934050559998, 0.09082245826721191, 0.10986556857824326, 0.1289086788892746, 0.14795178174972534, 0.16699489951133728, 0.18603801727294922, 0.20508112013339996, 0.2241242229938507, 0.24316734075546265, 0.2622104585170746, 0.2812535762786865, 0.3002966642379761, 0.319339781999588, 0.33838289976119995, 0.3574259877204895, 0.37646910548210144, 0.3955122232437134, 0.4145553410053253, 0.43359845876693726, 0.4526415467262268, 0.47168466448783875, 0.4907277822494507, 0.5097708702087402, 0.5288139581680298, 0.5478571057319641, 0.5669001936912537, 0.585943341255188, 0.6049864292144775, 0.6240295171737671, 0.6430726647377014, 0.662115752696991, 0.6811589002609253, 0.7002019882202148]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 5.0, 6.0, 10.0, 10.0, 12.0, 18.0, 29.0, 21.0, 24.0, 18.0, 28.0, 26.0, 38.0, 42.0, 37.0, 44.0, 49.0, 50.0, 43.0, 36.0, 44.0, 39.0, 34.0, 45.0, 28.0, 26.0, 29.0, 37.0, 23.0, 22.0, 18.0, 14.0, 12.0, 11.0, 8.0, 9.0, 3.0, 9.0, 6.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.20752465724945068, -0.2016763836145401, -0.19582809507846832, -0.18997982144355774, -0.18413153290748596, -0.17828325927257538, -0.1724349856376648, -0.16658669710159302, -0.16073842346668243, -0.15489014983177185, -0.14904186129570007, -0.1431935876607895, -0.1373453140258789, -0.13149702548980713, -0.12564875185489655, -0.11980047076940536, -0.11395218968391418, -0.108103908598423, -0.10225562751293182, -0.09640735387802124, -0.09055907279253006, -0.08471079170703888, -0.0788625180721283, -0.07301423698663712, -0.06716595590114594, -0.061317674815654755, -0.05546939745545387, -0.04962112009525299, -0.04377283900976181, -0.03792455792427063, -0.03207628056406975, -0.026228003203868866, -0.020379722118377686, -0.014531442895531654, -0.008683163672685623, -0.002834884449839592, 0.003013394773006439, 0.00886167399585247, 0.014709953218698502, 0.020558230578899384, 0.026406511664390564, 0.032254792749881744, 0.038103070110082626, 0.04395134747028351, 0.04979962855577469, 0.05564790964126587, 0.06149618700146675, 0.06734446436166763, 0.07319274544715881, 0.07904102653265, 0.08488930761814117, 0.09073758125305176, 0.09658586233854294, 0.10243414342403412, 0.1082824170589447, 0.11413069814443588, 0.11997897922992706, 0.12582725286483765, 0.13167554140090942, 0.13752381503582, 0.1433720886707306, 0.14922037720680237, 0.15506865084171295, 0.16091692447662354, 0.1667652130126953]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 7.0, 6.0, 7.0, 10.0, 15.0, 24.0, 41.0, 60.0, 65.0, 153.0, 239.0, 440.0, 1016.0, 3049.0, 14503.0, 525816.0, 3626915.0, 16527.0, 3199.0, 1062.0, 481.0, 230.0, 142.0, 81.0, 73.0, 28.0, 21.0, 20.0, 4.0, 12.0, 3.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0231781005859375, -0.022287607192993164, -0.021397113800048828, -0.020506620407104492, -0.019616127014160156, -0.01872563362121582, -0.017835140228271484, -0.01694464683532715, -0.016054153442382812, -0.015163660049438477, -0.01427316665649414, -0.013382673263549805, -0.012492179870605469, -0.011601686477661133, -0.010711193084716797, -0.009820699691772461, -0.008930206298828125, -0.008039712905883789, -0.007149219512939453, -0.006258726119995117, -0.005368232727050781, -0.004477739334106445, -0.0035872459411621094, -0.0026967525482177734, -0.0018062591552734375, -0.0009157657623291016, -2.5272369384765625e-05, 0.0008652210235595703, 0.0017557144165039062, 0.002646207809448242, 0.003536701202392578, 0.004427194595336914, 0.00531768798828125, 0.006208181381225586, 0.007098674774169922, 0.007989168167114258, 0.008879661560058594, 0.00977015495300293, 0.010660648345947266, 0.011551141738891602, 0.012441635131835938, 0.013332128524780273, 0.01422262191772461, 0.015113115310668945, 0.01600360870361328, 0.016894102096557617, 0.017784595489501953, 0.01867508888244629, 0.019565582275390625, 0.02045607566833496, 0.021346569061279297, 0.022237062454223633, 0.02312755584716797, 0.024018049240112305, 0.02490854263305664, 0.025799036026000977, 0.026689529418945312, 0.02758002281188965, 0.028470516204833984, 0.02936100959777832, 0.030251502990722656, 0.031141996383666992, 0.03203248977661133, 0.032922983169555664, 0.0338134765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 1.0, 7.0, 9.0, 8.0, 26.0, 30.0, 38.0, 37.0, 54.0, 73.0, 66.0, 85.0, 85.0, 74.0, 82.0, 85.0, 54.0, 51.0, 36.0, 30.0, 15.0, 10.0, 3.0, 8.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021087646484375, -0.020461082458496094, -0.019834518432617188, -0.01920795440673828, -0.018581390380859375, -0.01795482635498047, -0.017328262329101562, -0.016701698303222656, -0.01607513427734375, -0.015448570251464844, -0.014822006225585938, -0.014195442199707031, -0.013568878173828125, -0.012942314147949219, -0.012315750122070312, -0.011689186096191406, -0.0110626220703125, -0.010436058044433594, -0.009809494018554688, -0.009182929992675781, -0.008556365966796875, -0.007929801940917969, -0.0073032379150390625, -0.006676673889160156, -0.00605010986328125, -0.005423545837402344, -0.0047969818115234375, -0.004170417785644531, -0.003543853759765625, -0.0029172897338867188, -0.0022907257080078125, -0.0016641616821289062, -0.00103759765625, -0.00041103363037109375, 0.0002155303955078125, 0.0008420944213867188, 0.001468658447265625, 0.0020952224731445312, 0.0027217864990234375, 0.0033483505249023438, 0.00397491455078125, 0.004601478576660156, 0.0052280426025390625, 0.005854606628417969, 0.006481170654296875, 0.007107734680175781, 0.0077342987060546875, 0.008360862731933594, 0.0089874267578125, 0.009613990783691406, 0.010240554809570312, 0.010867118835449219, 0.011493682861328125, 0.012120246887207031, 0.012746810913085938, 0.013373374938964844, 0.01399993896484375, 0.014626502990722656, 0.015253067016601562, 0.01587963104248047, 0.016506195068359375, 0.01713275909423828, 0.017759323120117188, 0.018385887145996094, 0.019012451171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 0.0, 7.0, 11.0, 3.0, 18.0, 12.0, 27.0, 30.0, 36.0, 49.0, 69.0, 93.0, 128.0, 177.0, 295.0, 526.0, 893.0, 1782.0, 3444.0, 9251.0, 37220.0, 456455.0, 3605461.0, 56946.0, 12163.0, 4396.0, 2034.0, 1107.0, 595.0, 311.0, 210.0, 141.0, 91.0, 64.0, 58.0, 38.0, 34.0, 27.0, 15.0, 13.0, 11.0, 10.0, 15.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0117034912109375, -0.011339068412780762, -0.010974645614624023, -0.010610222816467285, -0.010245800018310547, -0.009881377220153809, -0.00951695442199707, -0.009152531623840332, -0.008788108825683594, -0.008423686027526855, -0.008059263229370117, -0.007694840431213379, -0.007330417633056641, -0.006965994834899902, -0.006601572036743164, -0.006237149238586426, -0.0058727264404296875, -0.005508303642272949, -0.005143880844116211, -0.004779458045959473, -0.004415035247802734, -0.004050612449645996, -0.003686189651489258, -0.0033217668533325195, -0.0029573440551757812, -0.002592921257019043, -0.0022284984588623047, -0.0018640756607055664, -0.0014996528625488281, -0.0011352300643920898, -0.0007708072662353516, -0.0004063844680786133, -4.1961669921875e-05, 0.0003224611282348633, 0.0006868839263916016, 0.0010513067245483398, 0.0014157295227050781, 0.0017801523208618164, 0.0021445751190185547, 0.002508997917175293, 0.0028734207153320312, 0.0032378435134887695, 0.003602266311645508, 0.003966689109802246, 0.004331111907958984, 0.004695534706115723, 0.005059957504272461, 0.005424380302429199, 0.0057888031005859375, 0.006153225898742676, 0.006517648696899414, 0.006882071495056152, 0.007246494293212891, 0.007610917091369629, 0.007975339889526367, 0.008339762687683105, 0.008704185485839844, 0.009068608283996582, 0.00943303108215332, 0.009797453880310059, 0.010161876678466797, 0.010526299476623535, 0.010890722274780273, 0.011255145072937012, 0.01161956787109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 7.0, 10.0, 12.0, 17.0, 43.0, 89.0, 192.0, 2862.0, 518.0, 141.0, 72.0, 38.0, 12.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003871917724609375, -0.0037640929222106934, -0.0036562681198120117, -0.00354844331741333, -0.0034406185150146484, -0.003332793712615967, -0.003224968910217285, -0.0031171441078186035, -0.003009319305419922, -0.0029014945030212402, -0.0027936697006225586, -0.002685844898223877, -0.0025780200958251953, -0.0024701952934265137, -0.002362370491027832, -0.0022545456886291504, -0.0021467208862304688, -0.002038896083831787, -0.0019310712814331055, -0.0018232464790344238, -0.0017154216766357422, -0.0016075968742370605, -0.001499772071838379, -0.0013919472694396973, -0.0012841224670410156, -0.001176297664642334, -0.0010684728622436523, -0.0009606480598449707, -0.0008528232574462891, -0.0007449984550476074, -0.0006371736526489258, -0.0005293488502502441, -0.0004215240478515625, -0.00031369924545288086, -0.00020587444305419922, -9.804964065551758e-05, 9.775161743164062e-06, 0.0001175999641418457, 0.00022542476654052734, 0.000333249568939209, 0.0004410743713378906, 0.0005488991737365723, 0.0006567239761352539, 0.0007645487785339355, 0.0008723735809326172, 0.0009801983833312988, 0.0010880231857299805, 0.0011958479881286621, 0.0013036727905273438, 0.0014114975929260254, 0.001519322395324707, 0.0016271471977233887, 0.0017349720001220703, 0.001842796802520752, 0.0019506216049194336, 0.0020584464073181152, 0.002166271209716797, 0.0022740960121154785, 0.00238192081451416, 0.002489745616912842, 0.0025975704193115234, 0.002705395221710205, 0.0028132200241088867, 0.0029210448265075684, 0.00302886962890625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 14.0, 32.0, 168.0, 436.0, 287.0, 59.0, 12.0, 1.0, 1.0, 1.0], "bins": [-0.09188259392976761, -0.09029620885848999, -0.08870981633663177, -0.08712343126535416, -0.08553703874349594, -0.08395065367221832, -0.0823642686009407, -0.08077787607908249, -0.07919149100780487, -0.07760510593652725, -0.07601871341466904, -0.07443232834339142, -0.0728459358215332, -0.07125955075025558, -0.06967316567897797, -0.06808677315711975, -0.06650038808584213, -0.06491400301456451, -0.0633276104927063, -0.06174122542142868, -0.060154836624860764, -0.05856844782829285, -0.05698205903172493, -0.05539567023515701, -0.053809281438589096, -0.05222289264202118, -0.05063650384545326, -0.049050118774175644, -0.04746372997760773, -0.04587734118103981, -0.04429095238447189, -0.042704567313194275, -0.04111817851662636, -0.03953178972005844, -0.037945400923490524, -0.036359015852212906, -0.03477262705564499, -0.03318623825907707, -0.031599849462509155, -0.030013462528586388, -0.02842707559466362, -0.026840686798095703, -0.025254299864172935, -0.02366791106760502, -0.02208152413368225, -0.020495135337114334, -0.018908746540546417, -0.01732235960662365, -0.015735970810055733, -0.01414958294481039, -0.012563195079565048, -0.010976806282997131, -0.009390419349074364, -0.007804030552506447, -0.006217642687261105, -0.004631254822015762, -0.00304486695677042, -0.001458478975109756, 0.0001279090065509081, 0.001714297104626894, 0.0033006849698722363, 0.004887073300778866, 0.006473461166024208, 0.00805984903126955, 0.009646236896514893]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 2.0, 12.0, 8.0, 14.0, 16.0, 10.0, 16.0, 19.0, 24.0, 19.0, 36.0, 28.0, 31.0, 41.0, 28.0, 41.0, 39.0, 26.0, 33.0, 43.0, 39.0, 38.0, 37.0, 46.0, 31.0, 50.0, 38.0, 30.0, 19.0, 30.0, 28.0, 19.0, 17.0, 22.0, 12.0, 9.0, 14.0, 9.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.007353544235229492, -0.007127969525754452, -0.006902394816279411, -0.006676820106804371, -0.0064512453973293304, -0.00622567068785429, -0.00600009597837925, -0.005774521268904209, -0.005548946559429169, -0.005323371849954128, -0.005097797140479088, -0.004872222431004047, -0.004646647721529007, -0.0044210730120539665, -0.004195498302578926, -0.003969923593103886, -0.003744348883628845, -0.0035187741741538048, -0.0032931994646787643, -0.003067624755203724, -0.0028420500457286835, -0.002616475336253643, -0.0023909006267786026, -0.002165325917303562, -0.0019397512078285217, -0.0017141764983534813, -0.0014886017888784409, -0.0012630270794034004, -0.00103745236992836, -0.0008118776604533195, -0.0005863029509782791, -0.0003607282415032387, -0.00013515353202819824, 9.04211774468422e-05, 0.00031599588692188263, 0.0005415705963969231, 0.0007671453058719635, 0.000992720015347004, 0.0012182947248220444, 0.0014438694342970848, 0.0016694441437721252, 0.0018950188532471657, 0.002120593562722206, 0.0023461682721972466, 0.002571742981672287, 0.0027973176911473274, 0.003022892400622368, 0.0032484671100974083, 0.0034740418195724487, 0.003699616529047489, 0.00392519123852253, 0.00415076594799757, 0.0043763406574726105, 0.004601915366947651, 0.004827490076422691, 0.005053064785897732, 0.005278639495372772, 0.005504214204847813, 0.005729788914322853, 0.0059553636237978935, 0.006180938333272934, 0.006406513042747974, 0.006632087752223015, 0.006857662461698055, 0.007083237171173096]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 4.0, 6.0, 5.0, 12.0, 20.0, 30.0, 44.0, 75.0, 145.0, 298.0, 551.0, 1260.0, 3087.0, 8925.0, 32006.0, 157326.0, 530439.0, 247697.0, 47229.0, 12331.0, 4055.0, 1555.0, 697.0, 342.0, 171.0, 98.0, 53.0, 22.0, 19.0, 14.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.02239990234375, -0.0217134952545166, -0.021027088165283203, -0.020340681076049805, -0.019654273986816406, -0.018967866897583008, -0.01828145980834961, -0.01759505271911621, -0.016908645629882812, -0.016222238540649414, -0.015535831451416016, -0.014849424362182617, -0.014163017272949219, -0.01347661018371582, -0.012790203094482422, -0.012103796005249023, -0.011417388916015625, -0.010730981826782227, -0.010044574737548828, -0.00935816764831543, -0.008671760559082031, -0.007985353469848633, -0.007298946380615234, -0.006612539291381836, -0.0059261322021484375, -0.005239725112915039, -0.004553318023681641, -0.003866910934448242, -0.0031805038452148438, -0.0024940967559814453, -0.0018076896667480469, -0.0011212825775146484, -0.00043487548828125, 0.00025153160095214844, 0.0009379386901855469, 0.0016243457794189453, 0.0023107528686523438, 0.002997159957885742, 0.0036835670471191406, 0.004369974136352539, 0.0050563812255859375, 0.005742788314819336, 0.006429195404052734, 0.007115602493286133, 0.007802009582519531, 0.00848841667175293, 0.009174823760986328, 0.009861230850219727, 0.010547637939453125, 0.011234045028686523, 0.011920452117919922, 0.01260685920715332, 0.013293266296386719, 0.013979673385620117, 0.014666080474853516, 0.015352487564086914, 0.016038894653320312, 0.01672530174255371, 0.01741170883178711, 0.018098115921020508, 0.018784523010253906, 0.019470930099487305, 0.020157337188720703, 0.0208437442779541, 0.0215301513671875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 6.0, 3.0, 13.0, 11.0, 17.0, 33.0, 33.0, 39.0, 42.0, 69.0, 78.0, 78.0, 80.0, 80.0, 76.0, 72.0, 74.0, 55.0, 37.0, 33.0, 17.0, 13.0, 4.0, 8.0, 4.0, 7.0, 7.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02117919921875, -0.0205538272857666, -0.019928455352783203, -0.019303083419799805, -0.018677711486816406, -0.018052339553833008, -0.01742696762084961, -0.01680159568786621, -0.016176223754882812, -0.015550851821899414, -0.014925479888916016, -0.014300107955932617, -0.013674736022949219, -0.01304936408996582, -0.012423992156982422, -0.011798620223999023, -0.011173248291015625, -0.010547876358032227, -0.009922504425048828, -0.00929713249206543, -0.008671760559082031, -0.008046388626098633, -0.007421016693115234, -0.006795644760131836, -0.0061702728271484375, -0.005544900894165039, -0.004919528961181641, -0.004294157028198242, -0.0036687850952148438, -0.0030434131622314453, -0.002418041229248047, -0.0017926692962646484, -0.00116729736328125, -0.0005419254302978516, 8.344650268554688e-05, 0.0007088184356689453, 0.0013341903686523438, 0.001959562301635742, 0.0025849342346191406, 0.003210306167602539, 0.0038356781005859375, 0.004461050033569336, 0.005086421966552734, 0.005711793899536133, 0.006337165832519531, 0.00696253776550293, 0.007587909698486328, 0.008213281631469727, 0.008838653564453125, 0.009464025497436523, 0.010089397430419922, 0.01071476936340332, 0.011340141296386719, 0.011965513229370117, 0.012590885162353516, 0.013216257095336914, 0.013841629028320312, 0.014467000961303711, 0.01509237289428711, 0.015717744827270508, 0.016343116760253906, 0.016968488693237305, 0.017593860626220703, 0.0182192325592041, 0.0188446044921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 10.0, 20.0, 31.0, 44.0, 83.0, 144.0, 243.0, 522.0, 1657.0, 12867.0, 682002.0, 341039.0, 7474.0, 1318.0, 482.0, 246.0, 126.0, 74.0, 45.0, 43.0, 26.0, 14.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041290283203125, -0.03986167907714844, -0.038433074951171875, -0.03700447082519531, -0.03557586669921875, -0.03414726257324219, -0.032718658447265625, -0.03129005432128906, -0.0298614501953125, -0.028432846069335938, -0.027004241943359375, -0.025575637817382812, -0.02414703369140625, -0.022718429565429688, -0.021289825439453125, -0.019861221313476562, -0.0184326171875, -0.017004013061523438, -0.015575408935546875, -0.014146804809570312, -0.01271820068359375, -0.011289596557617188, -0.009860992431640625, -0.008432388305664062, -0.0070037841796875, -0.0055751800537109375, -0.004146575927734375, -0.0027179718017578125, -0.00128936767578125, 0.0001392364501953125, 0.001567840576171875, 0.0029964447021484375, 0.004425048828125, 0.0058536529541015625, 0.007282257080078125, 0.008710861206054688, 0.01013946533203125, 0.011568069458007812, 0.012996673583984375, 0.014425277709960938, 0.0158538818359375, 0.017282485961914062, 0.018711090087890625, 0.020139694213867188, 0.02156829833984375, 0.022996902465820312, 0.024425506591796875, 0.025854110717773438, 0.02728271484375, 0.028711318969726562, 0.030139923095703125, 0.03156852722167969, 0.03299713134765625, 0.03442573547363281, 0.035854339599609375, 0.03728294372558594, 0.0387115478515625, 0.04014015197753906, 0.041568756103515625, 0.04299736022949219, 0.04442596435546875, 0.04585456848144531, 0.047283172607421875, 0.04871177673339844, 0.050140380859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 17.0, 14.0, 15.0, 25.0, 27.0, 23.0, 26.0, 49.0, 51.0, 51.0, 72.0, 72.0, 47.0, 64.0, 57.0, 64.0, 49.0, 58.0, 42.0, 44.0, 32.0, 25.0, 13.0, 16.0, 18.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05078125, -0.049007415771484375, -0.04723358154296875, -0.045459747314453125, -0.0436859130859375, -0.041912078857421875, -0.04013824462890625, -0.038364410400390625, -0.036590576171875, -0.034816741943359375, -0.03304290771484375, -0.031269073486328125, -0.0294952392578125, -0.027721405029296875, -0.02594757080078125, -0.024173736572265625, -0.02239990234375, -0.020626068115234375, -0.01885223388671875, -0.017078399658203125, -0.0153045654296875, -0.013530731201171875, -0.01175689697265625, -0.009983062744140625, -0.008209228515625, -0.006435394287109375, -0.00466156005859375, -0.002887725830078125, -0.0011138916015625, 0.000659942626953125, 0.00243377685546875, 0.004207611083984375, 0.0059814453125, 0.007755279541015625, 0.00952911376953125, 0.011302947998046875, 0.0130767822265625, 0.014850616455078125, 0.01662445068359375, 0.018398284912109375, 0.020172119140625, 0.021945953369140625, 0.02371978759765625, 0.025493621826171875, 0.0272674560546875, 0.029041290283203125, 0.03081512451171875, 0.032588958740234375, 0.03436279296875, 0.036136627197265625, 0.03791046142578125, 0.039684295654296875, 0.0414581298828125, 0.043231964111328125, 0.04500579833984375, 0.046779632568359375, 0.048553466796875, 0.050327301025390625, 0.05210113525390625, 0.053874969482421875, 0.0556488037109375, 0.057422637939453125, 0.05919647216796875, 0.060970306396484375, 0.062744140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 38.0, 83.0, 231.0, 866.0, 18099.0, 1017896.0, 10319.0, 630.0, 204.0, 77.0, 38.0, 16.0, 6.0, 6.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.054351806640625, -0.05318140983581543, -0.05201101303100586, -0.05084061622619629, -0.04967021942138672, -0.04849982261657715, -0.04732942581176758, -0.04615902900695801, -0.04498863220214844, -0.04381823539733887, -0.0426478385925293, -0.04147744178771973, -0.040307044982910156, -0.039136648178100586, -0.037966251373291016, -0.036795854568481445, -0.035625457763671875, -0.034455060958862305, -0.033284664154052734, -0.032114267349243164, -0.030943870544433594, -0.029773473739624023, -0.028603076934814453, -0.027432680130004883, -0.026262283325195312, -0.025091886520385742, -0.023921489715576172, -0.0227510929107666, -0.02158069610595703, -0.02041029930114746, -0.01923990249633789, -0.01806950569152832, -0.01689910888671875, -0.01572871208190918, -0.01455831527709961, -0.013387918472290039, -0.012217521667480469, -0.011047124862670898, -0.009876728057861328, -0.008706331253051758, -0.0075359344482421875, -0.006365537643432617, -0.005195140838623047, -0.0040247440338134766, -0.0028543472290039062, -0.001683950424194336, -0.0005135536193847656, 0.0006568431854248047, 0.001827239990234375, 0.0029976367950439453, 0.004168033599853516, 0.005338430404663086, 0.006508827209472656, 0.0076792240142822266, 0.008849620819091797, 0.010020017623901367, 0.011190414428710938, 0.012360811233520508, 0.013531208038330078, 0.014701604843139648, 0.01587200164794922, 0.01704239845275879, 0.01821279525756836, 0.01938319206237793, 0.0205535888671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 14.0, 23.0, 48.0, 83.0, 144.0, 202.0, 206.0, 111.0, 75.0, 34.0, 15.0, 13.0, 13.0, 5.0, 6.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.00016641616821289062, -0.00016314350068569183, -0.00015987083315849304, -0.00015659816563129425, -0.00015332549810409546, -0.00015005283057689667, -0.00014678016304969788, -0.00014350749552249908, -0.0001402348279953003, -0.0001369621604681015, -0.0001336894929409027, -0.00013041682541370392, -0.00012714415788650513, -0.00012387149035930634, -0.00012059882283210754, -0.00011732615530490875, -0.00011405348777770996, -0.00011078082025051117, -0.00010750815272331238, -0.00010423548519611359, -0.0001009628176689148, -9.7690150141716e-05, -9.441748261451721e-05, -9.114481508731842e-05, -8.787214756011963e-05, -8.459948003292084e-05, -8.132681250572205e-05, -7.805414497852325e-05, -7.478147745132446e-05, -7.150880992412567e-05, -6.823614239692688e-05, -6.496347486972809e-05, -6.16908073425293e-05, -5.8418139815330505e-05, -5.5145472288131714e-05, -5.187280476093292e-05, -4.860013723373413e-05, -4.532746970653534e-05, -4.205480217933655e-05, -3.8782134652137756e-05, -3.5509467124938965e-05, -3.223679959774017e-05, -2.8964132070541382e-05, -2.569146454334259e-05, -2.24187970161438e-05, -1.9146129488945007e-05, -1.5873461961746216e-05, -1.2600794434547424e-05, -9.328126907348633e-06, -6.055459380149841e-06, -2.78279185295105e-06, 4.898756742477417e-07, 3.762543201446533e-06, 7.035210728645325e-06, 1.0307878255844116e-05, 1.3580545783042908e-05, 1.68532133102417e-05, 2.012588083744049e-05, 2.3398548364639282e-05, 2.6671215891838074e-05, 2.9943883419036865e-05, 3.321655094623566e-05, 3.648921847343445e-05, 3.976188600063324e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 10.0, 16.0, 18.0, 36.0, 68.0, 157.0, 298.0, 974.0, 5597.0, 325743.0, 705468.0, 8273.0, 1178.0, 358.0, 180.0, 88.0, 38.0, 16.0, 11.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02093505859375, -0.020189523696899414, -0.019443988800048828, -0.018698453903198242, -0.017952919006347656, -0.01720738410949707, -0.016461849212646484, -0.0157163143157959, -0.014970779418945312, -0.014225244522094727, -0.01347970962524414, -0.012734174728393555, -0.011988639831542969, -0.011243104934692383, -0.010497570037841797, -0.009752035140991211, -0.009006500244140625, -0.008260965347290039, -0.007515430450439453, -0.006769895553588867, -0.006024360656738281, -0.005278825759887695, -0.004533290863037109, -0.0037877559661865234, -0.0030422210693359375, -0.0022966861724853516, -0.0015511512756347656, -0.0008056163787841797, -6.008148193359375e-05, 0.0006854534149169922, 0.0014309883117675781, 0.002176523208618164, 0.00292205810546875, 0.003667593002319336, 0.004413127899169922, 0.005158662796020508, 0.005904197692871094, 0.00664973258972168, 0.007395267486572266, 0.008140802383422852, 0.008886337280273438, 0.009631872177124023, 0.01037740707397461, 0.011122941970825195, 0.011868476867675781, 0.012614011764526367, 0.013359546661376953, 0.014105081558227539, 0.014850616455078125, 0.015596151351928711, 0.016341686248779297, 0.017087221145629883, 0.01783275604248047, 0.018578290939331055, 0.01932382583618164, 0.020069360733032227, 0.020814895629882812, 0.0215604305267334, 0.022305965423583984, 0.02305150032043457, 0.023797035217285156, 0.024542570114135742, 0.025288105010986328, 0.026033639907836914, 0.0267791748046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 36.0, 128.0, 325.0, 329.0, 115.0, 32.0, 18.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036102294921875, -0.034714698791503906, -0.03332710266113281, -0.03193950653076172, -0.030551910400390625, -0.02916431427001953, -0.027776718139648438, -0.026389122009277344, -0.02500152587890625, -0.023613929748535156, -0.022226333618164062, -0.02083873748779297, -0.019451141357421875, -0.01806354522705078, -0.016675949096679688, -0.015288352966308594, -0.0139007568359375, -0.012513160705566406, -0.011125564575195312, -0.009737968444824219, -0.008350372314453125, -0.006962776184082031, -0.0055751800537109375, -0.004187583923339844, -0.00279998779296875, -0.0014123916625976562, -2.47955322265625e-05, 0.0013628005981445312, 0.002750396728515625, 0.004137992858886719, 0.0055255889892578125, 0.006913185119628906, 0.00830078125, 0.009688377380371094, 0.011075973510742188, 0.012463569641113281, 0.013851165771484375, 0.015238761901855469, 0.016626358032226562, 0.018013954162597656, 0.01940155029296875, 0.020789146423339844, 0.022176742553710938, 0.02356433868408203, 0.024951934814453125, 0.02633953094482422, 0.027727127075195312, 0.029114723205566406, 0.0305023193359375, 0.031889915466308594, 0.03327751159667969, 0.03466510772705078, 0.036052703857421875, 0.03744029998779297, 0.03882789611816406, 0.040215492248535156, 0.04160308837890625, 0.042990684509277344, 0.04437828063964844, 0.04576587677001953, 0.047153472900390625, 0.04854106903076172, 0.04992866516113281, 0.051316261291503906, 0.052703857421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 94.0, 316.0, 370.0, 132.0, 41.0, 14.0, 15.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42696258425712585, -0.4121873378753662, -0.39741209149360657, -0.3826368451118469, -0.3678615987300873, -0.35308635234832764, -0.338311105966568, -0.32353585958480835, -0.3087606132030487, -0.29398536682128906, -0.2792101204395294, -0.2644348740577698, -0.24965962767601013, -0.2348843812942505, -0.22010913491249084, -0.2053338885307312, -0.19055864214897156, -0.17578339576721191, -0.16100814938545227, -0.14623290300369263, -0.13145765662193298, -0.11668241024017334, -0.1019071638584137, -0.08713191747665405, -0.07235667109489441, -0.057581424713134766, -0.04280617833137512, -0.02803093194961548, -0.013255685567855835, 0.0015195608139038086, 0.016294807195663452, 0.031070053577423096, 0.04584532976150513, 0.06062057614326477, 0.07539582252502441, 0.09017106890678406, 0.1049463152885437, 0.11972156167030334, 0.134496808052063, 0.14927205443382263, 0.16404730081558228, 0.17882254719734192, 0.19359779357910156, 0.2083730399608612, 0.22314828634262085, 0.2379235327243805, 0.25269877910614014, 0.2674740254878998, 0.2822492718696594, 0.29702451825141907, 0.3117997646331787, 0.32657501101493835, 0.341350257396698, 0.35612550377845764, 0.3709007501602173, 0.38567599654197693, 0.4004512429237366, 0.4152264893054962, 0.43000173568725586, 0.4447769820690155, 0.45955222845077515, 0.4743274748325348, 0.48910272121429443, 0.5038779973983765, 0.5186532139778137]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 12.0, 9.0, 9.0, 15.0, 23.0, 28.0, 33.0, 39.0, 40.0, 61.0, 40.0, 68.0, 56.0, 58.0, 68.0, 58.0, 60.0, 51.0, 44.0, 41.0, 42.0, 24.0, 26.0, 16.0, 22.0, 16.0, 11.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.34668922424316406, -0.3384120464324951, -0.33013486862182617, -0.3218576908111572, -0.3135804831981659, -0.30530330538749695, -0.297026127576828, -0.28874894976615906, -0.2804717719554901, -0.27219459414482117, -0.2639174163341522, -0.2556402087211609, -0.24736304581165314, -0.239085853099823, -0.23080867528915405, -0.2225314974784851, -0.21425430476665497, -0.20597712695598602, -0.19769993424415588, -0.18942275643348694, -0.181145578622818, -0.17286840081214905, -0.1645912081003189, -0.15631403028964996, -0.14803683757781982, -0.13975965976715088, -0.13148246705532074, -0.1232052892446518, -0.11492811143398285, -0.1066509261727333, -0.09837374091148376, -0.09009656310081482, -0.08181938529014587, -0.07354220002889633, -0.06526502221822739, -0.056987836956977844, -0.0487106554210186, -0.04043347388505936, -0.032156288623809814, -0.02387910708785057, -0.015601925551891327, -0.0073247430846095085, 0.0009524393826723099, 0.009229622781276703, 0.017506804317235947, 0.02578398585319519, 0.03406117111444473, 0.042338352650403976, 0.05061553418636322, 0.058892715722322464, 0.06716989725828171, 0.07544708251953125, 0.0837242603302002, 0.09200144559144974, 0.10027863085269928, 0.10855580866336823, 0.11683299392461777, 0.1251101791858673, 0.13338735699653625, 0.1416645348072052, 0.14994172751903534, 0.15821890532970428, 0.16649609804153442, 0.17477327585220337, 0.18305045366287231]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 14.0, 28.0, 31.0, 43.0, 55.0, 67.0, 112.0, 182.0, 429.0, 1975.0, 229224.0, 3958835.0, 2248.0, 457.0, 206.0, 111.0, 87.0, 54.0, 43.0, 16.0, 29.0, 11.0, 9.0, 3.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08172607421875, -0.07939338684082031, -0.07706069946289062, -0.07472801208496094, -0.07239532470703125, -0.07006263732910156, -0.06772994995117188, -0.06539726257324219, -0.0630645751953125, -0.06073188781738281, -0.058399200439453125, -0.05606651306152344, -0.05373382568359375, -0.05140113830566406, -0.049068450927734375, -0.04673576354980469, -0.044403076171875, -0.04207038879394531, -0.039737701416015625, -0.03740501403808594, -0.03507232666015625, -0.03273963928222656, -0.030406951904296875, -0.028074264526367188, -0.0257415771484375, -0.023408889770507812, -0.021076202392578125, -0.018743515014648438, -0.01641082763671875, -0.014078140258789062, -0.011745452880859375, -0.009412765502929688, -0.007080078125, -0.0047473907470703125, -0.002414703369140625, -8.20159912109375e-05, 0.00225067138671875, 0.0045833587646484375, 0.006916046142578125, 0.009248733520507812, 0.0115814208984375, 0.013914108276367188, 0.016246795654296875, 0.018579483032226562, 0.02091217041015625, 0.023244857788085938, 0.025577545166015625, 0.027910232543945312, 0.030242919921875, 0.03257560729980469, 0.034908294677734375, 0.03724098205566406, 0.03957366943359375, 0.04190635681152344, 0.044239044189453125, 0.04657173156738281, 0.0489044189453125, 0.05123710632324219, 0.053569793701171875, 0.05590248107910156, 0.05823516845703125, 0.06056785583496094, 0.06290054321289062, 0.06523323059082031, 0.06756591796875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 4.0, 8.0, 14.0, 21.0, 19.0, 44.0, 39.0, 56.0, 62.0, 70.0, 71.0, 75.0, 82.0, 85.0, 72.0, 61.0, 50.0, 41.0, 25.0, 32.0, 11.0, 10.0, 12.0, 6.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213165283203125, -0.02068638801574707, -0.02005624771118164, -0.01942610740661621, -0.01879596710205078, -0.01816582679748535, -0.017535686492919922, -0.016905546188354492, -0.016275405883789062, -0.015645265579223633, -0.015015125274658203, -0.014384984970092773, -0.013754844665527344, -0.013124704360961914, -0.012494564056396484, -0.011864423751831055, -0.011234283447265625, -0.010604143142700195, -0.009974002838134766, -0.009343862533569336, -0.008713722229003906, -0.008083581924438477, -0.007453441619873047, -0.006823301315307617, -0.0061931610107421875, -0.005563020706176758, -0.004932880401611328, -0.0043027400970458984, -0.0036725997924804688, -0.003042459487915039, -0.0024123191833496094, -0.0017821788787841797, -0.00115203857421875, -0.0005218982696533203, 0.00010824203491210938, 0.0007383823394775391, 0.0013685226440429688, 0.0019986629486083984, 0.002628803253173828, 0.003258943557739258, 0.0038890838623046875, 0.004519224166870117, 0.005149364471435547, 0.0057795047760009766, 0.006409645080566406, 0.007039785385131836, 0.007669925689697266, 0.008300065994262695, 0.008930206298828125, 0.009560346603393555, 0.010190486907958984, 0.010820627212524414, 0.011450767517089844, 0.012080907821655273, 0.012711048126220703, 0.013341188430786133, 0.013971328735351562, 0.014601469039916992, 0.015231609344482422, 0.01586174964904785, 0.01649188995361328, 0.01712203025817871, 0.01775217056274414, 0.01838231086730957, 0.019012451171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 3.0, 10.0, 5.0, 12.0, 18.0, 29.0, 29.0, 38.0, 57.0, 54.0, 83.0, 98.0, 160.0, 230.0, 392.0, 752.0, 2036.0, 8744.0, 192843.0, 3968594.0, 15012.0, 2753.0, 976.0, 412.0, 268.0, 188.0, 119.0, 77.0, 60.0, 43.0, 41.0, 35.0, 29.0, 25.0, 15.0, 9.0, 6.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.025604248046875, -0.02478170394897461, -0.02395915985107422, -0.023136615753173828, -0.022314071655273438, -0.021491527557373047, -0.020668983459472656, -0.019846439361572266, -0.019023895263671875, -0.018201351165771484, -0.017378807067871094, -0.016556262969970703, -0.015733718872070312, -0.014911174774169922, -0.014088630676269531, -0.01326608657836914, -0.01244354248046875, -0.01162099838256836, -0.010798454284667969, -0.009975910186767578, -0.009153366088867188, -0.008330821990966797, -0.007508277893066406, -0.006685733795166016, -0.005863189697265625, -0.005040645599365234, -0.004218101501464844, -0.003395557403564453, -0.0025730133056640625, -0.0017504692077636719, -0.0009279251098632812, -0.00010538101196289062, 0.0007171630859375, 0.0015397071838378906, 0.0023622512817382812, 0.003184795379638672, 0.0040073394775390625, 0.004829883575439453, 0.005652427673339844, 0.006474971771240234, 0.007297515869140625, 0.008120059967041016, 0.008942604064941406, 0.009765148162841797, 0.010587692260742188, 0.011410236358642578, 0.012232780456542969, 0.01305532455444336, 0.01387786865234375, 0.01470041275024414, 0.015522956848144531, 0.016345500946044922, 0.017168045043945312, 0.017990589141845703, 0.018813133239746094, 0.019635677337646484, 0.020458221435546875, 0.021280765533447266, 0.022103309631347656, 0.022925853729248047, 0.023748397827148438, 0.024570941925048828, 0.02539348602294922, 0.02621603012084961, 0.02703857421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 22.0, 50.0, 219.0, 3615.0, 110.0, 25.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006000518798828125, -0.0057433247566223145, -0.005486130714416504, -0.005228936672210693, -0.004971742630004883, -0.004714548587799072, -0.004457354545593262, -0.004200160503387451, -0.003942966461181641, -0.00368577241897583, -0.0034285783767700195, -0.003171384334564209, -0.0029141902923583984, -0.002656996250152588, -0.0023998022079467773, -0.002142608165740967, -0.0018854141235351562, -0.0016282200813293457, -0.0013710260391235352, -0.0011138319969177246, -0.0008566379547119141, -0.0005994439125061035, -0.00034224987030029297, -8.505582809448242e-05, 0.00017213821411132812, 0.00042933225631713867, 0.0006865262985229492, 0.0009437203407287598, 0.0012009143829345703, 0.0014581084251403809, 0.0017153024673461914, 0.001972496509552002, 0.0022296905517578125, 0.002486884593963623, 0.0027440786361694336, 0.003001272678375244, 0.0032584667205810547, 0.0035156607627868652, 0.0037728548049926758, 0.004030048847198486, 0.004287242889404297, 0.004544436931610107, 0.004801630973815918, 0.0050588250160217285, 0.005316019058227539, 0.00557321310043335, 0.00583040714263916, 0.006087601184844971, 0.006344795227050781, 0.006601989269256592, 0.006859183311462402, 0.007116377353668213, 0.0073735713958740234, 0.007630765438079834, 0.007887959480285645, 0.008145153522491455, 0.008402347564697266, 0.008659541606903076, 0.008916735649108887, 0.009173929691314697, 0.009431123733520508, 0.009688317775726318, 0.009945511817932129, 0.01020270586013794, 0.01045989990234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 17.0, 29.0, 168.0, 386.0, 278.0, 86.0, 22.0, 11.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.08268772065639496, -0.08115063607692719, -0.07961354404687881, -0.07807645946741104, -0.07653936743736267, -0.0750022828578949, -0.07346519827842712, -0.07192810624837875, -0.07039102166891098, -0.0688539370894432, -0.06731684505939484, -0.06577976047992706, -0.06424266844987869, -0.06270558387041092, -0.06116849556565285, -0.059631407260894775, -0.058094315230846405, -0.05655722692608833, -0.05502013862133026, -0.05348305404186249, -0.051945965737104416, -0.050408877432346344, -0.04887178912758827, -0.0473347008228302, -0.04579761624336243, -0.044260527938604355, -0.04272343963384628, -0.04118635505437851, -0.03964926674962044, -0.038112178444862366, -0.036575090140104294, -0.03503800183534622, -0.03350091353058815, -0.03196382522583008, -0.030426738783717155, -0.028889650478959084, -0.02735256217420101, -0.02581547573208809, -0.024278387427330017, -0.022741299122571945, -0.021204210817813873, -0.0196671225130558, -0.01813003607094288, -0.016592947766184807, -0.015055859461426735, -0.013518772087991238, -0.01198168471455574, -0.010444596409797668, -0.008907509967684746, -0.007370422128587961, -0.005833334289491177, -0.004296246916055679, -0.0027591590769588947, -0.0012220712378621101, 0.00031501613557338715, 0.001852104440331459, 0.0033891918137669563, 0.004926279652863741, 0.0064633674919605255, 0.008000454865396023, 0.00953754223883152, 0.011074630543589592, 0.01261171791702509, 0.014148806221783161, 0.01568589359521866]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 10.0, 13.0, 12.0, 23.0, 19.0, 25.0, 21.0, 31.0, 44.0, 31.0, 32.0, 47.0, 54.0, 59.0, 36.0, 50.0, 48.0, 53.0, 48.0, 43.0, 38.0, 28.0, 42.0, 26.0, 20.0, 23.0, 18.0, 16.0, 15.0, 16.0, 9.0, 6.0, 5.0, 5.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00836944580078125, -0.00805980060249567, -0.007750155404210091, -0.007440510205924511, -0.007130865007638931, -0.006821219809353352, -0.006511574611067772, -0.006201929412782192, -0.0058922842144966125, -0.005582639016211033, -0.005272993817925453, -0.0049633486196398735, -0.004653703421354294, -0.004344058223068714, -0.0040344130247831345, -0.0037247678264975548, -0.003415122628211975, -0.0031054774299263954, -0.0027958322316408157, -0.002486187033355236, -0.0021765418350696564, -0.0018668966367840767, -0.001557251438498497, -0.0012476062402129173, -0.0009379610419273376, -0.000628315843641758, -0.0003186706453561783, -9.025447070598602e-06, 0.0003006197512149811, 0.0006102649495005608, 0.0009199101477861404, 0.0012295553460717201, 0.0015392005443572998, 0.0018488457426428795, 0.002158490940928459, 0.002468136139214039, 0.0027777813374996185, 0.003087426535785198, 0.003397071734070778, 0.0037067169323563576, 0.004016362130641937, 0.004326007328927517, 0.004635652527213097, 0.004945297725498676, 0.005254942923784256, 0.005564588122069836, 0.005874233320355415, 0.006183878518640995, 0.006493523716926575, 0.006803168915212154, 0.007112814113497734, 0.007422459311783314, 0.007732104510068893, 0.008041749708354473, 0.008351394906640053, 0.008661040104925632, 0.008970685303211212, 0.009280330501496792, 0.009589975699782372, 0.009899620898067951, 0.010209266096353531, 0.01051891129463911, 0.01082855649292469, 0.01113820169121027, 0.01144784688949585]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 1.0, 12.0, 11.0, 22.0, 44.0, 44.0, 80.0, 137.0, 282.0, 454.0, 911.0, 1822.0, 4261.0, 11260.0, 34344.0, 116819.0, 336060.0, 354587.0, 128848.0, 37602.0, 12302.0, 4552.0, 2056.0, 941.0, 457.0, 261.0, 151.0, 78.0, 54.0, 38.0, 17.0, 18.0, 11.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.015289306640625, -0.014796733856201172, -0.014304161071777344, -0.013811588287353516, -0.013319015502929688, -0.01282644271850586, -0.012333869934082031, -0.011841297149658203, -0.011348724365234375, -0.010856151580810547, -0.010363578796386719, -0.00987100601196289, -0.009378433227539062, -0.008885860443115234, -0.008393287658691406, -0.007900714874267578, -0.00740814208984375, -0.006915569305419922, -0.006422996520996094, -0.005930423736572266, -0.0054378509521484375, -0.004945278167724609, -0.004452705383300781, -0.003960132598876953, -0.003467559814453125, -0.002974987030029297, -0.0024824142456054688, -0.0019898414611816406, -0.0014972686767578125, -0.0010046958923339844, -0.0005121231079101562, -1.9550323486328125e-05, 0.0004730224609375, 0.0009655952453613281, 0.0014581680297851562, 0.0019507408142089844, 0.0024433135986328125, 0.0029358863830566406, 0.0034284591674804688, 0.003921031951904297, 0.004413604736328125, 0.004906177520751953, 0.005398750305175781, 0.005891323089599609, 0.0063838958740234375, 0.006876468658447266, 0.007369041442871094, 0.007861614227294922, 0.00835418701171875, 0.008846759796142578, 0.009339332580566406, 0.009831905364990234, 0.010324478149414062, 0.01081705093383789, 0.011309623718261719, 0.011802196502685547, 0.012294769287109375, 0.012787342071533203, 0.013279914855957031, 0.01377248764038086, 0.014265060424804688, 0.014757633209228516, 0.015250205993652344, 0.015742778778076172, 0.0162353515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 12.0, 14.0, 26.0, 29.0, 34.0, 50.0, 52.0, 76.0, 72.0, 69.0, 72.0, 92.0, 81.0, 66.0, 57.0, 41.0, 39.0, 30.0, 23.0, 10.0, 13.0, 3.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211334228515625, -0.02050161361694336, -0.01986980438232422, -0.019237995147705078, -0.018606185913085938, -0.017974376678466797, -0.017342567443847656, -0.016710758209228516, -0.016078948974609375, -0.015447139739990234, -0.014815330505371094, -0.014183521270751953, -0.013551712036132812, -0.012919902801513672, -0.012288093566894531, -0.01165628433227539, -0.01102447509765625, -0.01039266586303711, -0.009760856628417969, -0.009129047393798828, -0.008497238159179688, -0.007865428924560547, -0.007233619689941406, -0.006601810455322266, -0.005970001220703125, -0.005338191986083984, -0.004706382751464844, -0.004074573516845703, -0.0034427642822265625, -0.002810955047607422, -0.0021791458129882812, -0.0015473365783691406, -0.00091552734375, -0.0002837181091308594, 0.00034809112548828125, 0.0009799003601074219, 0.0016117095947265625, 0.002243518829345703, 0.0028753280639648438, 0.0035071372985839844, 0.004138946533203125, 0.004770755767822266, 0.005402565002441406, 0.006034374237060547, 0.0066661834716796875, 0.007297992706298828, 0.007929801940917969, 0.00856161117553711, 0.00919342041015625, 0.00982522964477539, 0.010457038879394531, 0.011088848114013672, 0.011720657348632812, 0.012352466583251953, 0.012984275817871094, 0.013616085052490234, 0.014247894287109375, 0.014879703521728516, 0.015511512756347656, 0.016143321990966797, 0.016775131225585938, 0.017406940460205078, 0.01803874969482422, 0.01867055892944336, 0.0193023681640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 7.0, 15.0, 13.0, 26.0, 25.0, 36.0, 31.0, 45.0, 75.0, 96.0, 145.0, 216.0, 324.0, 575.0, 1040.0, 2083.0, 4825.0, 16092.0, 102655.0, 645570.0, 232614.0, 29080.0, 6975.0, 2699.0, 1333.0, 697.0, 406.0, 218.0, 162.0, 123.0, 84.0, 63.0, 49.0, 38.0, 19.0, 23.0, 17.0, 10.0, 5.0, 11.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.0223388671875, -0.02165532112121582, -0.02097177505493164, -0.02028822898864746, -0.01960468292236328, -0.0189211368560791, -0.018237590789794922, -0.017554044723510742, -0.016870498657226562, -0.016186952590942383, -0.015503406524658203, -0.014819860458374023, -0.014136314392089844, -0.013452768325805664, -0.012769222259521484, -0.012085676193237305, -0.011402130126953125, -0.010718584060668945, -0.010035037994384766, -0.009351491928100586, -0.008667945861816406, -0.007984399795532227, -0.007300853729248047, -0.006617307662963867, -0.0059337615966796875, -0.005250215530395508, -0.004566669464111328, -0.0038831233978271484, -0.0031995773315429688, -0.002516031265258789, -0.0018324851989746094, -0.0011489391326904297, -0.00046539306640625, 0.0002181529998779297, 0.0009016990661621094, 0.001585245132446289, 0.0022687911987304688, 0.0029523372650146484, 0.003635883331298828, 0.004319429397583008, 0.0050029754638671875, 0.005686521530151367, 0.006370067596435547, 0.0070536136627197266, 0.007737159729003906, 0.008420705795288086, 0.009104251861572266, 0.009787797927856445, 0.010471343994140625, 0.011154890060424805, 0.011838436126708984, 0.012521982192993164, 0.013205528259277344, 0.013889074325561523, 0.014572620391845703, 0.015256166458129883, 0.015939712524414062, 0.016623258590698242, 0.017306804656982422, 0.0179903507232666, 0.01867389678955078, 0.01935744285583496, 0.02004098892211914, 0.02072453498840332, 0.0214080810546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 11.0, 7.0, 16.0, 14.0, 17.0, 29.0, 21.0, 40.0, 32.0, 39.0, 43.0, 40.0, 62.0, 65.0, 49.0, 44.0, 53.0, 60.0, 47.0, 56.0, 41.0, 38.0, 26.0, 22.0, 28.0, 16.0, 18.0, 11.0, 12.0, 7.0, 10.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055084228515625, -0.053281307220458984, -0.05147838592529297, -0.04967546463012695, -0.04787254333496094, -0.04606962203979492, -0.044266700744628906, -0.04246377944946289, -0.040660858154296875, -0.03885793685913086, -0.037055015563964844, -0.03525209426879883, -0.03344917297363281, -0.0316462516784668, -0.02984333038330078, -0.028040409088134766, -0.02623748779296875, -0.024434566497802734, -0.02263164520263672, -0.020828723907470703, -0.019025802612304688, -0.017222881317138672, -0.015419960021972656, -0.01361703872680664, -0.011814117431640625, -0.01001119613647461, -0.008208274841308594, -0.006405353546142578, -0.0046024322509765625, -0.002799510955810547, -0.0009965896606445312, 0.0008063316345214844, 0.0026092529296875, 0.004412174224853516, 0.006215095520019531, 0.008018016815185547, 0.009820938110351562, 0.011623859405517578, 0.013426780700683594, 0.01522970199584961, 0.017032623291015625, 0.01883554458618164, 0.020638465881347656, 0.022441387176513672, 0.024244308471679688, 0.026047229766845703, 0.02785015106201172, 0.029653072357177734, 0.03145599365234375, 0.033258914947509766, 0.03506183624267578, 0.0368647575378418, 0.03866767883300781, 0.04047060012817383, 0.042273521423339844, 0.04407644271850586, 0.045879364013671875, 0.04768228530883789, 0.049485206604003906, 0.05128812789916992, 0.05309104919433594, 0.05489397048950195, 0.05669689178466797, 0.058499813079833984, 0.060302734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 3.0, 4.0, 10.0, 12.0, 16.0, 16.0, 22.0, 35.0, 72.0, 87.0, 168.0, 353.0, 857.0, 2637.0, 12928.0, 956717.0, 66895.0, 5024.0, 1455.0, 563.0, 284.0, 120.0, 90.0, 56.0, 42.0, 20.0, 17.0, 14.0, 5.0, 7.0, 3.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0258636474609375, -0.02493119239807129, -0.023998737335205078, -0.023066282272338867, -0.022133827209472656, -0.021201372146606445, -0.020268917083740234, -0.019336462020874023, -0.018404006958007812, -0.0174715518951416, -0.01653909683227539, -0.01560664176940918, -0.014674186706542969, -0.013741731643676758, -0.012809276580810547, -0.011876821517944336, -0.010944366455078125, -0.010011911392211914, -0.009079456329345703, -0.008147001266479492, -0.007214546203613281, -0.00628209114074707, -0.005349636077880859, -0.0044171810150146484, -0.0034847259521484375, -0.0025522708892822266, -0.0016198158264160156, -0.0006873607635498047, 0.00024509429931640625, 0.0011775493621826172, 0.002110004425048828, 0.003042459487915039, 0.00397491455078125, 0.004907369613647461, 0.005839824676513672, 0.006772279739379883, 0.007704734802246094, 0.008637189865112305, 0.009569644927978516, 0.010502099990844727, 0.011434555053710938, 0.012367010116577148, 0.01329946517944336, 0.01423192024230957, 0.015164375305175781, 0.016096830368041992, 0.017029285430908203, 0.017961740493774414, 0.018894195556640625, 0.019826650619506836, 0.020759105682373047, 0.021691560745239258, 0.02262401580810547, 0.02355647087097168, 0.02448892593383789, 0.0254213809967041, 0.026353836059570312, 0.027286291122436523, 0.028218746185302734, 0.029151201248168945, 0.030083656311035156, 0.031016111373901367, 0.03194856643676758, 0.03288102149963379, 0.0338134765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 7.0, 4.0, 5.0, 14.0, 6.0, 10.0, 15.0, 24.0, 32.0, 38.0, 41.0, 46.0, 65.0, 74.0, 88.0, 87.0, 92.0, 61.0, 55.0, 35.0, 34.0, 28.0, 17.0, 13.0, 15.0, 13.0, 10.0, 11.0, 5.0, 9.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0], "bins": [-3.415346145629883e-05, -3.3204443752765656e-05, -3.225542604923248e-05, -3.130640834569931e-05, -3.0357390642166138e-05, -2.9408372938632965e-05, -2.8459355235099792e-05, -2.751033753156662e-05, -2.6561319828033447e-05, -2.5612302124500275e-05, -2.4663284420967102e-05, -2.371426671743393e-05, -2.2765249013900757e-05, -2.1816231310367584e-05, -2.086721360683441e-05, -1.991819590330124e-05, -1.8969178199768066e-05, -1.8020160496234894e-05, -1.707114279270172e-05, -1.612212508916855e-05, -1.5173107385635376e-05, -1.4224089682102203e-05, -1.327507197856903e-05, -1.2326054275035858e-05, -1.1377036571502686e-05, -1.0428018867969513e-05, -9.47900116443634e-06, -8.529983460903168e-06, -7.580965757369995e-06, -6.6319480538368225e-06, -5.68293035030365e-06, -4.733912646770477e-06, -3.7848949432373047e-06, -2.835877239704132e-06, -1.8868595361709595e-06, -9.378418326377869e-07, 1.1175870895385742e-08, 9.601935744285583e-07, 1.909211277961731e-06, 2.8582289814949036e-06, 3.807246685028076e-06, 4.756264388561249e-06, 5.705282092094421e-06, 6.654299795627594e-06, 7.603317499160767e-06, 8.55233520269394e-06, 9.501352906227112e-06, 1.0450370609760284e-05, 1.1399388313293457e-05, 1.234840601682663e-05, 1.3297423720359802e-05, 1.4246441423892975e-05, 1.5195459127426147e-05, 1.614447683095932e-05, 1.7093494534492493e-05, 1.8042512238025665e-05, 1.8991529941558838e-05, 1.994054764509201e-05, 2.0889565348625183e-05, 2.1838583052158356e-05, 2.278760075569153e-05, 2.37366184592247e-05, 2.4685636162757874e-05, 2.5634653866291046e-05, 2.658367156982422e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 9.0, 12.0, 8.0, 16.0, 20.0, 25.0, 38.0, 44.0, 76.0, 119.0, 199.0, 322.0, 537.0, 1029.0, 2171.0, 5521.0, 29212.0, 896666.0, 97984.0, 8549.0, 2874.0, 1321.0, 715.0, 400.0, 243.0, 152.0, 79.0, 56.0, 41.0, 23.0, 21.0, 19.0, 10.0, 5.0, 2.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01690673828125, -0.016317129135131836, -0.015727519989013672, -0.015137910842895508, -0.014548301696777344, -0.01395869255065918, -0.013369083404541016, -0.012779474258422852, -0.012189865112304688, -0.011600255966186523, -0.01101064682006836, -0.010421037673950195, -0.009831428527832031, -0.009241819381713867, -0.008652210235595703, -0.008062601089477539, -0.007472991943359375, -0.006883382797241211, -0.006293773651123047, -0.005704164505004883, -0.005114555358886719, -0.004524946212768555, -0.003935337066650391, -0.0033457279205322266, -0.0027561187744140625, -0.0021665096282958984, -0.0015769004821777344, -0.0009872913360595703, -0.00039768218994140625, 0.0001919269561767578, 0.0007815361022949219, 0.001371145248413086, 0.00196075439453125, 0.002550363540649414, 0.003139972686767578, 0.003729581832885742, 0.004319190979003906, 0.00490880012512207, 0.005498409271240234, 0.0060880184173583984, 0.0066776275634765625, 0.0072672367095947266, 0.00785684585571289, 0.008446455001831055, 0.009036064147949219, 0.009625673294067383, 0.010215282440185547, 0.010804891586303711, 0.011394500732421875, 0.011984109878540039, 0.012573719024658203, 0.013163328170776367, 0.013752937316894531, 0.014342546463012695, 0.01493215560913086, 0.015521764755249023, 0.016111373901367188, 0.01670098304748535, 0.017290592193603516, 0.01788020133972168, 0.018469810485839844, 0.019059419631958008, 0.019649028778076172, 0.020238637924194336, 0.0208282470703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 21.0, 43.0, 70.0, 159.0, 199.0, 190.0, 117.0, 55.0, 42.0, 15.0, 15.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.029052734375, -0.028322696685791016, -0.02759265899658203, -0.026862621307373047, -0.026132583618164062, -0.025402545928955078, -0.024672508239746094, -0.02394247055053711, -0.023212432861328125, -0.02248239517211914, -0.021752357482910156, -0.021022319793701172, -0.020292282104492188, -0.019562244415283203, -0.01883220672607422, -0.018102169036865234, -0.01737213134765625, -0.016642093658447266, -0.01591205596923828, -0.015182018280029297, -0.014451980590820312, -0.013721942901611328, -0.012991905212402344, -0.01226186752319336, -0.011531829833984375, -0.01080179214477539, -0.010071754455566406, -0.009341716766357422, -0.008611679077148438, -0.007881641387939453, -0.007151603698730469, -0.006421566009521484, -0.0056915283203125, -0.004961490631103516, -0.004231452941894531, -0.003501415252685547, -0.0027713775634765625, -0.002041339874267578, -0.0013113021850585938, -0.0005812644958496094, 0.000148773193359375, 0.0008788108825683594, 0.0016088485717773438, 0.002338886260986328, 0.0030689239501953125, 0.003798961639404297, 0.004528999328613281, 0.005259037017822266, 0.00598907470703125, 0.006719112396240234, 0.007449150085449219, 0.008179187774658203, 0.008909225463867188, 0.009639263153076172, 0.010369300842285156, 0.01109933853149414, 0.011829376220703125, 0.01255941390991211, 0.013289451599121094, 0.014019489288330078, 0.014749526977539062, 0.015479564666748047, 0.01620960235595703, 0.016939640045166016, 0.017669677734375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 8.0, 25.0, 87.0, 199.0, 301.0, 245.0, 80.0, 34.0, 17.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33140426874160767, -0.3185504376888275, -0.30569660663604736, -0.2928428053855896, -0.27998897433280945, -0.2671351432800293, -0.25428131222724915, -0.241427481174469, -0.22857366502285004, -0.21571983397006989, -0.20286601781845093, -0.19001218676567078, -0.17715835571289062, -0.16430453956127167, -0.15145070850849152, -0.13859689235687256, -0.1257430613040924, -0.11288923770189285, -0.1000354140996933, -0.08718158304691315, -0.07432775944471359, -0.06147393584251404, -0.04862010478973389, -0.03576628118753433, -0.022912457585334778, -0.010058632120490074, 0.0027951933443546295, 0.015649020671844482, 0.028502844274044037, 0.04135666787624359, 0.05421049892902374, 0.0670643225312233, 0.07991817593574524, 0.0927719995379448, 0.10562582314014435, 0.1184796541929245, 0.13133347034454346, 0.1441873013973236, 0.15704113245010376, 0.1698949635028839, 0.18274877965450287, 0.19560261070728302, 0.20845642685890198, 0.22131025791168213, 0.23416408896446228, 0.24701790511608124, 0.2598717212677002, 0.27272555232048035, 0.2855793833732605, 0.29843321442604065, 0.3112870454788208, 0.32414084672927856, 0.3369946777820587, 0.34984850883483887, 0.362702339887619, 0.37555617094039917, 0.38840997219085693, 0.4012638032436371, 0.41411763429641724, 0.426971435546875, 0.43982526659965515, 0.4526790976524353, 0.46553292870521545, 0.4783867597579956, 0.49124059081077576]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 2.0, 5.0, 7.0, 16.0, 7.0, 12.0, 17.0, 12.0, 21.0, 19.0, 30.0, 36.0, 32.0, 37.0, 41.0, 39.0, 41.0, 48.0, 38.0, 43.0, 40.0, 42.0, 52.0, 46.0, 30.0, 27.0, 27.0, 33.0, 24.0, 25.0, 22.0, 20.0, 12.0, 16.0, 12.0, 16.0, 15.0, 7.0, 3.0, 6.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.22798937559127808, -0.22182203829288483, -0.21565470099449158, -0.20948734879493713, -0.20332001149654388, -0.19715267419815063, -0.1909853219985962, -0.18481798470020294, -0.1786506474018097, -0.17248331010341644, -0.1663159728050232, -0.16014862060546875, -0.1539812833070755, -0.14781394600868225, -0.1416465938091278, -0.13547925651073456, -0.1293119192123413, -0.12314458191394806, -0.11697723716497421, -0.11080989241600037, -0.10464255511760712, -0.09847521781921387, -0.09230787307024002, -0.08614052832126617, -0.07997319102287292, -0.07380585372447968, -0.06763850897550583, -0.06147116795182228, -0.05530382692813873, -0.049136485904455185, -0.04296914488077164, -0.03680180385708809, -0.03063446283340454, -0.024467121809720993, -0.018299780786037445, -0.012132439762353897, -0.005965098738670349, 0.00020224228501319885, 0.006369583308696747, 0.012536924332380295, 0.018704265356063843, 0.02487160637974739, 0.03103894740343094, 0.03720628842711449, 0.043373629450798035, 0.04954097047448158, 0.05570831149816513, 0.06187565252184868, 0.06804299354553223, 0.07421033084392548, 0.08037767559289932, 0.08654502034187317, 0.09271235764026642, 0.09887969493865967, 0.10504703968763351, 0.11121438443660736, 0.11738172173500061, 0.12354905903339386, 0.1297163963317871, 0.13588374853134155, 0.1420510858297348, 0.14821842312812805, 0.1543857753276825, 0.16055311262607574, 0.166720449924469]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 5.0, 5.0, 20.0, 20.0, 39.0, 64.0, 68.0, 101.0, 167.0, 272.0, 511.0, 939.0, 2105.0, 5938.0, 32111.0, 3998030.0, 136628.0, 11089.0, 3199.0, 1308.0, 634.0, 343.0, 247.0, 142.0, 87.0, 59.0, 44.0, 33.0, 19.0, 7.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0267486572265625, -0.025878190994262695, -0.02500772476196289, -0.024137258529663086, -0.02326679229736328, -0.022396326065063477, -0.021525859832763672, -0.020655393600463867, -0.019784927368164062, -0.018914461135864258, -0.018043994903564453, -0.01717352867126465, -0.016303062438964844, -0.015432596206665039, -0.014562129974365234, -0.01369166374206543, -0.012821197509765625, -0.01195073127746582, -0.011080265045166016, -0.010209798812866211, -0.009339332580566406, -0.008468866348266602, -0.007598400115966797, -0.006727933883666992, -0.0058574676513671875, -0.004987001419067383, -0.004116535186767578, -0.0032460689544677734, -0.0023756027221679688, -0.001505136489868164, -0.0006346702575683594, 0.0002357959747314453, 0.00110626220703125, 0.0019767284393310547, 0.0028471946716308594, 0.003717660903930664, 0.004588127136230469, 0.0054585933685302734, 0.006329059600830078, 0.007199525833129883, 0.008069992065429688, 0.008940458297729492, 0.009810924530029297, 0.010681390762329102, 0.011551856994628906, 0.012422323226928711, 0.013292789459228516, 0.01416325569152832, 0.015033721923828125, 0.01590418815612793, 0.016774654388427734, 0.01764512062072754, 0.018515586853027344, 0.01938605308532715, 0.020256519317626953, 0.021126985549926758, 0.021997451782226562, 0.022867918014526367, 0.023738384246826172, 0.024608850479125977, 0.02547931671142578, 0.026349782943725586, 0.02722024917602539, 0.028090715408325195, 0.028961181640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 12.0, 18.0, 29.0, 27.0, 48.0, 47.0, 50.0, 79.0, 79.0, 74.0, 100.0, 92.0, 84.0, 61.0, 40.0, 41.0, 33.0, 23.0, 9.0, 11.0, 5.0, 2.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0227203369140625, -0.022068023681640625, -0.02141571044921875, -0.020763397216796875, -0.020111083984375, -0.019458770751953125, -0.01880645751953125, -0.018154144287109375, -0.0175018310546875, -0.016849517822265625, -0.01619720458984375, -0.015544891357421875, -0.014892578125, -0.014240264892578125, -0.01358795166015625, -0.012935638427734375, -0.0122833251953125, -0.011631011962890625, -0.01097869873046875, -0.010326385498046875, -0.009674072265625, -0.009021759033203125, -0.00836944580078125, -0.007717132568359375, -0.0070648193359375, -0.006412506103515625, -0.00576019287109375, -0.005107879638671875, -0.00445556640625, -0.003803253173828125, -0.00315093994140625, -0.002498626708984375, -0.0018463134765625, -0.001194000244140625, -0.00054168701171875, 0.000110626220703125, 0.000762939453125, 0.001415252685546875, 0.00206756591796875, 0.002719879150390625, 0.0033721923828125, 0.004024505615234375, 0.00467681884765625, 0.005329132080078125, 0.0059814453125, 0.006633758544921875, 0.00728607177734375, 0.007938385009765625, 0.0085906982421875, 0.009243011474609375, 0.00989532470703125, 0.010547637939453125, 0.011199951171875, 0.011852264404296875, 0.01250457763671875, 0.013156890869140625, 0.0138092041015625, 0.014461517333984375, 0.01511383056640625, 0.015766143798828125, 0.01641845703125, 0.017070770263671875, 0.01772308349609375, 0.018375396728515625, 0.0190277099609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 21.0, 23.0, 40.0, 65.0, 73.0, 110.0, 142.0, 203.0, 210.0, 294.0, 487.0, 1328.0, 32793.0, 4153126.0, 3163.0, 716.0, 434.0, 273.0, 210.0, 150.0, 116.0, 74.0, 72.0, 55.0, 26.0, 27.0, 17.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11514568328857422, -0.11133384704589844, -0.10752201080322266, -0.10371017456054688, -0.0998983383178711, -0.09608650207519531, -0.09227466583251953, -0.08846282958984375, -0.08465099334716797, -0.08083915710449219, -0.0770273208618164, -0.07321548461914062, -0.06940364837646484, -0.06559181213378906, -0.06177997589111328, -0.0579681396484375, -0.05415630340576172, -0.05034446716308594, -0.046532630920410156, -0.042720794677734375, -0.038908958435058594, -0.03509712219238281, -0.03128528594970703, -0.02747344970703125, -0.02366161346435547, -0.019849777221679688, -0.016037940979003906, -0.012226104736328125, -0.008414268493652344, -0.0046024322509765625, -0.0007905960083007812, 0.003021240234375, 0.006833076477050781, 0.010644912719726562, 0.014456748962402344, 0.018268585205078125, 0.022080421447753906, 0.025892257690429688, 0.02970409393310547, 0.03351593017578125, 0.03732776641845703, 0.04113960266113281, 0.044951438903808594, 0.048763275146484375, 0.052575111389160156, 0.05638694763183594, 0.06019878387451172, 0.0640106201171875, 0.06782245635986328, 0.07163429260253906, 0.07544612884521484, 0.07925796508789062, 0.0830698013305664, 0.08688163757324219, 0.09069347381591797, 0.09450531005859375, 0.09831714630126953, 0.10212898254394531, 0.1059408187866211, 0.10975265502929688, 0.11356449127197266, 0.11737632751464844, 0.12118816375732422, 0.125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 15.0, 359.0, 3670.0, 25.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046875, -0.04465484619140625, -0.0424346923828125, -0.04021453857421875, -0.037994384765625, -0.03577423095703125, -0.0335540771484375, -0.03133392333984375, -0.02911376953125, -0.02689361572265625, -0.0246734619140625, -0.02245330810546875, -0.020233154296875, -0.01801300048828125, -0.0157928466796875, -0.01357269287109375, -0.0113525390625, -0.00913238525390625, -0.0069122314453125, -0.00469207763671875, -0.002471923828125, -0.00025177001953125, 0.0019683837890625, 0.00418853759765625, 0.00640869140625, 0.00862884521484375, 0.0108489990234375, 0.01306915283203125, 0.015289306640625, 0.01750946044921875, 0.0197296142578125, 0.02194976806640625, 0.024169921875, 0.02639007568359375, 0.0286102294921875, 0.03083038330078125, 0.033050537109375, 0.03527069091796875, 0.0374908447265625, 0.03971099853515625, 0.04193115234375, 0.04415130615234375, 0.0463714599609375, 0.04859161376953125, 0.050811767578125, 0.05303192138671875, 0.0552520751953125, 0.05747222900390625, 0.0596923828125, 0.06191253662109375, 0.0641326904296875, 0.06635284423828125, 0.068572998046875, 0.07079315185546875, 0.0730133056640625, 0.07523345947265625, 0.07745361328125, 0.07967376708984375, 0.0818939208984375, 0.08411407470703125, 0.086334228515625, 0.08855438232421875, 0.0907745361328125, 0.09299468994140625, 0.09521484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 12.0, 29.0, 109.0, 359.0, 375.0, 96.0, 23.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15574894845485687, -0.1479724645614624, -0.14019599556922913, -0.13241951167583466, -0.12464303523302078, -0.11686655879020691, -0.10909007489681244, -0.10131359845399857, -0.09353712201118469, -0.08576064556837082, -0.07798416912555695, -0.07020768523216248, -0.0624312087893486, -0.05465473234653473, -0.04687825217843056, -0.039101772010326385, -0.03132529556751251, -0.02354881726205349, -0.015772338956594467, -0.007995860651135445, -0.00021938234567642212, 0.007557094097137451, 0.015333574265241623, 0.023110054433345795, 0.030886530876159668, 0.03866300731897354, 0.04643948748707771, 0.054215967655181885, 0.06199244409799576, 0.06976892054080963, 0.0775454044342041, 0.08532188087701797, 0.09309834241867065, 0.10087481886148453, 0.1086512953042984, 0.11642777919769287, 0.12420425564050674, 0.13198073208332062, 0.1397572159767151, 0.14753368496894836, 0.15531016886234283, 0.1630866527557373, 0.17086312174797058, 0.17863960564136505, 0.18641608953475952, 0.1941925585269928, 0.20196904242038727, 0.20974552631378174, 0.21752199530601501, 0.22529847919940948, 0.23307494819164276, 0.24085143208503723, 0.2486279010772705, 0.25640439987182617, 0.26418086886405945, 0.2719573378562927, 0.2797338366508484, 0.28751030564308167, 0.29528680443763733, 0.3030632734298706, 0.3108397424221039, 0.31861621141433716, 0.3263927102088928, 0.3341691792011261, 0.3419456481933594]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 6.0, 5.0, 13.0, 18.0, 23.0, 31.0, 40.0, 50.0, 77.0, 112.0, 118.0, 101.0, 103.0, 79.0, 72.0, 59.0, 28.0, 24.0, 19.0, 10.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15625214576721191, -0.15150687098503113, -0.14676161110401154, -0.14201635122299194, -0.13727107644081116, -0.13252580165863037, -0.12778054177761078, -0.12303527444601059, -0.1182900071144104, -0.11354473978281021, -0.10879947245121002, -0.10405420511960983, -0.09930893778800964, -0.09456367045640945, -0.08981840312480927, -0.08507313579320908, -0.08032786846160889, -0.0755826011300087, -0.07083733379840851, -0.06609206646680832, -0.06134679913520813, -0.05660153180360794, -0.05185626447200775, -0.04711099714040756, -0.04236572980880737, -0.037620462477207184, -0.032875195145606995, -0.028129927814006805, -0.023384660482406616, -0.018639393150806427, -0.013894125819206238, -0.009148858487606049, -0.004403591156005859, 0.00034167617559432983, 0.005086943507194519, 0.009832210838794708, 0.014577478170394897, 0.019322745501995087, 0.024068012833595276, 0.028813280165195465, 0.033558547496795654, 0.038303814828395844, 0.04304908215999603, 0.04779434949159622, 0.05253961682319641, 0.0572848841547966, 0.06203015148639679, 0.06677541881799698, 0.07152068614959717, 0.07626595348119736, 0.08101122081279755, 0.08575648814439774, 0.09050175547599792, 0.09524702280759811, 0.0999922901391983, 0.10473755747079849, 0.10948282480239868, 0.11422809213399887, 0.11897335946559906, 0.12371862679719925, 0.12846389412879944, 0.13320916891098022, 0.13795442879199982, 0.1426996886730194, 0.1474449634552002]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 20.0, 21.0, 24.0, 72.0, 104.0, 195.0, 418.0, 1136.0, 3616.0, 14175.0, 75503.0, 485147.0, 394254.0, 57793.0, 11268.0, 2979.0, 1030.0, 397.0, 169.0, 94.0, 45.0, 27.0, 21.0, 16.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02947998046875, -0.028526782989501953, -0.027573585510253906, -0.02662038803100586, -0.025667190551757812, -0.024713993072509766, -0.02376079559326172, -0.022807598114013672, -0.021854400634765625, -0.020901203155517578, -0.01994800567626953, -0.018994808197021484, -0.018041610717773438, -0.01708841323852539, -0.016135215759277344, -0.015182018280029297, -0.01422882080078125, -0.013275623321533203, -0.012322425842285156, -0.01136922836303711, -0.010416030883789062, -0.009462833404541016, -0.008509635925292969, -0.007556438446044922, -0.006603240966796875, -0.005650043487548828, -0.004696846008300781, -0.0037436485290527344, -0.0027904510498046875, -0.0018372535705566406, -0.0008840560913085938, 6.914138793945312e-05, 0.0010223388671875, 0.001975536346435547, 0.0029287338256835938, 0.0038819313049316406, 0.0048351287841796875, 0.005788326263427734, 0.006741523742675781, 0.007694721221923828, 0.008647918701171875, 0.009601116180419922, 0.010554313659667969, 0.011507511138916016, 0.012460708618164062, 0.01341390609741211, 0.014367103576660156, 0.015320301055908203, 0.01627349853515625, 0.017226696014404297, 0.018179893493652344, 0.01913309097290039, 0.020086288452148438, 0.021039485931396484, 0.02199268341064453, 0.022945880889892578, 0.023899078369140625, 0.024852275848388672, 0.02580547332763672, 0.026758670806884766, 0.027711868286132812, 0.02866506576538086, 0.029618263244628906, 0.030571460723876953, 0.031524658203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 4.0, 4.0, 8.0, 12.0, 21.0, 21.0, 31.0, 47.0, 49.0, 67.0, 64.0, 89.0, 82.0, 81.0, 76.0, 73.0, 62.0, 42.0, 43.0, 33.0, 28.0, 12.0, 12.0, 7.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02520751953125, -0.024524927139282227, -0.023842334747314453, -0.02315974235534668, -0.022477149963378906, -0.021794557571411133, -0.02111196517944336, -0.020429372787475586, -0.019746780395507812, -0.01906418800354004, -0.018381595611572266, -0.017699003219604492, -0.01701641082763672, -0.016333818435668945, -0.015651226043701172, -0.014968633651733398, -0.014286041259765625, -0.013603448867797852, -0.012920856475830078, -0.012238264083862305, -0.011555671691894531, -0.010873079299926758, -0.010190486907958984, -0.009507894515991211, -0.008825302124023438, -0.008142709732055664, -0.007460117340087891, -0.006777524948120117, -0.006094932556152344, -0.00541234016418457, -0.004729747772216797, -0.0040471553802490234, -0.00336456298828125, -0.0026819705963134766, -0.001999378204345703, -0.0013167858123779297, -0.0006341934204101562, 4.839897155761719e-05, 0.0007309913635253906, 0.001413583755493164, 0.0020961761474609375, 0.002778768539428711, 0.0034613609313964844, 0.004143953323364258, 0.004826545715332031, 0.005509138107299805, 0.006191730499267578, 0.0068743228912353516, 0.007556915283203125, 0.008239507675170898, 0.008922100067138672, 0.009604692459106445, 0.010287284851074219, 0.010969877243041992, 0.011652469635009766, 0.012335062026977539, 0.013017654418945312, 0.013700246810913086, 0.01438283920288086, 0.015065431594848633, 0.015748023986816406, 0.01643061637878418, 0.017113208770751953, 0.017795801162719727, 0.0184783935546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 15.0, 25.0, 58.0, 91.0, 251.0, 635.0, 1983.0, 19666.0, 934283.0, 86281.0, 3646.0, 964.0, 346.0, 147.0, 68.0, 32.0, 16.0, 9.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0780029296875, -0.07568645477294922, -0.07336997985839844, -0.07105350494384766, -0.06873703002929688, -0.0664205551147461, -0.06410408020019531, -0.06178760528564453, -0.05947113037109375, -0.05715465545654297, -0.05483818054199219, -0.052521705627441406, -0.050205230712890625, -0.047888755798339844, -0.04557228088378906, -0.04325580596923828, -0.0409393310546875, -0.03862285614013672, -0.03630638122558594, -0.033989906311035156, -0.031673431396484375, -0.029356956481933594, -0.027040481567382812, -0.02472400665283203, -0.02240753173828125, -0.02009105682373047, -0.017774581909179688, -0.015458106994628906, -0.013141632080078125, -0.010825157165527344, -0.008508682250976562, -0.006192207336425781, -0.003875732421875, -0.0015592575073242188, 0.0007572174072265625, 0.0030736923217773438, 0.005390167236328125, 0.007706642150878906, 0.010023117065429688, 0.012339591979980469, 0.01465606689453125, 0.01697254180908203, 0.019289016723632812, 0.021605491638183594, 0.023921966552734375, 0.026238441467285156, 0.028554916381835938, 0.03087139129638672, 0.0331878662109375, 0.03550434112548828, 0.03782081604003906, 0.040137290954589844, 0.042453765869140625, 0.044770240783691406, 0.04708671569824219, 0.04940319061279297, 0.05171966552734375, 0.05403614044189453, 0.05635261535644531, 0.058669090270996094, 0.060985565185546875, 0.06330204010009766, 0.06561851501464844, 0.06793498992919922, 0.07025146484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 9.0, 11.0, 27.0, 42.0, 39.0, 68.0, 79.0, 113.0, 87.0, 102.0, 86.0, 70.0, 80.0, 55.0, 58.0, 29.0, 25.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.075439453125, -0.07217597961425781, -0.06891250610351562, -0.06564903259277344, -0.06238555908203125, -0.05912208557128906, -0.055858612060546875, -0.05259513854980469, -0.0493316650390625, -0.04606819152832031, -0.042804718017578125, -0.03954124450683594, -0.03627777099609375, -0.03301429748535156, -0.029750823974609375, -0.026487350463867188, -0.023223876953125, -0.019960403442382812, -0.016696929931640625, -0.013433456420898438, -0.01016998291015625, -0.0069065093994140625, -0.003643035888671875, -0.0003795623779296875, 0.0028839111328125, 0.0061473846435546875, 0.009410858154296875, 0.012674331665039062, 0.01593780517578125, 0.019201278686523438, 0.022464752197265625, 0.025728225708007812, 0.02899169921875, 0.03225517272949219, 0.035518646240234375, 0.03878211975097656, 0.04204559326171875, 0.04530906677246094, 0.048572540283203125, 0.05183601379394531, 0.0550994873046875, 0.05836296081542969, 0.061626434326171875, 0.06488990783691406, 0.06815338134765625, 0.07141685485839844, 0.07468032836914062, 0.07794380187988281, 0.081207275390625, 0.08447074890136719, 0.08773422241210938, 0.09099769592285156, 0.09426116943359375, 0.09752464294433594, 0.10078811645507812, 0.10405158996582031, 0.1073150634765625, 0.11057853698730469, 0.11384201049804688, 0.11710548400878906, 0.12036895751953125, 0.12363243103027344, 0.12689590454101562, 0.1301593780517578, 0.1334228515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 20.0, 34.0, 64.0, 116.0, 360.0, 1359.0, 10121.0, 754580.0, 274024.0, 6221.0, 1046.0, 317.0, 150.0, 63.0, 23.0, 17.0, 9.0, 2.0, 8.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211181640625, -0.020270347595214844, -0.019422531127929688, -0.01857471466064453, -0.017726898193359375, -0.01687908172607422, -0.016031265258789062, -0.015183448791503906, -0.01433563232421875, -0.013487815856933594, -0.012639999389648438, -0.011792182922363281, -0.010944366455078125, -0.010096549987792969, -0.009248733520507812, -0.008400917053222656, -0.0075531005859375, -0.006705284118652344, -0.0058574676513671875, -0.005009651184082031, -0.004161834716796875, -0.0033140182495117188, -0.0024662017822265625, -0.0016183853149414062, -0.00077056884765625, 7.724761962890625e-05, 0.0009250640869140625, 0.0017728805541992188, 0.002620697021484375, 0.0034685134887695312, 0.0043163299560546875, 0.005164146423339844, 0.006011962890625, 0.006859779357910156, 0.0077075958251953125, 0.008555412292480469, 0.009403228759765625, 0.010251045227050781, 0.011098861694335938, 0.011946678161621094, 0.01279449462890625, 0.013642311096191406, 0.014490127563476562, 0.015337944030761719, 0.016185760498046875, 0.01703357696533203, 0.017881393432617188, 0.018729209899902344, 0.0195770263671875, 0.020424842834472656, 0.021272659301757812, 0.02212047576904297, 0.022968292236328125, 0.02381610870361328, 0.024663925170898438, 0.025511741638183594, 0.02635955810546875, 0.027207374572753906, 0.028055191040039062, 0.02890300750732422, 0.029750823974609375, 0.03059864044189453, 0.03144645690917969, 0.032294273376464844, 0.03314208984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 4.0, 9.0, 11.0, 16.0, 25.0, 33.0, 31.0, 52.0, 67.0, 94.0, 132.0, 133.0, 89.0, 60.0, 47.0, 41.0, 26.0, 20.0, 12.0, 15.0, 11.0, 2.0, 5.0, 8.0, 9.0, 5.0, 7.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.112720489501953e-05, -3.9880163967609406e-05, -3.863312304019928e-05, -3.7386082112789154e-05, -3.613904118537903e-05, -3.48920002579689e-05, -3.364495933055878e-05, -3.239791840314865e-05, -3.1150877475738525e-05, -2.99038365483284e-05, -2.8656795620918274e-05, -2.7409754693508148e-05, -2.6162713766098022e-05, -2.4915672838687897e-05, -2.366863191127777e-05, -2.2421590983867645e-05, -2.117455005645752e-05, -1.9927509129047394e-05, -1.8680468201637268e-05, -1.7433427274227142e-05, -1.6186386346817017e-05, -1.4939345419406891e-05, -1.3692304491996765e-05, -1.244526356458664e-05, -1.1198222637176514e-05, -9.951181709766388e-06, -8.704140782356262e-06, -7.4570998549461365e-06, -6.210058927536011e-06, -4.963018000125885e-06, -3.7159770727157593e-06, -2.4689361453056335e-06, -1.2218952178955078e-06, 2.514570951461792e-08, 1.2721866369247437e-06, 2.5192275643348694e-06, 3.766268491744995e-06, 5.013309419155121e-06, 6.260350346565247e-06, 7.507391273975372e-06, 8.754432201385498e-06, 1.0001473128795624e-05, 1.124851405620575e-05, 1.2495554983615875e-05, 1.3742595911026001e-05, 1.4989636838436127e-05, 1.6236677765846252e-05, 1.7483718693256378e-05, 1.8730759620666504e-05, 1.997780054807663e-05, 2.1224841475486755e-05, 2.247188240289688e-05, 2.3718923330307007e-05, 2.4965964257717133e-05, 2.6213005185127258e-05, 2.7460046112537384e-05, 2.870708703994751e-05, 2.9954127967357635e-05, 3.120116889476776e-05, 3.244820982217789e-05, 3.369525074958801e-05, 3.494229167699814e-05, 3.6189332604408264e-05, 3.743637353181839e-05, 3.8683414459228516e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 4.0, 10.0, 18.0, 31.0, 62.0, 101.0, 259.0, 825.0, 3794.0, 115181.0, 913414.0, 12651.0, 1464.0, 390.0, 181.0, 79.0, 38.0, 24.0, 4.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.02787041664123535, -0.026978015899658203, -0.026085615158081055, -0.025193214416503906, -0.024300813674926758, -0.02340841293334961, -0.02251601219177246, -0.021623611450195312, -0.020731210708618164, -0.019838809967041016, -0.018946409225463867, -0.01805400848388672, -0.01716160774230957, -0.016269207000732422, -0.015376806259155273, -0.014484405517578125, -0.013592004776000977, -0.012699604034423828, -0.01180720329284668, -0.010914802551269531, -0.010022401809692383, -0.009130001068115234, -0.008237600326538086, -0.0073451995849609375, -0.006452798843383789, -0.005560398101806641, -0.004667997360229492, -0.0037755966186523438, -0.0028831958770751953, -0.001990795135498047, -0.0010983943939208984, -0.00020599365234375, 0.0006864070892333984, 0.0015788078308105469, 0.0024712085723876953, 0.0033636093139648438, 0.004256010055541992, 0.005148410797119141, 0.006040811538696289, 0.0069332122802734375, 0.007825613021850586, 0.008718013763427734, 0.009610414505004883, 0.010502815246582031, 0.01139521598815918, 0.012287616729736328, 0.013180017471313477, 0.014072418212890625, 0.014964818954467773, 0.015857219696044922, 0.01674962043762207, 0.01764202117919922, 0.018534421920776367, 0.019426822662353516, 0.020319223403930664, 0.021211624145507812, 0.02210402488708496, 0.02299642562866211, 0.023888826370239258, 0.024781227111816406, 0.025673627853393555, 0.026566028594970703, 0.02745842933654785, 0.028350830078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 9.0, 10.0, 11.0, 25.0, 43.0, 57.0, 130.0, 177.0, 203.0, 153.0, 71.0, 41.0, 25.0, 21.0, 7.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297698974609375, -0.028970956802368164, -0.028172016143798828, -0.027373075485229492, -0.026574134826660156, -0.02577519416809082, -0.024976253509521484, -0.02417731285095215, -0.023378372192382812, -0.022579431533813477, -0.02178049087524414, -0.020981550216674805, -0.02018260955810547, -0.019383668899536133, -0.018584728240966797, -0.01778578758239746, -0.016986846923828125, -0.01618790626525879, -0.015388965606689453, -0.014590024948120117, -0.013791084289550781, -0.012992143630981445, -0.01219320297241211, -0.011394262313842773, -0.010595321655273438, -0.009796380996704102, -0.008997440338134766, -0.00819849967956543, -0.007399559020996094, -0.006600618362426758, -0.005801677703857422, -0.005002737045288086, -0.00420379638671875, -0.003404855728149414, -0.002605915069580078, -0.0018069744110107422, -0.0010080337524414062, -0.0002090930938720703, 0.0005898475646972656, 0.0013887882232666016, 0.0021877288818359375, 0.0029866695404052734, 0.0037856101989746094, 0.004584550857543945, 0.005383491516113281, 0.006182432174682617, 0.006981372833251953, 0.007780313491821289, 0.008579254150390625, 0.009378194808959961, 0.010177135467529297, 0.010976076126098633, 0.011775016784667969, 0.012573957443237305, 0.01337289810180664, 0.014171838760375977, 0.014970779418945312, 0.01576972007751465, 0.016568660736083984, 0.01736760139465332, 0.018166542053222656, 0.018965482711791992, 0.019764423370361328, 0.020563364028930664, 0.0213623046875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 12.0, 31.0, 90.0, 259.0, 304.0, 176.0, 75.0, 27.0, 15.0, 0.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36147540807724, -0.3451583683490753, -0.32884132862091064, -0.31252431869506836, -0.2962072789669037, -0.279890239238739, -0.26357322931289673, -0.24725618958473206, -0.23093914985656738, -0.2146221101284027, -0.19830508530139923, -0.18198806047439575, -0.16567102074623108, -0.1493539810180664, -0.13303695619106293, -0.11671992391347885, -0.10040289163589478, -0.0840858593583107, -0.06776882708072662, -0.05145179480314255, -0.03513476252555847, -0.018817730247974396, -0.00250069797039032, 0.013816334307193756, 0.030133366584777832, 0.04645039886236191, 0.06276743113994598, 0.07908446341753006, 0.09540149569511414, 0.11171852797269821, 0.1280355602502823, 0.14435258507728577, 0.16066968441009521, 0.1769867241382599, 0.19330374896526337, 0.20962077379226685, 0.22593781352043152, 0.2422548532485962, 0.2585718631744385, 0.27488890290260315, 0.2912059426307678, 0.3075229823589325, 0.32384002208709717, 0.34015703201293945, 0.3564740717411041, 0.3727911114692688, 0.3891081213951111, 0.40542516112327576, 0.42174220085144043, 0.4380592405796051, 0.4543762803077698, 0.47069329023361206, 0.48701032996177673, 0.5033273696899414, 0.5196443796157837, 0.5359614491462708, 0.552278459072113, 0.5685954689979553, 0.5849125385284424, 0.6012295484542847, 0.617546558380127, 0.633863627910614, 0.6501806378364563, 0.6664977073669434, 0.6828147172927856]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 11.0, 8.0, 12.0, 16.0, 17.0, 13.0, 22.0, 22.0, 30.0, 29.0, 28.0, 37.0, 38.0, 35.0, 38.0, 40.0, 44.0, 56.0, 53.0, 41.0, 48.0, 35.0, 31.0, 31.0, 26.0, 31.0, 25.0, 23.0, 28.0, 21.0, 15.0, 15.0, 15.0, 7.0, 9.0, 9.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.2416272759437561, -0.23407693207263947, -0.22652658820152283, -0.218976229429245, -0.21142588555812836, -0.20387554168701172, -0.1963251829147339, -0.18877483904361725, -0.1812244951725006, -0.17367415130138397, -0.16612380743026733, -0.1585734486579895, -0.15102310478687286, -0.14347276091575623, -0.1359224021434784, -0.12837205827236176, -0.12082171440124512, -0.11327137053012848, -0.10572101920843124, -0.09817066788673401, -0.09062032401561737, -0.08306998014450073, -0.0755196288228035, -0.06796927750110626, -0.060418933629989624, -0.05286858603358269, -0.04531823843717575, -0.037767890840768814, -0.030217543244361877, -0.02266719564795494, -0.015116848051548004, -0.0075665004551410675, -1.615285873413086e-05, 0.007534194737672806, 0.015084542334079742, 0.02263488993048668, 0.030185237526893616, 0.03773558512330055, 0.04528593271970749, 0.052836280316114426, 0.06038662791252136, 0.067936971783638, 0.07548732310533524, 0.08303767442703247, 0.09058801829814911, 0.09813836216926575, 0.10568871349096298, 0.11323906481266022, 0.12078940868377686, 0.1283397525548935, 0.13589009642601013, 0.14344045519828796, 0.1509907990694046, 0.15854114294052124, 0.16609150171279907, 0.1736418455839157, 0.18119218945503235, 0.188742533326149, 0.19629287719726562, 0.20384323596954346, 0.2113935798406601, 0.21894392371177673, 0.22649428248405457, 0.2340446263551712, 0.24159497022628784]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 11.0, 10.0, 10.0, 21.0, 55.0, 115.0, 289.0, 773.0, 2277.0, 9447.0, 72115.0, 3946684.0, 144253.0, 13516.0, 3010.0, 976.0, 403.0, 154.0, 80.0, 43.0, 16.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017425537109375, -0.01614522933959961, -0.014864921569824219, -0.013584613800048828, -0.012304306030273438, -0.011023998260498047, -0.009743690490722656, -0.008463382720947266, -0.007183074951171875, -0.005902767181396484, -0.004622459411621094, -0.003342151641845703, -0.0020618438720703125, -0.0007815361022949219, 0.0004987716674804688, 0.0017790794372558594, 0.00305938720703125, 0.004339694976806641, 0.005620002746582031, 0.006900310516357422, 0.008180618286132812, 0.009460926055908203, 0.010741233825683594, 0.012021541595458984, 0.013301849365234375, 0.014582157135009766, 0.015862464904785156, 0.017142772674560547, 0.018423080444335938, 0.019703388214111328, 0.02098369598388672, 0.02226400375366211, 0.0235443115234375, 0.02482461929321289, 0.02610492706298828, 0.027385234832763672, 0.028665542602539062, 0.029945850372314453, 0.031226158142089844, 0.032506465911865234, 0.033786773681640625, 0.035067081451416016, 0.036347389221191406, 0.0376276969909668, 0.03890800476074219, 0.04018831253051758, 0.04146862030029297, 0.04274892807006836, 0.04402923583984375, 0.04530954360961914, 0.04658985137939453, 0.04787015914916992, 0.04915046691894531, 0.0504307746887207, 0.051711082458496094, 0.052991390228271484, 0.054271697998046875, 0.055552005767822266, 0.056832313537597656, 0.05811262130737305, 0.05939292907714844, 0.06067323684692383, 0.06195354461669922, 0.06323385238647461, 0.06451416015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 15.0, 25.0, 29.0, 37.0, 48.0, 51.0, 60.0, 79.0, 69.0, 80.0, 85.0, 66.0, 62.0, 68.0, 56.0, 45.0, 23.0, 23.0, 15.0, 6.0, 10.0, 3.0, 6.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019195556640625, -0.018589019775390625, -0.01798248291015625, -0.017375946044921875, -0.0167694091796875, -0.016162872314453125, -0.01555633544921875, -0.014949798583984375, -0.01434326171875, -0.013736724853515625, -0.01313018798828125, -0.012523651123046875, -0.0119171142578125, -0.011310577392578125, -0.01070404052734375, -0.010097503662109375, -0.009490966796875, -0.008884429931640625, -0.00827789306640625, -0.007671356201171875, -0.0070648193359375, -0.006458282470703125, -0.00585174560546875, -0.005245208740234375, -0.004638671875, -0.004032135009765625, -0.00342559814453125, -0.002819061279296875, -0.0022125244140625, -0.001605987548828125, -0.00099945068359375, -0.000392913818359375, 0.000213623046875, 0.000820159912109375, 0.00142669677734375, 0.002033233642578125, 0.0026397705078125, 0.003246307373046875, 0.00385284423828125, 0.004459381103515625, 0.00506591796875, 0.005672454833984375, 0.00627899169921875, 0.006885528564453125, 0.0074920654296875, 0.008098602294921875, 0.00870513916015625, 0.009311676025390625, 0.009918212890625, 0.010524749755859375, 0.01113128662109375, 0.011737823486328125, 0.0123443603515625, 0.012950897216796875, 0.01355743408203125, 0.014163970947265625, 0.0147705078125, 0.015377044677734375, 0.01598358154296875, 0.016590118408203125, 0.0171966552734375, 0.017803192138671875, 0.01840972900390625, 0.019016265869140625, 0.019622802734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 4.0, 1.0, 9.0, 6.0, 15.0, 9.0, 21.0, 24.0, 31.0, 44.0, 79.0, 131.0, 258.0, 666.0, 2056.0, 9421.0, 78209.0, 3935771.0, 148080.0, 14792.0, 2904.0, 932.0, 355.0, 171.0, 84.0, 65.0, 49.0, 24.0, 15.0, 13.0, 9.0, 6.0, 3.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.044219970703125, -0.04294252395629883, -0.041665077209472656, -0.040387630462646484, -0.03911018371582031, -0.03783273696899414, -0.03655529022216797, -0.0352778434753418, -0.034000396728515625, -0.03272294998168945, -0.03144550323486328, -0.03016805648803711, -0.028890609741210938, -0.027613162994384766, -0.026335716247558594, -0.025058269500732422, -0.02378082275390625, -0.022503376007080078, -0.021225929260253906, -0.019948482513427734, -0.018671035766601562, -0.01739358901977539, -0.01611614227294922, -0.014838695526123047, -0.013561248779296875, -0.012283802032470703, -0.011006355285644531, -0.00972890853881836, -0.008451461791992188, -0.007174015045166016, -0.005896568298339844, -0.004619121551513672, -0.0033416748046875, -0.002064228057861328, -0.0007867813110351562, 0.0004906654357910156, 0.0017681121826171875, 0.0030455589294433594, 0.004323005676269531, 0.005600452423095703, 0.006877899169921875, 0.008155345916748047, 0.009432792663574219, 0.01071023941040039, 0.011987686157226562, 0.013265132904052734, 0.014542579650878906, 0.015820026397705078, 0.01709747314453125, 0.018374919891357422, 0.019652366638183594, 0.020929813385009766, 0.022207260131835938, 0.02348470687866211, 0.02476215362548828, 0.026039600372314453, 0.027317047119140625, 0.028594493865966797, 0.02987194061279297, 0.03114938735961914, 0.03242683410644531, 0.033704280853271484, 0.034981727600097656, 0.03625917434692383, 0.03753662109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 4.0, 7.0, 16.0, 31.0, 25.0, 33.0, 66.0, 93.0, 369.0, 1580.0, 1324.0, 251.0, 80.0, 46.0, 34.0, 29.0, 22.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.03645467758178711, -0.03531169891357422, -0.03416872024536133, -0.03302574157714844, -0.03188276290893555, -0.030739784240722656, -0.029596805572509766, -0.028453826904296875, -0.027310848236083984, -0.026167869567871094, -0.025024890899658203, -0.023881912231445312, -0.022738933563232422, -0.02159595489501953, -0.02045297622680664, -0.01930999755859375, -0.01816701889038086, -0.01702404022216797, -0.015881061553955078, -0.014738082885742188, -0.013595104217529297, -0.012452125549316406, -0.011309146881103516, -0.010166168212890625, -0.009023189544677734, -0.007880210876464844, -0.006737232208251953, -0.0055942535400390625, -0.004451274871826172, -0.0033082962036132812, -0.0021653175354003906, -0.0010223388671875, 0.00012063980102539062, 0.0012636184692382812, 0.002406597137451172, 0.0035495758056640625, 0.004692554473876953, 0.005835533142089844, 0.006978511810302734, 0.008121490478515625, 0.009264469146728516, 0.010407447814941406, 0.011550426483154297, 0.012693405151367188, 0.013836383819580078, 0.014979362487792969, 0.01612234115600586, 0.01726531982421875, 0.01840829849243164, 0.01955127716064453, 0.020694255828857422, 0.021837234497070312, 0.022980213165283203, 0.024123191833496094, 0.025266170501708984, 0.026409149169921875, 0.027552127838134766, 0.028695106506347656, 0.029838085174560547, 0.030981063842773438, 0.03212404251098633, 0.03326702117919922, 0.03440999984741211, 0.035552978515625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 8.0, 5.0, 7.0, 24.0, 49.0, 111.0, 187.0, 240.0, 204.0, 93.0, 42.0, 12.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27881789207458496, -0.27002912759780884, -0.2612403929233551, -0.252451628446579, -0.24366287887096405, -0.23487412929534912, -0.226085364818573, -0.21729661524295807, -0.20850786566734314, -0.1997191160917282, -0.19093036651611328, -0.18214160203933716, -0.17335285246372223, -0.1645641028881073, -0.15577533841133118, -0.14698658883571625, -0.13819783926010132, -0.1294090896844864, -0.12062033265829086, -0.11183157563209534, -0.10304282605648041, -0.09425407648086548, -0.08546531945466995, -0.07667656242847443, -0.0678878128528595, -0.05909905955195427, -0.05031030625104904, -0.041521552950143814, -0.032732799649238586, -0.02394404634833336, -0.015155293047428131, -0.0063665397465229034, 0.0024221837520599365, 0.011210937052965164, 0.019999690353870392, 0.02878844365477562, 0.03757719695568085, 0.046365950256586075, 0.0551547035574913, 0.06394346058368683, 0.07273221015930176, 0.08152095973491669, 0.09030971676111221, 0.09909847378730774, 0.10788722336292267, 0.1166759729385376, 0.12546473741531372, 0.13425348699092865, 0.14304223656654358, 0.1518309861421585, 0.16061973571777344, 0.16940850019454956, 0.1781972497701645, 0.18698599934577942, 0.19577476382255554, 0.20456351339817047, 0.2133522629737854, 0.22214101254940033, 0.23092976212501526, 0.23971852660179138, 0.2485072761774063, 0.25729602575302124, 0.26608479022979736, 0.2748735249042511, 0.2836622893810272]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 10.0, 7.0, 10.0, 6.0, 6.0, 10.0, 16.0, 23.0, 18.0, 20.0, 21.0, 25.0, 19.0, 28.0, 32.0, 38.0, 34.0, 40.0, 40.0, 39.0, 54.0, 43.0, 48.0, 32.0, 41.0, 38.0, 30.0, 26.0, 22.0, 25.0, 27.0, 19.0, 23.0, 20.0, 13.0, 13.0, 7.0, 13.0, 10.0, 7.0, 7.0, 9.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.09588378667831421, -0.09298962354660034, -0.09009545296430588, -0.08720128983259201, -0.08430711925029755, -0.08141295611858368, -0.07851879298686981, -0.07562462985515594, -0.07273045927286148, -0.06983629614114761, -0.06694212555885315, -0.06404796242713928, -0.06115379557013512, -0.05825962871313095, -0.055365465581417084, -0.05247129872441292, -0.04957713186740875, -0.04668296501040459, -0.04378879815340042, -0.040894635021686554, -0.03800046816468239, -0.03510630130767822, -0.032212138175964355, -0.02931797131896019, -0.026423804461956024, -0.02352963760495186, -0.020635472610592842, -0.017741307616233826, -0.01484714075922966, -0.011952974833548069, -0.009058808907866478, -0.0061646439135074615, -0.003270477056503296, -0.00037631113082170486, 0.002517854794859886, 0.005412020720541477, 0.008306186646223068, 0.01120035257190466, 0.01409451849758625, 0.016988683491945267, 0.019882850348949432, 0.022777017205953598, 0.025671182200312614, 0.02856534719467163, 0.031459514051675797, 0.03435368090867996, 0.03724784404039383, 0.040142010897397995, 0.04303617775440216, 0.045930344611406326, 0.04882451146841049, 0.05171867460012436, 0.054612841457128525, 0.05750700831413269, 0.06040117144584656, 0.06329533457756042, 0.06618950515985489, 0.06908366829156876, 0.07197783887386322, 0.07487200200557709, 0.07776616513729095, 0.08066033571958542, 0.08355449885129929, 0.08644866943359375, 0.08934283256530762]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 0.0, 4.0, 3.0, 7.0, 25.0, 30.0, 40.0, 54.0, 95.0, 176.0, 395.0, 749.0, 1573.0, 3981.0, 10523.0, 34137.0, 125714.0, 390202.0, 338802.0, 99493.0, 27643.0, 8780.0, 3323.0, 1418.0, 659.0, 317.0, 169.0, 94.0, 54.0, 29.0, 28.0, 13.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0197906494140625, -0.019129037857055664, -0.018467426300048828, -0.017805814743041992, -0.017144203186035156, -0.01648259162902832, -0.015820980072021484, -0.015159368515014648, -0.014497756958007812, -0.013836145401000977, -0.01317453384399414, -0.012512922286987305, -0.011851310729980469, -0.011189699172973633, -0.010528087615966797, -0.009866476058959961, -0.009204864501953125, -0.008543252944946289, -0.007881641387939453, -0.007220029830932617, -0.006558418273925781, -0.005896806716918945, -0.005235195159912109, -0.0045735836029052734, -0.0039119720458984375, -0.0032503604888916016, -0.0025887489318847656, -0.0019271373748779297, -0.0012655258178710938, -0.0006039142608642578, 5.7697296142578125e-05, 0.0007193088531494141, 0.00138092041015625, 0.002042531967163086, 0.002704143524169922, 0.003365755081176758, 0.004027366638183594, 0.00468897819519043, 0.005350589752197266, 0.0060122013092041016, 0.0066738128662109375, 0.0073354244232177734, 0.00799703598022461, 0.008658647537231445, 0.009320259094238281, 0.009981870651245117, 0.010643482208251953, 0.011305093765258789, 0.011966705322265625, 0.012628316879272461, 0.013289928436279297, 0.013951539993286133, 0.014613151550292969, 0.015274763107299805, 0.01593637466430664, 0.016597986221313477, 0.017259597778320312, 0.01792120933532715, 0.018582820892333984, 0.01924443244934082, 0.019906044006347656, 0.020567655563354492, 0.021229267120361328, 0.021890878677368164, 0.022552490234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 15.0, 16.0, 23.0, 33.0, 51.0, 59.0, 66.0, 57.0, 79.0, 93.0, 70.0, 74.0, 69.0, 54.0, 64.0, 45.0, 38.0, 15.0, 20.0, 8.0, 8.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01953125, -0.01890110969543457, -0.01827096939086914, -0.01764082908630371, -0.01701068878173828, -0.01638054847717285, -0.015750408172607422, -0.015120267868041992, -0.014490127563476562, -0.013859987258911133, -0.013229846954345703, -0.012599706649780273, -0.011969566345214844, -0.011339426040649414, -0.010709285736083984, -0.010079145431518555, -0.009449005126953125, -0.008818864822387695, -0.008188724517822266, -0.007558584213256836, -0.006928443908691406, -0.0062983036041259766, -0.005668163299560547, -0.005038022994995117, -0.0044078826904296875, -0.003777742385864258, -0.003147602081298828, -0.0025174617767333984, -0.0018873214721679688, -0.001257181167602539, -0.0006270408630371094, 3.0994415283203125e-06, 0.00063323974609375, 0.0012633800506591797, 0.0018935203552246094, 0.002523660659790039, 0.0031538009643554688, 0.0037839412689208984, 0.004414081573486328, 0.005044221878051758, 0.0056743621826171875, 0.006304502487182617, 0.006934642791748047, 0.0075647830963134766, 0.008194923400878906, 0.008825063705444336, 0.009455204010009766, 0.010085344314575195, 0.010715484619140625, 0.011345624923706055, 0.011975765228271484, 0.012605905532836914, 0.013236045837402344, 0.013866186141967773, 0.014496326446533203, 0.015126466751098633, 0.015756607055664062, 0.016386747360229492, 0.017016887664794922, 0.01764702796936035, 0.01827716827392578, 0.01890730857849121, 0.01953744888305664, 0.02016758918762207, 0.0207977294921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 14.0, 29.0, 32.0, 70.0, 107.0, 168.0, 247.0, 436.0, 757.0, 1537.0, 3961.0, 18352.0, 243002.0, 714140.0, 53562.0, 7240.0, 2262.0, 1043.0, 578.0, 361.0, 205.0, 156.0, 96.0, 50.0, 54.0, 23.0, 16.0, 15.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03839111328125, -0.037199974060058594, -0.03600883483886719, -0.03481769561767578, -0.033626556396484375, -0.03243541717529297, -0.031244277954101562, -0.030053138732910156, -0.02886199951171875, -0.027670860290527344, -0.026479721069335938, -0.02528858184814453, -0.024097442626953125, -0.02290630340576172, -0.021715164184570312, -0.020524024963378906, -0.0193328857421875, -0.018141746520996094, -0.016950607299804688, -0.01575946807861328, -0.014568328857421875, -0.013377189636230469, -0.012186050415039062, -0.010994911193847656, -0.00980377197265625, -0.008612632751464844, -0.0074214935302734375, -0.006230354309082031, -0.005039215087890625, -0.0038480758666992188, -0.0026569366455078125, -0.0014657974243164062, -0.000274658203125, 0.0009164810180664062, 0.0021076202392578125, 0.0032987594604492188, 0.004489898681640625, 0.005681037902832031, 0.0068721771240234375, 0.008063316345214844, 0.00925445556640625, 0.010445594787597656, 0.011636734008789062, 0.012827873229980469, 0.014019012451171875, 0.015210151672363281, 0.016401290893554688, 0.017592430114746094, 0.0187835693359375, 0.019974708557128906, 0.021165847778320312, 0.02235698699951172, 0.023548126220703125, 0.02473926544189453, 0.025930404663085938, 0.027121543884277344, 0.02831268310546875, 0.029503822326660156, 0.030694961547851562, 0.03188610076904297, 0.033077239990234375, 0.03426837921142578, 0.03545951843261719, 0.036650657653808594, 0.037841796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 8.0, 5.0, 11.0, 6.0, 11.0, 19.0, 13.0, 23.0, 28.0, 27.0, 23.0, 28.0, 30.0, 46.0, 40.0, 44.0, 48.0, 34.0, 50.0, 51.0, 46.0, 34.0, 35.0, 42.0, 39.0, 35.0, 30.0, 25.0, 28.0, 26.0, 12.0, 18.0, 23.0, 13.0, 15.0, 6.0, 5.0, 8.0, 6.0, 0.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03802490234375, -0.03664731979370117, -0.035269737243652344, -0.033892154693603516, -0.03251457214355469, -0.03113698959350586, -0.02975940704345703, -0.028381824493408203, -0.027004241943359375, -0.025626659393310547, -0.02424907684326172, -0.02287149429321289, -0.021493911743164062, -0.020116329193115234, -0.018738746643066406, -0.017361164093017578, -0.01598358154296875, -0.014605998992919922, -0.013228416442871094, -0.011850833892822266, -0.010473251342773438, -0.00909566879272461, -0.007718086242675781, -0.006340503692626953, -0.004962921142578125, -0.003585338592529297, -0.0022077560424804688, -0.0008301734924316406, 0.0005474090576171875, 0.0019249916076660156, 0.0033025741577148438, 0.004680156707763672, 0.0060577392578125, 0.007435321807861328, 0.008812904357910156, 0.010190486907958984, 0.011568069458007812, 0.01294565200805664, 0.014323234558105469, 0.015700817108154297, 0.017078399658203125, 0.018455982208251953, 0.01983356475830078, 0.02121114730834961, 0.022588729858398438, 0.023966312408447266, 0.025343894958496094, 0.026721477508544922, 0.02809906005859375, 0.029476642608642578, 0.030854225158691406, 0.032231807708740234, 0.03360939025878906, 0.03498697280883789, 0.03636455535888672, 0.03774213790893555, 0.039119720458984375, 0.0404973030090332, 0.04187488555908203, 0.04325246810913086, 0.04463005065917969, 0.046007633209228516, 0.047385215759277344, 0.04876279830932617, 0.050140380859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 1.0, 9.0, 5.0, 6.0, 9.0, 18.0, 48.0, 72.0, 141.0, 213.0, 486.0, 1025.0, 2792.0, 12670.0, 996288.0, 28395.0, 3958.0, 1274.0, 544.0, 249.0, 145.0, 97.0, 46.0, 21.0, 8.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0731201171875, -0.07112503051757812, -0.06912994384765625, -0.06713485717773438, -0.0651397705078125, -0.06314468383789062, -0.06114959716796875, -0.059154510498046875, -0.057159423828125, -0.055164337158203125, -0.05316925048828125, -0.051174163818359375, -0.0491790771484375, -0.047183990478515625, -0.04518890380859375, -0.043193817138671875, -0.04119873046875, -0.039203643798828125, -0.03720855712890625, -0.035213470458984375, -0.0332183837890625, -0.031223297119140625, -0.02922821044921875, -0.027233123779296875, -0.025238037109375, -0.023242950439453125, -0.02124786376953125, -0.019252777099609375, -0.0172576904296875, -0.015262603759765625, -0.01326751708984375, -0.011272430419921875, -0.00927734375, -0.007282257080078125, -0.00528717041015625, -0.003292083740234375, -0.0012969970703125, 0.000698089599609375, 0.00269317626953125, 0.004688262939453125, 0.006683349609375, 0.008678436279296875, 0.01067352294921875, 0.012668609619140625, 0.0146636962890625, 0.016658782958984375, 0.01865386962890625, 0.020648956298828125, 0.02264404296875, 0.024639129638671875, 0.02663421630859375, 0.028629302978515625, 0.0306243896484375, 0.032619476318359375, 0.03461456298828125, 0.036609649658203125, 0.038604736328125, 0.040599822998046875, 0.04259490966796875, 0.044589996337890625, 0.0465850830078125, 0.048580169677734375, 0.05057525634765625, 0.052570343017578125, 0.0545654296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 12.0, 7.0, 11.0, 23.0, 23.0, 23.0, 26.0, 67.0, 89.0, 139.0, 159.0, 142.0, 67.0, 39.0, 39.0, 25.0, 20.0, 17.0, 18.0, 6.0, 13.0, 10.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.684925079345703e-05, -4.5000575482845306e-05, -4.315190017223358e-05, -4.130322486162186e-05, -3.945454955101013e-05, -3.760587424039841e-05, -3.575719892978668e-05, -3.390852361917496e-05, -3.205984830856323e-05, -3.0211172997951508e-05, -2.8362497687339783e-05, -2.6513822376728058e-05, -2.4665147066116333e-05, -2.2816471755504608e-05, -2.0967796444892883e-05, -1.911912113428116e-05, -1.7270445823669434e-05, -1.542177051305771e-05, -1.3573095202445984e-05, -1.1724419891834259e-05, -9.875744581222534e-06, -8.02706927061081e-06, -6.1783939599990845e-06, -4.32971864938736e-06, -2.4810433387756348e-06, -6.323680281639099e-07, 1.216307282447815e-06, 3.06498259305954e-06, 4.913657903671265e-06, 6.7623332142829895e-06, 8.611008524894714e-06, 1.045968383550644e-05, 1.2308359146118164e-05, 1.4157034456729889e-05, 1.6005709767341614e-05, 1.785438507795334e-05, 1.9703060388565063e-05, 2.155173569917679e-05, 2.3400411009788513e-05, 2.5249086320400238e-05, 2.7097761631011963e-05, 2.8946436941623688e-05, 3.079511225223541e-05, 3.264378756284714e-05, 3.449246287345886e-05, 3.634113818407059e-05, 3.818981349468231e-05, 4.003848880529404e-05, 4.188716411590576e-05, 4.3735839426517487e-05, 4.558451473712921e-05, 4.7433190047740936e-05, 4.928186535835266e-05, 5.1130540668964386e-05, 5.297921597957611e-05, 5.4827891290187836e-05, 5.667656660079956e-05, 5.8525241911411285e-05, 6.037391722202301e-05, 6.222259253263474e-05, 6.407126784324646e-05, 6.591994315385818e-05, 6.776861846446991e-05, 6.961729377508163e-05, 7.146596908569336e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 11.0, 8.0, 9.0, 11.0, 18.0, 19.0, 24.0, 57.0, 92.0, 152.0, 298.0, 570.0, 1404.0, 3558.0, 11947.0, 366618.0, 643448.0, 13425.0, 3805.0, 1545.0, 702.0, 332.0, 179.0, 94.0, 61.0, 43.0, 30.0, 17.0, 10.0, 8.0, 11.0, 7.0, 4.0, 7.0, 6.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.036712646484375, -0.03563404083251953, -0.03455543518066406, -0.033476829528808594, -0.032398223876953125, -0.031319618225097656, -0.030241012573242188, -0.02916240692138672, -0.02808380126953125, -0.02700519561767578, -0.025926589965820312, -0.024847984313964844, -0.023769378662109375, -0.022690773010253906, -0.021612167358398438, -0.02053356170654297, -0.0194549560546875, -0.01837635040283203, -0.017297744750976562, -0.016219139099121094, -0.015140533447265625, -0.014061927795410156, -0.012983322143554688, -0.011904716491699219, -0.01082611083984375, -0.009747505187988281, -0.008668899536132812, -0.007590293884277344, -0.006511688232421875, -0.005433082580566406, -0.0043544769287109375, -0.0032758712768554688, -0.002197265625, -0.0011186599731445312, -4.00543212890625e-05, 0.0010385513305664062, 0.002117156982421875, 0.0031957626342773438, 0.0042743682861328125, 0.005352973937988281, 0.00643157958984375, 0.007510185241699219, 0.008588790893554688, 0.009667396545410156, 0.010746002197265625, 0.011824607849121094, 0.012903213500976562, 0.013981819152832031, 0.0150604248046875, 0.01613903045654297, 0.017217636108398438, 0.018296241760253906, 0.019374847412109375, 0.020453453063964844, 0.021532058715820312, 0.02261066436767578, 0.02368927001953125, 0.02476787567138672, 0.025846481323242188, 0.026925086975097656, 0.028003692626953125, 0.029082298278808594, 0.030160903930664062, 0.03123950958251953, 0.032318115234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 6.0, 18.0, 21.0, 52.0, 65.0, 117.0, 152.0, 190.0, 149.0, 80.0, 39.0, 34.0, 21.0, 12.0, 13.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.024169921875, -0.023463964462280273, -0.022758007049560547, -0.02205204963684082, -0.021346092224121094, -0.020640134811401367, -0.01993417739868164, -0.019228219985961914, -0.018522262573242188, -0.01781630516052246, -0.017110347747802734, -0.016404390335083008, -0.01569843292236328, -0.014992475509643555, -0.014286518096923828, -0.013580560684204102, -0.012874603271484375, -0.012168645858764648, -0.011462688446044922, -0.010756731033325195, -0.010050773620605469, -0.009344816207885742, -0.008638858795166016, -0.007932901382446289, -0.0072269439697265625, -0.006520986557006836, -0.005815029144287109, -0.005109071731567383, -0.004403114318847656, -0.0036971569061279297, -0.002991199493408203, -0.0022852420806884766, -0.00157928466796875, -0.0008733272552490234, -0.00016736984252929688, 0.0005385875701904297, 0.0012445449829101562, 0.0019505023956298828, 0.0026564598083496094, 0.003362417221069336, 0.0040683746337890625, 0.004774332046508789, 0.005480289459228516, 0.006186246871948242, 0.006892204284667969, 0.007598161697387695, 0.008304119110107422, 0.009010076522827148, 0.009716033935546875, 0.010421991348266602, 0.011127948760986328, 0.011833906173706055, 0.012539863586425781, 0.013245820999145508, 0.013951778411865234, 0.014657735824584961, 0.015363693237304688, 0.016069650650024414, 0.01677560806274414, 0.017481565475463867, 0.018187522888183594, 0.01889348030090332, 0.019599437713623047, 0.020305395126342773, 0.0210113525390625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 5.0, 12.0, 33.0, 125.0, 432.0, 310.0, 68.0, 16.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21322138607501984, -0.18608735501766205, -0.15895330905914307, -0.13181927800178528, -0.1046852394938469, -0.07755120098590851, -0.05041716992855072, -0.02328312397003174, 0.00385090708732605, 0.030984943732619286, 0.05811898037791252, 0.08525301516056061, 0.11238705366849899, 0.13952109217643738, 0.16665512323379517, 0.19378916919231415, 0.22092320024967194, 0.24805723130702972, 0.2751912772655487, 0.3023253083229065, 0.3294593393802643, 0.35659337043762207, 0.38372743129730225, 0.41086146235466003, 0.4379954934120178, 0.4651295244693756, 0.4922635555267334, 0.5193976163864136, 0.546531617641449, 0.5736656785011292, 0.6007996797561646, 0.6279337406158447, 0.6550677418708801, 0.6822018027305603, 0.7093358039855957, 0.7364698648452759, 0.7636038661003113, 0.7907379269599915, 0.8178719282150269, 0.845005989074707, 0.8721400499343872, 0.8992741107940674, 0.9264081120491028, 0.953542172908783, 0.9806761741638184, 1.0078102350234985, 1.0349442958831787, 1.0620783567428589, 1.0892122983932495, 1.1163463592529297, 1.1434804201126099, 1.1706143617630005, 1.1977484226226807, 1.2248824834823608, 1.252016544342041, 1.2791506052017212, 1.3062846660614014, 1.3334187269210815, 1.3605527877807617, 1.3876867294311523, 1.4148207902908325, 1.4419548511505127, 1.4690889120101929, 1.496222972869873, 1.5233569145202637]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 11.0, 12.0, 17.0, 18.0, 23.0, 17.0, 26.0, 39.0, 41.0, 36.0, 47.0, 43.0, 44.0, 60.0, 55.0, 65.0, 63.0, 55.0, 41.0, 42.0, 36.0, 37.0, 31.0, 21.0, 26.0, 14.0, 11.0, 15.0, 9.0, 7.0, 10.0, 6.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17495495080947876, -0.16816669702529907, -0.16137844324111938, -0.1545901745557785, -0.14780192077159882, -0.14101366698741913, -0.13422539830207825, -0.12743714451789856, -0.12064889073371887, -0.11386063694953918, -0.1070723757147789, -0.10028411448001862, -0.09349586069583893, -0.08670760691165924, -0.07991934567689896, -0.07313108444213867, -0.06634283065795898, -0.059554573148489, -0.05276631563901901, -0.045978058129549026, -0.03918980062007904, -0.032401543110609055, -0.02561328560113907, -0.018825028091669083, -0.012036770582199097, -0.005248513072729111, 0.0015397444367408752, 0.008328001946210861, 0.015116259455680847, 0.021904516965150833, 0.02869277447462082, 0.035481031984090805, 0.04226928949356079, 0.04905754700303078, 0.05584580451250076, 0.06263406574726105, 0.06942231953144073, 0.07621057331562042, 0.0829988345503807, 0.08978709578514099, 0.09657534956932068, 0.10336360335350037, 0.11015186458826065, 0.11694012582302094, 0.12372837960720062, 0.1305166333913803, 0.1373049020767212, 0.14409315586090088, 0.15088140964508057, 0.15766966342926025, 0.16445791721343994, 0.17124618589878082, 0.1780344396829605, 0.1848226934671402, 0.19161096215248108, 0.19839921593666077, 0.20518746972084045, 0.21197572350502014, 0.21876397728919983, 0.2255522459745407, 0.2323404997587204, 0.23912875354290009, 0.24591702222824097, 0.25270527601242065, 0.25949352979660034]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 11.0, 39.0, 119.0, 352.0, 1820487.0, 2372818.0, 315.0, 90.0, 32.0, 17.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2320556640625, -0.20627403259277344, -0.18049240112304688, -0.1547107696533203, -0.12892913818359375, -0.10314750671386719, -0.07736587524414062, -0.05158424377441406, -0.0258026123046875, -2.09808349609375e-05, 0.025760650634765625, 0.05154228210449219, 0.07732391357421875, 0.10310554504394531, 0.12888717651367188, 0.15466880798339844, 0.180450439453125, 0.20623207092285156, 0.23201370239257812, 0.2577953338623047, 0.28357696533203125, 0.3093585968017578, 0.3351402282714844, 0.36092185974121094, 0.3867034912109375, 0.41248512268066406, 0.4382667541503906, 0.4640483856201172, 0.48983001708984375, 0.5156116485595703, 0.5413932800292969, 0.5671749114990234, 0.59295654296875, 0.6187381744384766, 0.6445198059082031, 0.6703014373779297, 0.6960830688476562, 0.7218647003173828, 0.7476463317871094, 0.7734279632568359, 0.7992095947265625, 0.8249912261962891, 0.8507728576660156, 0.8765544891357422, 0.9023361206054688, 0.9281177520751953, 0.9538993835449219, 0.9796810150146484, 1.005462646484375, 1.0312442779541016, 1.0570259094238281, 1.0828075408935547, 1.1085891723632812, 1.1343708038330078, 1.1601524353027344, 1.185934066772461, 1.2117156982421875, 1.237497329711914, 1.2632789611816406, 1.2890605926513672, 1.3148422241210938, 1.3406238555908203, 1.3664054870605469, 1.3921871185302734, 1.41796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 1.0, 10.0, 14.0, 25.0, 36.0, 50.0, 64.0, 63.0, 77.0, 80.0, 76.0, 85.0, 72.0, 77.0, 78.0, 45.0, 39.0, 32.0, 22.0, 11.0, 9.0, 7.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184478759765625, -0.017790555953979492, -0.017133235931396484, -0.016475915908813477, -0.01581859588623047, -0.015161275863647461, -0.014503955841064453, -0.013846635818481445, -0.013189315795898438, -0.01253199577331543, -0.011874675750732422, -0.011217355728149414, -0.010560035705566406, -0.009902715682983398, -0.00924539566040039, -0.008588075637817383, -0.007930755615234375, -0.007273435592651367, -0.006616115570068359, -0.0059587955474853516, -0.005301475524902344, -0.004644155502319336, -0.003986835479736328, -0.0033295154571533203, -0.0026721954345703125, -0.0020148754119873047, -0.0013575553894042969, -0.0007002353668212891, -4.291534423828125e-05, 0.0006144046783447266, 0.0012717247009277344, 0.0019290447235107422, 0.00258636474609375, 0.003243684768676758, 0.0039010047912597656, 0.0045583248138427734, 0.005215644836425781, 0.005872964859008789, 0.006530284881591797, 0.007187604904174805, 0.007844924926757812, 0.00850224494934082, 0.009159564971923828, 0.009816884994506836, 0.010474205017089844, 0.011131525039672852, 0.01178884506225586, 0.012446165084838867, 0.013103485107421875, 0.013760805130004883, 0.01441812515258789, 0.015075445175170898, 0.015732765197753906, 0.016390085220336914, 0.017047405242919922, 0.01770472526550293, 0.018362045288085938, 0.019019365310668945, 0.019676685333251953, 0.02033400535583496, 0.02099132537841797, 0.021648645401000977, 0.022305965423583984, 0.022963285446166992, 0.02362060546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 15.0, 24.0, 39.0, 93.0, 183.0, 426.0, 934.0, 2701.0, 12927.0, 174290.0, 3940919.0, 52533.0, 6475.0, 1663.0, 551.0, 262.0, 115.0, 42.0, 34.0, 16.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05572509765625, -0.05405235290527344, -0.052379608154296875, -0.05070686340332031, -0.04903411865234375, -0.04736137390136719, -0.045688629150390625, -0.04401588439941406, -0.0423431396484375, -0.04067039489746094, -0.038997650146484375, -0.03732490539550781, -0.03565216064453125, -0.03397941589355469, -0.032306671142578125, -0.030633926391601562, -0.028961181640625, -0.027288436889648438, -0.025615692138671875, -0.023942947387695312, -0.02227020263671875, -0.020597457885742188, -0.018924713134765625, -0.017251968383789062, -0.0155792236328125, -0.013906478881835938, -0.012233734130859375, -0.010560989379882812, -0.00888824462890625, -0.0072154998779296875, -0.005542755126953125, -0.0038700103759765625, -0.002197265625, -0.0005245208740234375, 0.001148223876953125, 0.0028209686279296875, 0.00449371337890625, 0.0061664581298828125, 0.007839202880859375, 0.009511947631835938, 0.0111846923828125, 0.012857437133789062, 0.014530181884765625, 0.016202926635742188, 0.01787567138671875, 0.019548416137695312, 0.021221160888671875, 0.022893905639648438, 0.024566650390625, 0.026239395141601562, 0.027912139892578125, 0.029584884643554688, 0.03125762939453125, 0.03293037414550781, 0.034603118896484375, 0.03627586364746094, 0.0379486083984375, 0.03962135314941406, 0.041294097900390625, 0.04296684265136719, 0.04463958740234375, 0.04631233215332031, 0.047985076904296875, 0.04965782165527344, 0.05133056640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 21.0, 19.0, 37.0, 69.0, 88.0, 321.0, 1417.0, 1413.0, 368.0, 109.0, 75.0, 39.0, 24.0, 16.0, 7.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.047454833984375, -0.04623866081237793, -0.04502248764038086, -0.04380631446838379, -0.04259014129638672, -0.04137396812438965, -0.04015779495239258, -0.03894162178039551, -0.03772544860839844, -0.03650927543640137, -0.0352931022644043, -0.03407692909240723, -0.032860755920410156, -0.031644582748413086, -0.030428409576416016, -0.029212236404418945, -0.027996063232421875, -0.026779890060424805, -0.025563716888427734, -0.024347543716430664, -0.023131370544433594, -0.021915197372436523, -0.020699024200439453, -0.019482851028442383, -0.018266677856445312, -0.017050504684448242, -0.015834331512451172, -0.014618158340454102, -0.013401985168457031, -0.012185811996459961, -0.01096963882446289, -0.00975346565246582, -0.00853729248046875, -0.00732111930847168, -0.006104946136474609, -0.004888772964477539, -0.0036725997924804688, -0.0024564266204833984, -0.0012402534484863281, -2.4080276489257812e-05, 0.0011920928955078125, 0.002408266067504883, 0.003624439239501953, 0.0048406124114990234, 0.006056785583496094, 0.007272958755493164, 0.008489131927490234, 0.009705305099487305, 0.010921478271484375, 0.012137651443481445, 0.013353824615478516, 0.014569997787475586, 0.015786170959472656, 0.017002344131469727, 0.018218517303466797, 0.019434690475463867, 0.020650863647460938, 0.021867036819458008, 0.023083209991455078, 0.02429938316345215, 0.02551555633544922, 0.02673172950744629, 0.02794790267944336, 0.02916407585144043, 0.0303802490234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 14.0, 31.0, 63.0, 131.0, 230.0, 250.0, 147.0, 85.0, 18.0, 4.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46390947699546814, -0.4539170265197754, -0.44392457604408264, -0.4339321553707123, -0.42393970489501953, -0.4139472544193268, -0.40395480394363403, -0.3939623534679413, -0.38396990299224854, -0.3739774525165558, -0.36398500204086304, -0.3539925813674927, -0.3440001308917999, -0.3340076804161072, -0.32401522994041443, -0.3140227794647217, -0.3040303587913513, -0.29403790831565857, -0.2840454578399658, -0.27405303716659546, -0.2640605866909027, -0.25406813621520996, -0.2440756857395172, -0.23408323526382446, -0.2240907996892929, -0.21409834921360016, -0.2041059136390686, -0.19411346316337585, -0.1841210126876831, -0.17412857711315155, -0.1641361266374588, -0.15414369106292725, -0.1441512554883957, -0.13415880501270294, -0.12416636943817139, -0.11417391896247864, -0.10418147593736649, -0.09418903291225433, -0.08419658243656158, -0.07420413941144943, -0.06421169638633728, -0.05421925336122513, -0.04422680661082268, -0.03423435986042023, -0.024241916835308075, -0.014249473810195923, -0.004257027059793472, 0.005735419690608978, 0.01572786271572113, 0.02572030760347843, 0.03571275249123573, 0.045705199241638184, 0.055697642266750336, 0.06569008529186249, 0.07568253576755524, 0.08567497879266739, 0.09566742181777954, 0.1056598648428917, 0.11565230786800385, 0.1256447583436966, 0.13563719391822815, 0.1456296443939209, 0.15562209486961365, 0.1656145453453064, 0.17560698091983795]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 12.0, 22.0, 16.0, 25.0, 27.0, 32.0, 50.0, 42.0, 45.0, 57.0, 51.0, 60.0, 54.0, 52.0, 65.0, 63.0, 52.0, 50.0, 35.0, 40.0, 20.0, 19.0, 28.0, 19.0, 7.0, 14.0, 6.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14072805643081665, -0.1366768777370453, -0.13262568414211273, -0.12857449054718018, -0.12452331185340881, -0.12047212570905685, -0.1164209395647049, -0.11236975342035294, -0.10831856727600098, -0.10426738113164902, -0.10021619498729706, -0.0961650088429451, -0.09211382269859314, -0.08806263655424118, -0.08401145040988922, -0.07996026426553726, -0.0759090781211853, -0.07185789197683334, -0.06780670583248138, -0.06375551968812943, -0.059704333543777466, -0.05565314739942551, -0.05160196125507355, -0.04755077511072159, -0.04349958896636963, -0.03944840282201767, -0.03539721667766571, -0.03134603053331375, -0.027294844388961792, -0.023243658244609833, -0.019192472100257874, -0.015141285955905914, -0.011090099811553955, -0.007038913667201996, -0.0029877275228500366, 0.0010634586215019226, 0.005114644765853882, 0.009165830910205841, 0.0132170170545578, 0.01726820319890976, 0.02131938934326172, 0.025370575487613678, 0.029421761631965637, 0.033472947776317596, 0.037524133920669556, 0.041575320065021515, 0.045626506209373474, 0.04967769235372543, 0.05372887849807739, 0.05778006464242935, 0.06183125078678131, 0.06588243693113327, 0.06993362307548523, 0.07398480921983719, 0.07803599536418915, 0.08208718150854111, 0.08613836765289307, 0.09018955379724503, 0.09424073994159698, 0.09829192608594894, 0.1023431122303009, 0.10639429837465286, 0.11044548451900482, 0.11449667066335678, 0.11854785680770874]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 11.0, 22.0, 24.0, 48.0, 162.0, 429.0, 1871.0, 12830.0, 322268.0, 680551.0, 26403.0, 2952.0, 586.0, 212.0, 78.0, 32.0, 20.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06427001953125, -0.062064170837402344, -0.05985832214355469, -0.05765247344970703, -0.055446624755859375, -0.05324077606201172, -0.05103492736816406, -0.048829078674316406, -0.04662322998046875, -0.044417381286621094, -0.04221153259277344, -0.04000568389892578, -0.037799835205078125, -0.03559398651123047, -0.03338813781738281, -0.031182289123535156, -0.0289764404296875, -0.026770591735839844, -0.024564743041992188, -0.02235889434814453, -0.020153045654296875, -0.01794719696044922, -0.015741348266601562, -0.013535499572753906, -0.01132965087890625, -0.009123802185058594, -0.0069179534912109375, -0.004712104797363281, -0.002506256103515625, -0.00030040740966796875, 0.0019054412841796875, 0.004111289978027344, 0.006317138671875, 0.008522987365722656, 0.010728836059570312, 0.012934684753417969, 0.015140533447265625, 0.01734638214111328, 0.019552230834960938, 0.021758079528808594, 0.02396392822265625, 0.026169776916503906, 0.028375625610351562, 0.03058147430419922, 0.032787322998046875, 0.03499317169189453, 0.03719902038574219, 0.039404869079589844, 0.0416107177734375, 0.043816566467285156, 0.04602241516113281, 0.04822826385498047, 0.050434112548828125, 0.05263996124267578, 0.05484580993652344, 0.057051658630371094, 0.05925750732421875, 0.061463356018066406, 0.06366920471191406, 0.06587505340576172, 0.06808090209960938, 0.07028675079345703, 0.07249259948730469, 0.07469844818115234, 0.076904296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 22.0, 20.0, 31.0, 51.0, 61.0, 55.0, 70.0, 52.0, 86.0, 69.0, 90.0, 66.0, 62.0, 64.0, 48.0, 39.0, 18.0, 17.0, 15.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019500732421875, -0.018875837326049805, -0.01825094223022461, -0.017626047134399414, -0.01700115203857422, -0.016376256942749023, -0.015751361846923828, -0.015126466751098633, -0.014501571655273438, -0.013876676559448242, -0.013251781463623047, -0.012626886367797852, -0.012001991271972656, -0.011377096176147461, -0.010752201080322266, -0.01012730598449707, -0.009502410888671875, -0.00887751579284668, -0.008252620697021484, -0.007627725601196289, -0.007002830505371094, -0.0063779354095458984, -0.005753040313720703, -0.005128145217895508, -0.0045032501220703125, -0.003878355026245117, -0.003253459930419922, -0.0026285648345947266, -0.0020036697387695312, -0.001378774642944336, -0.0007538795471191406, -0.0001289844512939453, 0.00049591064453125, 0.0011208057403564453, 0.0017457008361816406, 0.002370595932006836, 0.0029954910278320312, 0.0036203861236572266, 0.004245281219482422, 0.004870176315307617, 0.0054950714111328125, 0.006119966506958008, 0.006744861602783203, 0.0073697566986083984, 0.007994651794433594, 0.008619546890258789, 0.009244441986083984, 0.00986933708190918, 0.010494232177734375, 0.01111912727355957, 0.011744022369384766, 0.012368917465209961, 0.012993812561035156, 0.013618707656860352, 0.014243602752685547, 0.014868497848510742, 0.015493392944335938, 0.016118288040161133, 0.016743183135986328, 0.017368078231811523, 0.01799297332763672, 0.018617868423461914, 0.01924276351928711, 0.019867658615112305, 0.0204925537109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 6.0, 13.0, 17.0, 32.0, 35.0, 85.0, 90.0, 154.0, 201.0, 384.0, 677.0, 1309.0, 3284.0, 10966.0, 59671.0, 569746.0, 348340.0, 40038.0, 8262.0, 2690.0, 1068.0, 556.0, 308.0, 208.0, 139.0, 79.0, 50.0, 35.0, 16.0, 16.0, 22.0, 9.0, 8.0, 8.0, 1.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.037139892578125, -0.03593778610229492, -0.034735679626464844, -0.033533573150634766, -0.03233146667480469, -0.03112936019897461, -0.02992725372314453, -0.028725147247314453, -0.027523040771484375, -0.026320934295654297, -0.02511882781982422, -0.02391672134399414, -0.022714614868164062, -0.021512508392333984, -0.020310401916503906, -0.019108295440673828, -0.01790618896484375, -0.016704082489013672, -0.015501976013183594, -0.014299869537353516, -0.013097763061523438, -0.01189565658569336, -0.010693550109863281, -0.009491443634033203, -0.008289337158203125, -0.007087230682373047, -0.005885124206542969, -0.004683017730712891, -0.0034809112548828125, -0.0022788047790527344, -0.0010766983032226562, 0.00012540817260742188, 0.0013275146484375, 0.002529621124267578, 0.0037317276000976562, 0.004933834075927734, 0.0061359405517578125, 0.007338047027587891, 0.008540153503417969, 0.009742259979248047, 0.010944366455078125, 0.012146472930908203, 0.013348579406738281, 0.01455068588256836, 0.015752792358398438, 0.016954898834228516, 0.018157005310058594, 0.019359111785888672, 0.02056121826171875, 0.021763324737548828, 0.022965431213378906, 0.024167537689208984, 0.025369644165039062, 0.02657175064086914, 0.02777385711669922, 0.028975963592529297, 0.030178070068359375, 0.03138017654418945, 0.03258228302001953, 0.03378438949584961, 0.03498649597167969, 0.036188602447509766, 0.037390708923339844, 0.03859281539916992, 0.039794921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 14.0, 10.0, 15.0, 17.0, 15.0, 19.0, 33.0, 22.0, 35.0, 50.0, 47.0, 51.0, 56.0, 53.0, 45.0, 55.0, 59.0, 52.0, 54.0, 48.0, 44.0, 31.0, 37.0, 32.0, 20.0, 17.0, 13.0, 8.0, 6.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04840087890625, -0.0467371940612793, -0.045073509216308594, -0.04340982437133789, -0.04174613952636719, -0.040082454681396484, -0.03841876983642578, -0.03675508499145508, -0.035091400146484375, -0.03342771530151367, -0.03176403045654297, -0.030100345611572266, -0.028436660766601562, -0.02677297592163086, -0.025109291076660156, -0.023445606231689453, -0.02178192138671875, -0.020118236541748047, -0.018454551696777344, -0.01679086685180664, -0.015127182006835938, -0.013463497161865234, -0.011799812316894531, -0.010136127471923828, -0.008472442626953125, -0.006808757781982422, -0.005145072937011719, -0.0034813880920410156, -0.0018177032470703125, -0.00015401840209960938, 0.0015096664428710938, 0.003173351287841797, 0.0048370361328125, 0.006500720977783203, 0.008164405822753906, 0.00982809066772461, 0.011491775512695312, 0.013155460357666016, 0.014819145202636719, 0.016482830047607422, 0.018146514892578125, 0.019810199737548828, 0.02147388458251953, 0.023137569427490234, 0.024801254272460938, 0.02646493911743164, 0.028128623962402344, 0.029792308807373047, 0.03145599365234375, 0.03311967849731445, 0.034783363342285156, 0.03644704818725586, 0.03811073303222656, 0.039774417877197266, 0.04143810272216797, 0.04310178756713867, 0.044765472412109375, 0.04642915725708008, 0.04809284210205078, 0.049756526947021484, 0.05142021179199219, 0.05308389663696289, 0.054747581481933594, 0.0564112663269043, 0.058074951171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 4.0, 2.0, 8.0, 9.0, 14.0, 11.0, 29.0, 36.0, 76.0, 123.0, 170.0, 288.0, 569.0, 1153.0, 2681.0, 9104.0, 508395.0, 511600.0, 9208.0, 2680.0, 1062.0, 528.0, 307.0, 183.0, 100.0, 48.0, 44.0, 34.0, 19.0, 13.0, 6.0, 9.0, 4.0, 9.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07330322265625, -0.07101249694824219, -0.06872177124023438, -0.06643104553222656, -0.06414031982421875, -0.06184959411621094, -0.059558868408203125, -0.05726814270019531, -0.0549774169921875, -0.05268669128417969, -0.050395965576171875, -0.04810523986816406, -0.04581451416015625, -0.04352378845214844, -0.041233062744140625, -0.03894233703613281, -0.036651611328125, -0.03436088562011719, -0.032070159912109375, -0.029779434204101562, -0.02748870849609375, -0.025197982788085938, -0.022907257080078125, -0.020616531372070312, -0.0183258056640625, -0.016035079956054688, -0.013744354248046875, -0.011453628540039062, -0.00916290283203125, -0.0068721771240234375, -0.004581451416015625, -0.0022907257080078125, 0.0, 0.0022907257080078125, 0.004581451416015625, 0.0068721771240234375, 0.00916290283203125, 0.011453628540039062, 0.013744354248046875, 0.016035079956054688, 0.0183258056640625, 0.020616531372070312, 0.022907257080078125, 0.025197982788085938, 0.02748870849609375, 0.029779434204101562, 0.032070159912109375, 0.03436088562011719, 0.036651611328125, 0.03894233703613281, 0.041233062744140625, 0.04352378845214844, 0.04581451416015625, 0.04810523986816406, 0.050395965576171875, 0.05268669128417969, 0.0549774169921875, 0.05726814270019531, 0.059558868408203125, 0.06184959411621094, 0.06414031982421875, 0.06643104553222656, 0.06872177124023438, 0.07101249694824219, 0.07330322265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 13.0, 4.0, 4.0, 15.0, 15.0, 16.0, 19.0, 24.0, 36.0, 60.0, 94.0, 134.0, 157.0, 116.0, 83.0, 55.0, 23.0, 32.0, 14.0, 16.0, 11.0, 10.0, 5.0, 5.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.8770179748535156e-05, -5.723442882299423e-05, -5.569867789745331e-05, -5.4162926971912384e-05, -5.262717604637146e-05, -5.1091425120830536e-05, -4.955567419528961e-05, -4.801992326974869e-05, -4.6484172344207764e-05, -4.494842141866684e-05, -4.3412670493125916e-05, -4.187691956758499e-05, -4.034116864204407e-05, -3.880541771650314e-05, -3.726966679096222e-05, -3.5733915865421295e-05, -3.419816493988037e-05, -3.266241401433945e-05, -3.112666308879852e-05, -2.95909121632576e-05, -2.8055161237716675e-05, -2.651941031217575e-05, -2.4983659386634827e-05, -2.3447908461093903e-05, -2.191215753555298e-05, -2.0376406610012054e-05, -1.884065568447113e-05, -1.7304904758930206e-05, -1.5769153833389282e-05, -1.4233402907848358e-05, -1.2697651982307434e-05, -1.116190105676651e-05, -9.626150131225586e-06, -8.090399205684662e-06, -6.554648280143738e-06, -5.018897354602814e-06, -3.4831464290618896e-06, -1.9473955035209656e-06, -4.116445779800415e-07, 1.1241063475608826e-06, 2.6598572731018066e-06, 4.195608198642731e-06, 5.731359124183655e-06, 7.267110049724579e-06, 8.802860975265503e-06, 1.0338611900806427e-05, 1.1874362826347351e-05, 1.3410113751888275e-05, 1.49458646774292e-05, 1.6481615602970123e-05, 1.8017366528511047e-05, 1.955311745405197e-05, 2.1088868379592896e-05, 2.262461930513382e-05, 2.4160370230674744e-05, 2.5696121156215668e-05, 2.7231872081756592e-05, 2.8767623007297516e-05, 3.030337393283844e-05, 3.1839124858379364e-05, 3.337487578392029e-05, 3.491062670946121e-05, 3.6446377635002136e-05, 3.798212856054306e-05, 3.9517879486083984e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 10.0, 8.0, 7.0, 12.0, 19.0, 23.0, 20.0, 43.0, 68.0, 90.0, 177.0, 351.0, 690.0, 1521.0, 3946.0, 14294.0, 148026.0, 818587.0, 47611.0, 7927.0, 2686.0, 1187.0, 555.0, 276.0, 143.0, 103.0, 43.0, 33.0, 23.0, 16.0, 15.0, 8.0, 3.0, 8.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0341796875, -0.033121585845947266, -0.03206348419189453, -0.031005382537841797, -0.029947280883789062, -0.028889179229736328, -0.027831077575683594, -0.02677297592163086, -0.025714874267578125, -0.02465677261352539, -0.023598670959472656, -0.022540569305419922, -0.021482467651367188, -0.020424365997314453, -0.01936626434326172, -0.018308162689208984, -0.01725006103515625, -0.016191959381103516, -0.015133857727050781, -0.014075756072998047, -0.013017654418945312, -0.011959552764892578, -0.010901451110839844, -0.00984334945678711, -0.008785247802734375, -0.007727146148681641, -0.006669044494628906, -0.005610942840576172, -0.0045528411865234375, -0.003494739532470703, -0.0024366378784179688, -0.0013785362243652344, -0.0003204345703125, 0.0007376670837402344, 0.0017957687377929688, 0.002853870391845703, 0.0039119720458984375, 0.004970073699951172, 0.006028175354003906, 0.007086277008056641, 0.008144378662109375, 0.00920248031616211, 0.010260581970214844, 0.011318683624267578, 0.012376785278320312, 0.013434886932373047, 0.014492988586425781, 0.015551090240478516, 0.01660919189453125, 0.017667293548583984, 0.01872539520263672, 0.019783496856689453, 0.020841598510742188, 0.021899700164794922, 0.022957801818847656, 0.02401590347290039, 0.025074005126953125, 0.02613210678100586, 0.027190208435058594, 0.028248310089111328, 0.029306411743164062, 0.030364513397216797, 0.03142261505126953, 0.032480716705322266, 0.033538818359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 7.0, 8.0, 16.0, 21.0, 19.0, 40.0, 49.0, 51.0, 79.0, 99.0, 96.0, 99.0, 89.0, 70.0, 68.0, 45.0, 27.0, 26.0, 16.0, 13.0, 11.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.020294189453125, -0.019695281982421875, -0.01909637451171875, -0.018497467041015625, -0.0178985595703125, -0.017299652099609375, -0.01670074462890625, -0.016101837158203125, -0.0155029296875, -0.014904022216796875, -0.01430511474609375, -0.013706207275390625, -0.0131072998046875, -0.012508392333984375, -0.01190948486328125, -0.011310577392578125, -0.010711669921875, -0.010112762451171875, -0.00951385498046875, -0.008914947509765625, -0.0083160400390625, -0.007717132568359375, -0.00711822509765625, -0.006519317626953125, -0.00592041015625, -0.005321502685546875, -0.00472259521484375, -0.004123687744140625, -0.0035247802734375, -0.002925872802734375, -0.00232696533203125, -0.001728057861328125, -0.001129150390625, -0.000530242919921875, 6.866455078125e-05, 0.000667572021484375, 0.0012664794921875, 0.001865386962890625, 0.00246429443359375, 0.003063201904296875, 0.003662109375, 0.004261016845703125, 0.00485992431640625, 0.005458831787109375, 0.0060577392578125, 0.006656646728515625, 0.00725555419921875, 0.007854461669921875, 0.008453369140625, 0.009052276611328125, 0.00965118408203125, 0.010250091552734375, 0.0108489990234375, 0.011447906494140625, 0.01204681396484375, 0.012645721435546875, 0.01324462890625, 0.013843536376953125, 0.01444244384765625, 0.015041351318359375, 0.0156402587890625, 0.016239166259765625, 0.01683807373046875, 0.017436981201171875, 0.018035888671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 29.0, 101.0, 571.0, 261.0, 30.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6955938339233398, -1.6507084369659424, -1.6058229207992554, -1.560937523841858, -1.516052007675171, -1.4711666107177734, -1.426281213760376, -1.3813958168029785, -1.3365103006362915, -1.291624903678894, -1.246739387512207, -1.2018539905548096, -1.156968593597412, -1.112083077430725, -1.0671976804733276, -1.0223121643066406, -0.9774267673492432, -0.9325413107872009, -0.8876558542251587, -0.8427704572677612, -0.797885000705719, -0.7529995441436768, -0.7081141471862793, -0.6632286906242371, -0.6183432340621948, -0.5734577775001526, -0.5285723209381104, -0.4836869239807129, -0.43880146741867065, -0.3939160108566284, -0.34903058409690857, -0.3041451573371887, -0.2592597007751465, -0.21437425911426544, -0.1694888174533844, -0.12460337579250336, -0.07971793413162231, -0.03483249247074127, 0.01005294919013977, 0.05493837594985962, 0.09982383251190186, 0.1447092741727829, 0.18959471583366394, 0.23448015749454498, 0.279365599155426, 0.32425105571746826, 0.3691364824771881, 0.41402190923690796, 0.4589073657989502, 0.5037928223609924, 0.5486782789230347, 0.5935636758804321, 0.6384491324424744, 0.6833345890045166, 0.7282199859619141, 0.7731054425239563, 0.8179908990859985, 0.8628763556480408, 0.907761812210083, 0.9526472091674805, 0.9975326657295227, 1.042418122291565, 1.0873035192489624, 1.1321890354156494, 1.1770744323730469]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 10.0, 5.0, 5.0, 6.0, 11.0, 10.0, 22.0, 17.0, 24.0, 26.0, 28.0, 32.0, 30.0, 23.0, 41.0, 51.0, 57.0, 66.0, 65.0, 51.0, 50.0, 28.0, 41.0, 48.0, 34.0, 33.0, 27.0, 24.0, 27.0, 19.0, 13.0, 17.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.226351797580719, -0.21975180506706238, -0.21315181255340576, -0.20655182003974915, -0.19995182752609253, -0.1933518350124359, -0.1867518573999405, -0.18015186488628387, -0.17355187237262726, -0.16695187985897064, -0.16035188734531403, -0.1537518948316574, -0.147151917219162, -0.14055192470550537, -0.13395193219184875, -0.12735193967819214, -0.12075194716453552, -0.1141519546508789, -0.10755196213722229, -0.10095197707414627, -0.09435198456048965, -0.08775199204683304, -0.08115200698375702, -0.0745520144701004, -0.06795202195644379, -0.06135202944278717, -0.05475204065442085, -0.048152051866054535, -0.04155205935239792, -0.0349520668387413, -0.028352078050374985, -0.021752089262008667, -0.01515209674835205, -0.008552106097340584, -0.0019521154463291168, 0.00464787520468235, 0.011247865855693817, 0.017847858369350433, 0.02444784715771675, 0.03104783594608307, 0.037647828459739685, 0.0442478209733963, 0.05084780976176262, 0.05744779855012894, 0.06404779106378555, 0.07064778357744217, 0.07724776864051819, 0.0838477611541748, 0.09044775366783142, 0.09704774618148804, 0.10364773869514465, 0.11024772375822067, 0.11684771627187729, 0.1234477087855339, 0.13004769384860992, 0.13664768636226654, 0.14324767887592316, 0.14984767138957977, 0.1564476639032364, 0.163047656416893, 0.16964763402938843, 0.17624762654304504, 0.18284761905670166, 0.18944761157035828, 0.1960476040840149]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 12.0, 20.0, 33.0, 57.0, 108.0, 342.0, 2243.0, 649141.0, 3538292.0, 3303.0, 383.0, 145.0, 75.0, 52.0, 34.0, 14.0, 8.0, 8.0, 10.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050872802734375, -0.04665803909301758, -0.042443275451660156, -0.038228511810302734, -0.03401374816894531, -0.02979898452758789, -0.02558422088623047, -0.021369457244873047, -0.017154693603515625, -0.012939929962158203, -0.008725166320800781, -0.004510402679443359, -0.0002956390380859375, 0.003919124603271484, 0.008133888244628906, 0.012348651885986328, 0.01656341552734375, 0.020778179168701172, 0.024992942810058594, 0.029207706451416016, 0.03342247009277344, 0.03763723373413086, 0.04185199737548828, 0.0460667610168457, 0.050281524658203125, 0.05449628829956055, 0.05871105194091797, 0.06292581558227539, 0.06714057922363281, 0.07135534286499023, 0.07557010650634766, 0.07978487014770508, 0.0839996337890625, 0.08821439743041992, 0.09242916107177734, 0.09664392471313477, 0.10085868835449219, 0.10507345199584961, 0.10928821563720703, 0.11350297927856445, 0.11771774291992188, 0.1219325065612793, 0.12614727020263672, 0.13036203384399414, 0.13457679748535156, 0.13879156112670898, 0.1430063247680664, 0.14722108840942383, 0.15143585205078125, 0.15565061569213867, 0.1598653793334961, 0.16408014297485352, 0.16829490661621094, 0.17250967025756836, 0.17672443389892578, 0.1809391975402832, 0.18515396118164062, 0.18936872482299805, 0.19358348846435547, 0.1977982521057129, 0.2020130157470703, 0.20622777938842773, 0.21044254302978516, 0.21465730667114258, 0.2188720703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 14.0, 18.0, 30.0, 27.0, 41.0, 50.0, 73.0, 68.0, 70.0, 95.0, 84.0, 77.0, 65.0, 64.0, 46.0, 44.0, 40.0, 22.0, 18.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0237274169921875, -0.023083925247192383, -0.022440433502197266, -0.02179694175720215, -0.02115345001220703, -0.020509958267211914, -0.019866466522216797, -0.01922297477722168, -0.018579483032226562, -0.017935991287231445, -0.017292499542236328, -0.01664900779724121, -0.016005516052246094, -0.015362024307250977, -0.01471853256225586, -0.014075040817260742, -0.013431549072265625, -0.012788057327270508, -0.01214456558227539, -0.011501073837280273, -0.010857582092285156, -0.010214090347290039, -0.009570598602294922, -0.008927106857299805, -0.008283615112304688, -0.00764012336730957, -0.006996631622314453, -0.006353139877319336, -0.005709648132324219, -0.0050661563873291016, -0.004422664642333984, -0.003779172897338867, -0.00313568115234375, -0.002492189407348633, -0.0018486976623535156, -0.0012052059173583984, -0.0005617141723632812, 8.177757263183594e-05, 0.0007252693176269531, 0.0013687610626220703, 0.0020122528076171875, 0.0026557445526123047, 0.003299236297607422, 0.003942728042602539, 0.004586219787597656, 0.0052297115325927734, 0.005873203277587891, 0.006516695022583008, 0.007160186767578125, 0.007803678512573242, 0.00844717025756836, 0.009090662002563477, 0.009734153747558594, 0.010377645492553711, 0.011021137237548828, 0.011664628982543945, 0.012308120727539062, 0.01295161247253418, 0.013595104217529297, 0.014238595962524414, 0.014882087707519531, 0.015525579452514648, 0.016169071197509766, 0.016812562942504883, 0.0174560546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 15.0, 10.0, 18.0, 21.0, 26.0, 53.0, 68.0, 81.0, 192.0, 434.0, 1425.0, 8271.0, 129836.0, 3949546.0, 93662.0, 7759.0, 1648.0, 550.0, 248.0, 112.0, 74.0, 56.0, 46.0, 33.0, 32.0, 17.0, 11.0, 10.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0782470703125, -0.07609987258911133, -0.07395267486572266, -0.07180547714233398, -0.06965827941894531, -0.06751108169555664, -0.06536388397216797, -0.0632166862487793, -0.061069488525390625, -0.05892229080200195, -0.05677509307861328, -0.05462789535522461, -0.05248069763183594, -0.050333499908447266, -0.048186302185058594, -0.04603910446166992, -0.04389190673828125, -0.04174470901489258, -0.039597511291503906, -0.037450313568115234, -0.03530311584472656, -0.03315591812133789, -0.03100872039794922, -0.028861522674560547, -0.026714324951171875, -0.024567127227783203, -0.02241992950439453, -0.02027273178100586, -0.018125534057617188, -0.015978336334228516, -0.013831138610839844, -0.011683940887451172, -0.0095367431640625, -0.007389545440673828, -0.005242347717285156, -0.0030951499938964844, -0.0009479522705078125, 0.0011992454528808594, 0.0033464431762695312, 0.005493640899658203, 0.007640838623046875, 0.009788036346435547, 0.011935234069824219, 0.01408243179321289, 0.016229629516601562, 0.018376827239990234, 0.020524024963378906, 0.022671222686767578, 0.02481842041015625, 0.026965618133544922, 0.029112815856933594, 0.031260013580322266, 0.03340721130371094, 0.03555440902709961, 0.03770160675048828, 0.03984880447387695, 0.041996002197265625, 0.0441431999206543, 0.04629039764404297, 0.04843759536743164, 0.05058479309082031, 0.052731990814208984, 0.054879188537597656, 0.05702638626098633, 0.059173583984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 10.0, 5.0, 10.0, 18.0, 20.0, 27.0, 42.0, 46.0, 68.0, 130.0, 249.0, 635.0, 1053.0, 840.0, 351.0, 165.0, 111.0, 66.0, 51.0, 36.0, 30.0, 31.0, 11.0, 9.0, 13.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.031982421875, -0.030908584594726562, -0.029834747314453125, -0.028760910034179688, -0.02768707275390625, -0.026613235473632812, -0.025539398193359375, -0.024465560913085938, -0.0233917236328125, -0.022317886352539062, -0.021244049072265625, -0.020170211791992188, -0.01909637451171875, -0.018022537231445312, -0.016948699951171875, -0.015874862670898438, -0.014801025390625, -0.013727188110351562, -0.012653350830078125, -0.011579513549804688, -0.01050567626953125, -0.009431838989257812, -0.008358001708984375, -0.0072841644287109375, -0.0062103271484375, -0.0051364898681640625, -0.004062652587890625, -0.0029888153076171875, -0.00191497802734375, -0.0008411407470703125, 0.000232696533203125, 0.0013065338134765625, 0.00238037109375, 0.0034542083740234375, 0.004528045654296875, 0.0056018829345703125, 0.00667572021484375, 0.0077495574951171875, 0.008823394775390625, 0.009897232055664062, 0.0109710693359375, 0.012044906616210938, 0.013118743896484375, 0.014192581176757812, 0.01526641845703125, 0.016340255737304688, 0.017414093017578125, 0.018487930297851562, 0.019561767578125, 0.020635604858398438, 0.021709442138671875, 0.022783279418945312, 0.02385711669921875, 0.024930953979492188, 0.026004791259765625, 0.027078628540039062, 0.0281524658203125, 0.029226303100585938, 0.030300140380859375, 0.03137397766113281, 0.03244781494140625, 0.03352165222167969, 0.034595489501953125, 0.03566932678222656, 0.0367431640625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 5.0, 11.0, 12.0, 39.0, 58.0, 167.0, 235.0, 249.0, 119.0, 44.0, 24.0, 18.0, 10.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5413346290588379, -0.5231657028198242, -0.5049967765808105, -0.4868278503417969, -0.4686588943004608, -0.45048996806144714, -0.43232104182243347, -0.4141520857810974, -0.39598315954208374, -0.37781423330307007, -0.3596453070640564, -0.3414763808250427, -0.32330742478370667, -0.305138498544693, -0.2869695723056793, -0.26880061626434326, -0.250631719827652, -0.2324627935886383, -0.21429385244846344, -0.19612492620944977, -0.1779559850692749, -0.15978705883026123, -0.14161813259124756, -0.12344919145107269, -0.10528026521205902, -0.08711133152246475, -0.06894239783287048, -0.05077347159385681, -0.03260453790426254, -0.014435604214668274, 0.003733322024345398, 0.021902263164520264, 0.040071189403533936, 0.058240123093128204, 0.07640905678272247, 0.09457798302173615, 0.11274691671133041, 0.13091585040092468, 0.14908477663993835, 0.16725371778011322, 0.1854226440191269, 0.20359157025814056, 0.22176051139831543, 0.2399294376373291, 0.2580983638763428, 0.27626729011535645, 0.2944362163543701, 0.3126051723957062, 0.33077409863471985, 0.3489430248737335, 0.3671119511127472, 0.38528090715408325, 0.4034498333930969, 0.4216187596321106, 0.43978768587112427, 0.45795661211013794, 0.4761255383491516, 0.4942944645881653, 0.512463390827179, 0.5306323170661926, 0.5488012433052063, 0.5669702291488647, 0.5851391553878784, 0.6033080816268921, 0.6214770078659058]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 2.0, 5.0, 7.0, 12.0, 11.0, 11.0, 17.0, 12.0, 29.0, 28.0, 24.0, 56.0, 35.0, 48.0, 57.0, 39.0, 52.0, 53.0, 38.0, 57.0, 56.0, 44.0, 45.0, 27.0, 32.0, 21.0, 30.0, 24.0, 23.0, 23.0, 15.0, 20.0, 13.0, 5.0, 5.0, 4.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15900921821594238, -0.15388479828834534, -0.1487603783607483, -0.14363594353199005, -0.138511523604393, -0.13338710367679596, -0.12826266884803772, -0.12313824892044067, -0.11801382899284363, -0.11288940906524658, -0.10776498168706894, -0.1026405543088913, -0.09751613438129425, -0.0923917144536972, -0.08726728707551956, -0.08214285969734192, -0.07701843976974487, -0.07189401984214783, -0.06676959246397018, -0.06164516881108284, -0.056520745158195496, -0.05139632150530815, -0.04627189785242081, -0.04114747419953346, -0.03602305054664612, -0.030898626893758774, -0.02577420324087143, -0.020649779587984085, -0.01552535593509674, -0.010400932282209396, -0.005276508629322052, -0.00015208497643470764, 0.004972338676452637, 0.010096762329339981, 0.015221185982227325, 0.02034560963511467, 0.025470033288002014, 0.03059445694088936, 0.0357188805937767, 0.04084330424666405, 0.04596772789955139, 0.051092151552438736, 0.05621657520532608, 0.061340998858213425, 0.06646542251110077, 0.07158984243869781, 0.07671426981687546, 0.0818386971950531, 0.08696311712265015, 0.09208753705024719, 0.09721196442842484, 0.10233639180660248, 0.10746081173419952, 0.11258523166179657, 0.11770965903997421, 0.12283408641815186, 0.1279585063457489, 0.13308292627334595, 0.138207346200943, 0.14333178102970123, 0.14845620095729828, 0.15358062088489532, 0.15870505571365356, 0.1638294756412506, 0.16895389556884766]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 7.0, 8.0, 9.0, 10.0, 23.0, 21.0, 30.0, 75.0, 145.0, 252.0, 523.0, 1409.0, 3740.0, 11525.0, 42212.0, 169236.0, 458044.0, 266281.0, 68443.0, 17936.0, 5316.0, 1867.0, 729.0, 328.0, 176.0, 87.0, 40.0, 25.0, 13.0, 14.0, 11.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0272369384765625, -0.026215791702270508, -0.025194644927978516, -0.024173498153686523, -0.02315235137939453, -0.02213120460510254, -0.021110057830810547, -0.020088911056518555, -0.019067764282226562, -0.01804661750793457, -0.017025470733642578, -0.016004323959350586, -0.014983177185058594, -0.013962030410766602, -0.01294088363647461, -0.011919736862182617, -0.010898590087890625, -0.009877443313598633, -0.00885629653930664, -0.007835149765014648, -0.006814002990722656, -0.005792856216430664, -0.004771709442138672, -0.0037505626678466797, -0.0027294158935546875, -0.0017082691192626953, -0.0006871223449707031, 0.00033402442932128906, 0.0013551712036132812, 0.0023763179779052734, 0.0033974647521972656, 0.004418611526489258, 0.00543975830078125, 0.006460905075073242, 0.007482051849365234, 0.008503198623657227, 0.009524345397949219, 0.010545492172241211, 0.011566638946533203, 0.012587785720825195, 0.013608932495117188, 0.01463007926940918, 0.015651226043701172, 0.016672372817993164, 0.017693519592285156, 0.01871466636657715, 0.01973581314086914, 0.020756959915161133, 0.021778106689453125, 0.022799253463745117, 0.02382040023803711, 0.0248415470123291, 0.025862693786621094, 0.026883840560913086, 0.027904987335205078, 0.02892613410949707, 0.029947280883789062, 0.030968427658081055, 0.03198957443237305, 0.03301072120666504, 0.03403186798095703, 0.03505301475524902, 0.036074161529541016, 0.03709530830383301, 0.038116455078125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 18.0, 17.0, 33.0, 29.0, 35.0, 51.0, 65.0, 58.0, 66.0, 75.0, 70.0, 70.0, 61.0, 63.0, 51.0, 45.0, 43.0, 24.0, 22.0, 23.0, 12.0, 15.0, 11.0, 6.0, 6.0, 2.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0211944580078125, -0.020598173141479492, -0.020001888275146484, -0.019405603408813477, -0.01880931854248047, -0.01821303367614746, -0.017616748809814453, -0.017020463943481445, -0.016424179077148438, -0.01582789421081543, -0.015231609344482422, -0.014635324478149414, -0.014039039611816406, -0.013442754745483398, -0.01284646987915039, -0.012250185012817383, -0.011653900146484375, -0.011057615280151367, -0.01046133041381836, -0.009865045547485352, -0.009268760681152344, -0.008672475814819336, -0.008076190948486328, -0.00747990608215332, -0.0068836212158203125, -0.006287336349487305, -0.005691051483154297, -0.005094766616821289, -0.004498481750488281, -0.0039021968841552734, -0.0033059120178222656, -0.002709627151489258, -0.00211334228515625, -0.0015170574188232422, -0.0009207725524902344, -0.00032448768615722656, 0.00027179718017578125, 0.0008680820465087891, 0.0014643669128417969, 0.0020606517791748047, 0.0026569366455078125, 0.0032532215118408203, 0.003849506378173828, 0.004445791244506836, 0.005042076110839844, 0.0056383609771728516, 0.006234645843505859, 0.006830930709838867, 0.007427215576171875, 0.008023500442504883, 0.00861978530883789, 0.009216070175170898, 0.009812355041503906, 0.010408639907836914, 0.011004924774169922, 0.01160120964050293, 0.012197494506835938, 0.012793779373168945, 0.013390064239501953, 0.013986349105834961, 0.014582633972167969, 0.015178918838500977, 0.015775203704833984, 0.016371488571166992, 0.0169677734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 7.0, 16.0, 7.0, 16.0, 23.0, 18.0, 34.0, 59.0, 61.0, 135.0, 192.0, 291.0, 478.0, 932.0, 1773.0, 4521.0, 17330.0, 166408.0, 771772.0, 67857.0, 10104.0, 3187.0, 1399.0, 739.0, 442.0, 242.0, 152.0, 100.0, 70.0, 55.0, 32.0, 23.0, 14.0, 10.0, 7.0, 8.0, 9.0, 4.0, 4.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06573486328125, -0.06370162963867188, -0.06166839599609375, -0.059635162353515625, -0.0576019287109375, -0.055568695068359375, -0.05353546142578125, -0.051502227783203125, -0.049468994140625, -0.047435760498046875, -0.04540252685546875, -0.043369293212890625, -0.0413360595703125, -0.039302825927734375, -0.03726959228515625, -0.035236358642578125, -0.033203125, -0.031169891357421875, -0.02913665771484375, -0.027103424072265625, -0.0250701904296875, -0.023036956787109375, -0.02100372314453125, -0.018970489501953125, -0.016937255859375, -0.014904022216796875, -0.01287078857421875, -0.010837554931640625, -0.0088043212890625, -0.006771087646484375, -0.00473785400390625, -0.002704620361328125, -0.00067138671875, 0.001361846923828125, 0.00339508056640625, 0.005428314208984375, 0.0074615478515625, 0.009494781494140625, 0.01152801513671875, 0.013561248779296875, 0.015594482421875, 0.017627716064453125, 0.01966094970703125, 0.021694183349609375, 0.0237274169921875, 0.025760650634765625, 0.02779388427734375, 0.029827117919921875, 0.0318603515625, 0.033893585205078125, 0.03592681884765625, 0.037960052490234375, 0.0399932861328125, 0.042026519775390625, 0.04405975341796875, 0.046092987060546875, 0.048126220703125, 0.050159454345703125, 0.05219268798828125, 0.054225921630859375, 0.0562591552734375, 0.058292388916015625, 0.06032562255859375, 0.062358856201171875, 0.06439208984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 6.0, 6.0, 10.0, 12.0, 21.0, 14.0, 17.0, 30.0, 28.0, 38.0, 41.0, 37.0, 46.0, 54.0, 51.0, 45.0, 50.0, 53.0, 64.0, 51.0, 55.0, 39.0, 27.0, 36.0, 22.0, 28.0, 28.0, 16.0, 15.0, 9.0, 3.0, 12.0, 10.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0634765625, -0.061443328857421875, -0.05941009521484375, -0.057376861572265625, -0.0553436279296875, -0.053310394287109375, -0.05127716064453125, -0.049243927001953125, -0.047210693359375, -0.045177459716796875, -0.04314422607421875, -0.041110992431640625, -0.0390777587890625, -0.037044525146484375, -0.03501129150390625, -0.032978057861328125, -0.03094482421875, -0.028911590576171875, -0.02687835693359375, -0.024845123291015625, -0.0228118896484375, -0.020778656005859375, -0.01874542236328125, -0.016712188720703125, -0.014678955078125, -0.012645721435546875, -0.01061248779296875, -0.008579254150390625, -0.0065460205078125, -0.004512786865234375, -0.00247955322265625, -0.000446319580078125, 0.0015869140625, 0.003620147705078125, 0.00565338134765625, 0.007686614990234375, 0.0097198486328125, 0.011753082275390625, 0.01378631591796875, 0.015819549560546875, 0.017852783203125, 0.019886016845703125, 0.02191925048828125, 0.023952484130859375, 0.0259857177734375, 0.028018951416015625, 0.03005218505859375, 0.032085418701171875, 0.03411865234375, 0.036151885986328125, 0.03818511962890625, 0.040218353271484375, 0.0422515869140625, 0.044284820556640625, 0.04631805419921875, 0.048351287841796875, 0.050384521484375, 0.052417755126953125, 0.05445098876953125, 0.056484222412109375, 0.0585174560546875, 0.060550689697265625, 0.06258392333984375, 0.06461715698242188, 0.066650390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 5.0, 17.0, 18.0, 29.0, 28.0, 51.0, 66.0, 101.0, 150.0, 239.0, 438.0, 722.0, 1157.0, 2135.0, 4280.0, 10792.0, 49205.0, 919576.0, 40746.0, 9907.0, 4026.0, 2007.0, 1083.0, 632.0, 401.0, 250.0, 145.0, 110.0, 69.0, 49.0, 33.0, 21.0, 15.0, 10.0, 6.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0], "bins": [-0.07757568359375, -0.07560968399047852, -0.07364368438720703, -0.07167768478393555, -0.06971168518066406, -0.06774568557739258, -0.0657796859741211, -0.06381368637084961, -0.061847686767578125, -0.05988168716430664, -0.057915687561035156, -0.05594968795776367, -0.05398368835449219, -0.0520176887512207, -0.05005168914794922, -0.048085689544677734, -0.04611968994140625, -0.044153690338134766, -0.04218769073486328, -0.0402216911315918, -0.03825569152832031, -0.03628969192504883, -0.034323692321777344, -0.03235769271850586, -0.030391693115234375, -0.02842569351196289, -0.026459693908691406, -0.024493694305419922, -0.022527694702148438, -0.020561695098876953, -0.01859569549560547, -0.016629695892333984, -0.0146636962890625, -0.012697696685791016, -0.010731697082519531, -0.008765697479248047, -0.0067996978759765625, -0.004833698272705078, -0.0028676986694335938, -0.0009016990661621094, 0.001064300537109375, 0.0030303001403808594, 0.004996299743652344, 0.006962299346923828, 0.008928298950195312, 0.010894298553466797, 0.012860298156738281, 0.014826297760009766, 0.01679229736328125, 0.018758296966552734, 0.02072429656982422, 0.022690296173095703, 0.024656295776367188, 0.026622295379638672, 0.028588294982910156, 0.03055429458618164, 0.032520294189453125, 0.03448629379272461, 0.036452293395996094, 0.03841829299926758, 0.04038429260253906, 0.04235029220581055, 0.04431629180908203, 0.046282291412353516, 0.048248291015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 12.0, 7.0, 13.0, 14.0, 16.0, 15.0, 26.0, 32.0, 45.0, 58.0, 73.0, 123.0, 138.0, 101.0, 71.0, 47.0, 35.0, 26.0, 24.0, 19.0, 9.0, 16.0, 15.0, 7.0, 11.0, 7.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.704164505004883e-05, -5.546770989894867e-05, -5.389377474784851e-05, -5.231983959674835e-05, -5.074590444564819e-05, -4.9171969294548035e-05, -4.7598034143447876e-05, -4.602409899234772e-05, -4.445016384124756e-05, -4.28762286901474e-05, -4.130229353904724e-05, -3.972835838794708e-05, -3.8154423236846924e-05, -3.6580488085746765e-05, -3.5006552934646606e-05, -3.343261778354645e-05, -3.185868263244629e-05, -3.028474748134613e-05, -2.871081233024597e-05, -2.7136877179145813e-05, -2.5562942028045654e-05, -2.3989006876945496e-05, -2.2415071725845337e-05, -2.0841136574745178e-05, -1.926720142364502e-05, -1.769326627254486e-05, -1.6119331121444702e-05, -1.4545395970344543e-05, -1.2971460819244385e-05, -1.1397525668144226e-05, -9.823590517044067e-06, -8.249655365943909e-06, -6.67572021484375e-06, -5.101785063743591e-06, -3.5278499126434326e-06, -1.953914761543274e-06, -3.7997961044311523e-07, 1.1939555406570435e-06, 2.767890691757202e-06, 4.341825842857361e-06, 5.9157609939575195e-06, 7.489696145057678e-06, 9.063631296157837e-06, 1.0637566447257996e-05, 1.2211501598358154e-05, 1.3785436749458313e-05, 1.535937190055847e-05, 1.693330705165863e-05, 1.850724220275879e-05, 2.0081177353858948e-05, 2.1655112504959106e-05, 2.3229047656059265e-05, 2.4802982807159424e-05, 2.6376917958259583e-05, 2.795085310935974e-05, 2.95247882604599e-05, 3.109872341156006e-05, 3.267265856266022e-05, 3.4246593713760376e-05, 3.5820528864860535e-05, 3.739446401596069e-05, 3.896839916706085e-05, 4.054233431816101e-05, 4.211626946926117e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 7.0, 11.0, 16.0, 34.0, 43.0, 77.0, 133.0, 286.0, 609.0, 1598.0, 5101.0, 31058.0, 976125.0, 26047.0, 4674.0, 1473.0, 642.0, 284.0, 136.0, 69.0, 42.0, 23.0, 23.0, 14.0, 11.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096923828125, -0.09363460540771484, -0.09034538269042969, -0.08705615997314453, -0.08376693725585938, -0.08047771453857422, -0.07718849182128906, -0.0738992691040039, -0.07061004638671875, -0.0673208236694336, -0.06403160095214844, -0.06074237823486328, -0.057453155517578125, -0.05416393280029297, -0.05087471008300781, -0.047585487365722656, -0.0442962646484375, -0.041007041931152344, -0.03771781921386719, -0.03442859649658203, -0.031139373779296875, -0.02785015106201172, -0.024560928344726562, -0.021271705627441406, -0.01798248291015625, -0.014693260192871094, -0.011404037475585938, -0.008114814758300781, -0.004825592041015625, -0.0015363693237304688, 0.0017528533935546875, 0.005042076110839844, 0.008331298828125, 0.011620521545410156, 0.014909744262695312, 0.01819896697998047, 0.021488189697265625, 0.02477741241455078, 0.028066635131835938, 0.031355857849121094, 0.03464508056640625, 0.037934303283691406, 0.04122352600097656, 0.04451274871826172, 0.047801971435546875, 0.05109119415283203, 0.05438041687011719, 0.057669639587402344, 0.0609588623046875, 0.06424808502197266, 0.06753730773925781, 0.07082653045654297, 0.07411575317382812, 0.07740497589111328, 0.08069419860839844, 0.0839834213256836, 0.08727264404296875, 0.0905618667602539, 0.09385108947753906, 0.09714031219482422, 0.10042953491210938, 0.10371875762939453, 0.10700798034667969, 0.11029720306396484, 0.11358642578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 10.0, 14.0, 26.0, 81.0, 277.0, 357.0, 136.0, 37.0, 19.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10443115234375, -0.10169124603271484, -0.09895133972167969, -0.09621143341064453, -0.09347152709960938, -0.09073162078857422, -0.08799171447753906, -0.0852518081665039, -0.08251190185546875, -0.0797719955444336, -0.07703208923339844, -0.07429218292236328, -0.07155227661132812, -0.06881237030029297, -0.06607246398925781, -0.06333255767822266, -0.0605926513671875, -0.057852745056152344, -0.05511283874511719, -0.05237293243408203, -0.049633026123046875, -0.04689311981201172, -0.04415321350097656, -0.041413307189941406, -0.03867340087890625, -0.035933494567871094, -0.03319358825683594, -0.03045368194580078, -0.027713775634765625, -0.02497386932373047, -0.022233963012695312, -0.019494056701660156, -0.016754150390625, -0.014014244079589844, -0.011274337768554688, -0.008534431457519531, -0.005794525146484375, -0.0030546188354492188, -0.0003147125244140625, 0.0024251937866210938, 0.00516510009765625, 0.007905006408691406, 0.010644912719726562, 0.013384819030761719, 0.016124725341796875, 0.01886463165283203, 0.021604537963867188, 0.024344444274902344, 0.0270843505859375, 0.029824256896972656, 0.03256416320800781, 0.03530406951904297, 0.038043975830078125, 0.04078388214111328, 0.04352378845214844, 0.046263694763183594, 0.04900360107421875, 0.051743507385253906, 0.05448341369628906, 0.05722332000732422, 0.059963226318359375, 0.06270313262939453, 0.06544303894042969, 0.06818294525146484, 0.0709228515625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 29.0, 75.0, 234.0, 377.0, 159.0, 64.0, 36.0, 4.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7154682874679565, -0.6739500761032104, -0.6324318051338196, -0.5909135937690735, -0.5493953227996826, -0.5078771114349365, -0.46635890007019043, -0.42484065890312195, -0.38332241773605347, -0.341804176568985, -0.3002859354019165, -0.2587677240371704, -0.21724948287010193, -0.17573124170303345, -0.13421301543712616, -0.09269478917121887, -0.05117654800415039, -0.009658314287662506, 0.03185991942882538, 0.07337815314531326, 0.11489638686180115, 0.15641462802886963, 0.19793285429477692, 0.2394510805606842, 0.2809693217277527, 0.32248756289482117, 0.36400580406188965, 0.40552401542663574, 0.4470422565937042, 0.4885604977607727, 0.5300787091255188, 0.5715969800949097, 0.6131151914596558, 0.6546334028244019, 0.6961516737937927, 0.7376698851585388, 0.7791881561279297, 0.8207063674926758, 0.8622245788574219, 0.903742790222168, 0.9452610611915588, 0.9867792725563049, 1.0282975435256958, 1.069815754890442, 1.111333966255188, 1.1528522968292236, 1.1943705081939697, 1.2358887195587158, 1.277406930923462, 1.318925142288208, 1.360443353652954, 1.4019616842269897, 1.4434798955917358, 1.484998106956482, 1.526516318321228, 1.5680345296859741, 1.6095528602600098, 1.6510710716247559, 1.692589282989502, 1.7341076135635376, 1.7756258249282837, 1.8171440362930298, 1.8586622476577759, 1.900180459022522, 1.941698670387268]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 5.0, 13.0, 14.0, 17.0, 14.0, 17.0, 22.0, 28.0, 21.0, 18.0, 42.0, 30.0, 38.0, 27.0, 39.0, 62.0, 75.0, 66.0, 46.0, 59.0, 38.0, 32.0, 28.0, 23.0, 26.0, 21.0, 20.0, 14.0, 14.0, 16.0, 19.0, 19.0, 10.0, 8.0, 10.0, 5.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22172784805297852, -0.21322104334831238, -0.20471423864364624, -0.1962074339389801, -0.18770062923431396, -0.17919382452964783, -0.1706870198249817, -0.16218021512031555, -0.15367341041564941, -0.14516660571098328, -0.13665980100631714, -0.128152996301651, -0.11964619159698486, -0.11113938689231873, -0.10263258963823318, -0.09412578493356705, -0.0856189876794815, -0.07711218297481537, -0.06860537827014923, -0.06009857729077339, -0.051591772586107254, -0.043084967881441116, -0.03457816690206528, -0.02607136219739914, -0.017564557492733, -0.009057753719389439, -0.0005509499460458755, 0.007955852895975113, 0.01646265760064125, 0.02496946230530739, 0.03347626328468323, 0.041983067989349365, 0.0504898726940155, 0.05899667739868164, 0.06750348210334778, 0.07601028680801392, 0.08451709151268005, 0.09302389621734619, 0.10153069347143173, 0.11003749817609787, 0.11854430288076401, 0.12705110013484955, 0.13555790483951569, 0.14406470954418182, 0.15257151424884796, 0.1610783189535141, 0.16958512365818024, 0.17809192836284637, 0.1865987330675125, 0.19510553777217865, 0.2036123424768448, 0.21211914718151093, 0.22062595188617706, 0.2291327565908432, 0.23763954639434814, 0.24614635109901428, 0.2546531558036804, 0.26315996050834656, 0.2716667652130127, 0.28017356991767883, 0.28868037462234497, 0.2971871793270111, 0.30569398403167725, 0.3142007887363434, 0.3227075934410095]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 12.0, 15.0, 15.0, 29.0, 30.0, 33.0, 61.0, 76.0, 158.0, 300.0, 585.0, 2074.0, 11646.0, 195826.0, 3858760.0, 113232.0, 8500.0, 1570.0, 597.0, 255.0, 161.0, 103.0, 55.0, 42.0, 39.0, 18.0, 12.0, 19.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06439208984375, -0.06240653991699219, -0.060420989990234375, -0.05843544006347656, -0.05644989013671875, -0.05446434020996094, -0.052478790283203125, -0.05049324035644531, -0.0485076904296875, -0.04652214050292969, -0.044536590576171875, -0.04255104064941406, -0.04056549072265625, -0.03857994079589844, -0.036594390869140625, -0.03460884094238281, -0.032623291015625, -0.030637741088867188, -0.028652191162109375, -0.026666641235351562, -0.02468109130859375, -0.022695541381835938, -0.020709991455078125, -0.018724441528320312, -0.0167388916015625, -0.014753341674804688, -0.012767791748046875, -0.010782241821289062, -0.00879669189453125, -0.0068111419677734375, -0.004825592041015625, -0.0028400421142578125, -0.0008544921875, 0.0011310577392578125, 0.003116607666015625, 0.0051021575927734375, 0.00708770751953125, 0.009073257446289062, 0.011058807373046875, 0.013044357299804688, 0.0150299072265625, 0.017015457153320312, 0.019001007080078125, 0.020986557006835938, 0.02297210693359375, 0.024957656860351562, 0.026943206787109375, 0.028928756713867188, 0.030914306640625, 0.03289985656738281, 0.034885406494140625, 0.03687095642089844, 0.03885650634765625, 0.04084205627441406, 0.042827606201171875, 0.04481315612792969, 0.0467987060546875, 0.04878425598144531, 0.050769805908203125, 0.05275535583496094, 0.05474090576171875, 0.05672645568847656, 0.058712005615234375, 0.06069755554199219, 0.06268310546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 8.0, 12.0, 15.0, 15.0, 34.0, 27.0, 30.0, 31.0, 42.0, 38.0, 50.0, 57.0, 72.0, 54.0, 65.0, 53.0, 47.0, 66.0, 49.0, 43.0, 33.0, 28.0, 28.0, 11.0, 18.0, 11.0, 15.0, 7.0, 10.0, 6.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018096923828125, -0.017548799514770508, -0.017000675201416016, -0.016452550888061523, -0.01590442657470703, -0.015356302261352539, -0.014808177947998047, -0.014260053634643555, -0.013711929321289062, -0.01316380500793457, -0.012615680694580078, -0.012067556381225586, -0.011519432067871094, -0.010971307754516602, -0.01042318344116211, -0.009875059127807617, -0.009326934814453125, -0.008778810501098633, -0.00823068618774414, -0.0076825618743896484, -0.007134437561035156, -0.006586313247680664, -0.006038188934326172, -0.00549006462097168, -0.0049419403076171875, -0.004393815994262695, -0.003845691680908203, -0.003297567367553711, -0.0027494430541992188, -0.0022013187408447266, -0.0016531944274902344, -0.0011050701141357422, -0.00055694580078125, -8.821487426757812e-06, 0.0005393028259277344, 0.0010874271392822266, 0.0016355514526367188, 0.002183675765991211, 0.002731800079345703, 0.0032799243927001953, 0.0038280487060546875, 0.00437617301940918, 0.004924297332763672, 0.005472421646118164, 0.006020545959472656, 0.0065686702728271484, 0.007116794586181641, 0.007664918899536133, 0.008213043212890625, 0.008761167526245117, 0.00930929183959961, 0.009857416152954102, 0.010405540466308594, 0.010953664779663086, 0.011501789093017578, 0.01204991340637207, 0.012598037719726562, 0.013146162033081055, 0.013694286346435547, 0.014242410659790039, 0.014790534973144531, 0.015338659286499023, 0.015886783599853516, 0.016434907913208008, 0.0169830322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 3.0, 18.0, 22.0, 23.0, 34.0, 59.0, 69.0, 94.0, 188.0, 352.0, 1307.0, 79285.0, 4106489.0, 5081.0, 461.0, 225.0, 155.0, 100.0, 76.0, 60.0, 44.0, 45.0, 22.0, 14.0, 19.0, 14.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212890625, -0.205352783203125, -0.19781494140625, -0.190277099609375, -0.1827392578125, -0.175201416015625, -0.16766357421875, -0.160125732421875, -0.152587890625, -0.145050048828125, -0.13751220703125, -0.129974365234375, -0.1224365234375, -0.114898681640625, -0.10736083984375, -0.099822998046875, -0.09228515625, -0.084747314453125, -0.07720947265625, -0.069671630859375, -0.0621337890625, -0.054595947265625, -0.04705810546875, -0.039520263671875, -0.031982421875, -0.024444580078125, -0.01690673828125, -0.009368896484375, -0.0018310546875, 0.005706787109375, 0.01324462890625, 0.020782470703125, 0.0283203125, 0.035858154296875, 0.04339599609375, 0.050933837890625, 0.0584716796875, 0.066009521484375, 0.07354736328125, 0.081085205078125, 0.088623046875, 0.096160888671875, 0.10369873046875, 0.111236572265625, 0.1187744140625, 0.126312255859375, 0.13385009765625, 0.141387939453125, 0.14892578125, 0.156463623046875, 0.16400146484375, 0.171539306640625, 0.1790771484375, 0.186614990234375, 0.19415283203125, 0.201690673828125, 0.209228515625, 0.216766357421875, 0.22430419921875, 0.231842041015625, 0.2393798828125, 0.246917724609375, 0.25445556640625, 0.261993408203125, 0.26953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 18.0, 38.0, 98.0, 300.0, 2105.0, 1159.0, 215.0, 81.0, 36.0, 8.0, 14.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076904296875, -0.0725860595703125, -0.068267822265625, -0.0639495849609375, -0.05963134765625, -0.0553131103515625, -0.050994873046875, -0.0466766357421875, -0.0423583984375, -0.0380401611328125, -0.033721923828125, -0.0294036865234375, -0.02508544921875, -0.0207672119140625, -0.016448974609375, -0.0121307373046875, -0.0078125, -0.0034942626953125, 0.000823974609375, 0.0051422119140625, 0.00946044921875, 0.0137786865234375, 0.018096923828125, 0.0224151611328125, 0.0267333984375, 0.0310516357421875, 0.035369873046875, 0.0396881103515625, 0.04400634765625, 0.0483245849609375, 0.052642822265625, 0.0569610595703125, 0.061279296875, 0.0655975341796875, 0.069915771484375, 0.0742340087890625, 0.07855224609375, 0.0828704833984375, 0.087188720703125, 0.0915069580078125, 0.0958251953125, 0.1001434326171875, 0.104461669921875, 0.1087799072265625, 0.11309814453125, 0.1174163818359375, 0.121734619140625, 0.1260528564453125, 0.13037109375, 0.1346893310546875, 0.139007568359375, 0.1433258056640625, 0.14764404296875, 0.1519622802734375, 0.156280517578125, 0.1605987548828125, 0.1649169921875, 0.1692352294921875, 0.173553466796875, 0.1778717041015625, 0.18218994140625, 0.1865081787109375, 0.190826416015625, 0.1951446533203125, 0.199462890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 7.0, 10.0, 12.0, 16.0, 49.0, 106.0, 188.0, 288.0, 163.0, 69.0, 40.0, 19.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7050898671150208, -0.6719392538070679, -0.638788640499115, -0.6056380271911621, -0.5724873542785645, -0.5393368005752563, -0.5061861276626587, -0.4730355143547058, -0.43988490104675293, -0.40673428773880005, -0.37358367443084717, -0.3404330313205719, -0.307282418012619, -0.27413180470466614, -0.24098117649555206, -0.207830548286438, -0.1746799349784851, -0.14152932167053223, -0.10837869346141815, -0.07522807270288467, -0.042077451944351196, -0.008926838636398315, 0.02422378957271576, 0.057374417781829834, 0.09052503108978271, 0.12367565184831619, 0.15682627260684967, 0.18997690081596375, 0.22312751412391663, 0.2562781274318695, 0.2894287705421448, 0.32257938385009766, 0.3557300567626953, 0.3888806700706482, 0.4220312833786011, 0.45518192648887634, 0.4883325397968292, 0.5214831829071045, 0.5546337962150574, 0.5877844095230103, 0.6209350228309631, 0.654085636138916, 0.6872362494468689, 0.7203868627548218, 0.7535375356674194, 0.7866880893707275, 0.8198387622833252, 0.8529893755912781, 0.886139988899231, 0.9192906022071838, 0.9524412155151367, 0.9855918288230896, 1.0187424421310425, 1.0518931150436401, 1.0850436687469482, 1.118194341659546, 1.1513450145721436, 1.1844956874847412, 1.2176462411880493, 1.250796914100647, 1.283947467803955, 1.3170981407165527, 1.3502486944198608, 1.3833993673324585, 1.4165499210357666]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 2.0, 6.0, 14.0, 19.0, 11.0, 16.0, 28.0, 28.0, 31.0, 36.0, 36.0, 42.0, 48.0, 77.0, 46.0, 56.0, 54.0, 51.0, 46.0, 60.0, 53.0, 33.0, 33.0, 32.0, 33.0, 28.0, 20.0, 19.0, 3.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.34015971422195435, -0.3299034535884857, -0.3196471929550171, -0.30939093232154846, -0.29913467168807983, -0.2888784110546112, -0.2786221504211426, -0.26836588978767395, -0.2581096291542053, -0.2478533685207367, -0.23759710788726807, -0.22734084725379944, -0.2170845866203308, -0.20682832598686218, -0.19657206535339355, -0.18631580471992493, -0.1760595440864563, -0.16580328345298767, -0.15554702281951904, -0.14529076218605042, -0.1350345015525818, -0.12477824091911316, -0.11452198028564453, -0.1042657196521759, -0.09400945901870728, -0.08375319838523865, -0.07349693775177002, -0.06324067711830139, -0.052984416484832764, -0.042728155851364136, -0.03247189521789551, -0.02221563458442688, -0.011959373950958252, -0.001703113317489624, 0.008553147315979004, 0.018809407949447632, 0.02906566858291626, 0.03932192921638489, 0.049578189849853516, 0.059834450483322144, 0.07009071111679077, 0.0803469717502594, 0.09060323238372803, 0.10085949301719666, 0.11111575365066528, 0.12137201428413391, 0.13162827491760254, 0.14188453555107117, 0.1521407961845398, 0.16239705681800842, 0.17265331745147705, 0.18290957808494568, 0.1931658387184143, 0.20342209935188293, 0.21367835998535156, 0.2239346206188202, 0.23419088125228882, 0.24444714188575745, 0.2547034025192261, 0.2649596631526947, 0.27521592378616333, 0.28547218441963196, 0.2957284450531006, 0.3059847056865692, 0.31624096632003784]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 7.0, 9.0, 13.0, 10.0, 17.0, 23.0, 38.0, 53.0, 69.0, 96.0, 168.0, 303.0, 435.0, 773.0, 1488.0, 2583.0, 5126.0, 11004.0, 25096.0, 67444.0, 199555.0, 406474.0, 208224.0, 70522.0, 26361.0, 11317.0, 5173.0, 2667.0, 1362.0, 808.0, 496.0, 296.0, 178.0, 125.0, 65.0, 54.0, 27.0, 24.0, 20.0, 14.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.039093017578125, -0.03785276412963867, -0.036612510681152344, -0.035372257232666016, -0.03413200378417969, -0.03289175033569336, -0.03165149688720703, -0.030411243438720703, -0.029170989990234375, -0.027930736541748047, -0.02669048309326172, -0.02545022964477539, -0.024209976196289062, -0.022969722747802734, -0.021729469299316406, -0.020489215850830078, -0.01924896240234375, -0.018008708953857422, -0.016768455505371094, -0.015528202056884766, -0.014287948608398438, -0.01304769515991211, -0.011807441711425781, -0.010567188262939453, -0.009326934814453125, -0.008086681365966797, -0.006846427917480469, -0.005606174468994141, -0.0043659210205078125, -0.0031256675720214844, -0.0018854141235351562, -0.0006451606750488281, 0.0005950927734375, 0.0018353462219238281, 0.0030755996704101562, 0.004315853118896484, 0.0055561065673828125, 0.006796360015869141, 0.008036613464355469, 0.009276866912841797, 0.010517120361328125, 0.011757373809814453, 0.012997627258300781, 0.01423788070678711, 0.015478134155273438, 0.016718387603759766, 0.017958641052246094, 0.019198894500732422, 0.02043914794921875, 0.021679401397705078, 0.022919654846191406, 0.024159908294677734, 0.025400161743164062, 0.02664041519165039, 0.02788066864013672, 0.029120922088623047, 0.030361175537109375, 0.0316014289855957, 0.03284168243408203, 0.03408193588256836, 0.03532218933105469, 0.036562442779541016, 0.037802696228027344, 0.03904294967651367, 0.040283203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 9.0, 7.0, 7.0, 10.0, 15.0, 19.0, 15.0, 27.0, 17.0, 24.0, 26.0, 42.0, 42.0, 47.0, 53.0, 46.0, 47.0, 58.0, 50.0, 47.0, 44.0, 58.0, 47.0, 35.0, 38.0, 34.0, 23.0, 17.0, 14.0, 15.0, 11.0, 7.0, 6.0, 7.0, 6.0, 4.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.02191162109375, -0.021276235580444336, -0.020640850067138672, -0.020005464553833008, -0.019370079040527344, -0.01873469352722168, -0.018099308013916016, -0.01746392250061035, -0.016828536987304688, -0.016193151473999023, -0.01555776596069336, -0.014922380447387695, -0.014286994934082031, -0.013651609420776367, -0.013016223907470703, -0.012380838394165039, -0.011745452880859375, -0.011110067367553711, -0.010474681854248047, -0.009839296340942383, -0.009203910827636719, -0.008568525314331055, -0.00793313980102539, -0.0072977542877197266, -0.0066623687744140625, -0.0060269832611083984, -0.005391597747802734, -0.00475621223449707, -0.004120826721191406, -0.003485441207885742, -0.002850055694580078, -0.002214670181274414, -0.00157928466796875, -0.0009438991546630859, -0.0003085136413574219, 0.0003268718719482422, 0.0009622573852539062, 0.0015976428985595703, 0.0022330284118652344, 0.0028684139251708984, 0.0035037994384765625, 0.0041391849517822266, 0.004774570465087891, 0.005409955978393555, 0.006045341491699219, 0.006680727005004883, 0.007316112518310547, 0.007951498031616211, 0.008586883544921875, 0.009222269058227539, 0.009857654571533203, 0.010493040084838867, 0.011128425598144531, 0.011763811111450195, 0.01239919662475586, 0.013034582138061523, 0.013669967651367188, 0.014305353164672852, 0.014940738677978516, 0.01557612419128418, 0.016211509704589844, 0.016846895217895508, 0.017482280731201172, 0.018117666244506836, 0.0187530517578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 8.0, 10.0, 7.0, 15.0, 24.0, 32.0, 62.0, 108.0, 110.0, 156.0, 303.0, 444.0, 915.0, 1777.0, 4803.0, 18422.0, 207047.0, 759642.0, 41326.0, 7885.0, 2630.0, 1220.0, 629.0, 340.0, 220.0, 108.0, 78.0, 59.0, 45.0, 37.0, 23.0, 20.0, 7.0, 7.0, 8.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12347602844238281, -0.11938858032226562, -0.11530113220214844, -0.11121368408203125, -0.10712623596191406, -0.10303878784179688, -0.09895133972167969, -0.0948638916015625, -0.09077644348144531, -0.08668899536132812, -0.08260154724121094, -0.07851409912109375, -0.07442665100097656, -0.07033920288085938, -0.06625175476074219, -0.062164306640625, -0.05807685852050781, -0.053989410400390625, -0.04990196228027344, -0.04581451416015625, -0.04172706604003906, -0.037639617919921875, -0.03355216979980469, -0.0294647216796875, -0.025377273559570312, -0.021289825439453125, -0.017202377319335938, -0.01311492919921875, -0.009027481079101562, -0.004940032958984375, -0.0008525848388671875, 0.00323486328125, 0.0073223114013671875, 0.011409759521484375, 0.015497207641601562, 0.01958465576171875, 0.023672103881835938, 0.027759552001953125, 0.03184700012207031, 0.0359344482421875, 0.04002189636230469, 0.044109344482421875, 0.04819679260253906, 0.05228424072265625, 0.05637168884277344, 0.060459136962890625, 0.06454658508300781, 0.068634033203125, 0.07272148132324219, 0.07680892944335938, 0.08089637756347656, 0.08498382568359375, 0.08907127380371094, 0.09315872192382812, 0.09724617004394531, 0.1013336181640625, 0.10542106628417969, 0.10950851440429688, 0.11359596252441406, 0.11768341064453125, 0.12177085876464844, 0.12585830688476562, 0.1299457550048828, 0.134033203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 4.0, 4.0, 7.0, 14.0, 5.0, 19.0, 20.0, 18.0, 33.0, 31.0, 30.0, 34.0, 37.0, 42.0, 50.0, 46.0, 58.0, 64.0, 55.0, 43.0, 59.0, 42.0, 42.0, 36.0, 32.0, 43.0, 28.0, 25.0, 21.0, 14.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08096694946289062, -0.07758331298828125, -0.07419967651367188, -0.0708160400390625, -0.06743240356445312, -0.06404876708984375, -0.060665130615234375, -0.057281494140625, -0.053897857666015625, -0.05051422119140625, -0.047130584716796875, -0.0437469482421875, -0.040363311767578125, -0.03697967529296875, -0.033596038818359375, -0.03021240234375, -0.026828765869140625, -0.02344512939453125, -0.020061492919921875, -0.0166778564453125, -0.013294219970703125, -0.00991058349609375, -0.006526947021484375, -0.003143310546875, 0.000240325927734375, 0.00362396240234375, 0.007007598876953125, 0.0103912353515625, 0.013774871826171875, 0.01715850830078125, 0.020542144775390625, 0.02392578125, 0.027309417724609375, 0.03069305419921875, 0.034076690673828125, 0.0374603271484375, 0.040843963623046875, 0.04422760009765625, 0.047611236572265625, 0.050994873046875, 0.054378509521484375, 0.05776214599609375, 0.061145782470703125, 0.0645294189453125, 0.06791305541992188, 0.07129669189453125, 0.07468032836914062, 0.07806396484375, 0.08144760131835938, 0.08483123779296875, 0.08821487426757812, 0.0915985107421875, 0.09498214721679688, 0.09836578369140625, 0.10174942016601562, 0.105133056640625, 0.10851669311523438, 0.11190032958984375, 0.11528396606445312, 0.1186676025390625, 0.12205123901367188, 0.12543487548828125, 0.12881851196289062, 0.1322021484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 19.0, 30.0, 43.0, 80.0, 143.0, 157.0, 352.0, 628.0, 1370.0, 2918.0, 7228.0, 22541.0, 193075.0, 766722.0, 35757.0, 10187.0, 3850.0, 1643.0, 811.0, 409.0, 246.0, 147.0, 72.0, 49.0, 19.0, 11.0, 14.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07342529296875, -0.07106876373291016, -0.06871223449707031, -0.06635570526123047, -0.06399917602539062, -0.06164264678955078, -0.05928611755371094, -0.056929588317871094, -0.05457305908203125, -0.052216529846191406, -0.04986000061035156, -0.04750347137451172, -0.045146942138671875, -0.04279041290283203, -0.04043388366699219, -0.038077354431152344, -0.0357208251953125, -0.033364295959472656, -0.031007766723632812, -0.02865123748779297, -0.026294708251953125, -0.02393817901611328, -0.021581649780273438, -0.019225120544433594, -0.01686859130859375, -0.014512062072753906, -0.012155532836914062, -0.009799003601074219, -0.007442474365234375, -0.005085945129394531, -0.0027294158935546875, -0.00037288665771484375, 0.001983642578125, 0.004340171813964844, 0.0066967010498046875, 0.009053230285644531, 0.011409759521484375, 0.013766288757324219, 0.016122817993164062, 0.018479347229003906, 0.02083587646484375, 0.023192405700683594, 0.025548934936523438, 0.02790546417236328, 0.030261993408203125, 0.03261852264404297, 0.03497505187988281, 0.037331581115722656, 0.0396881103515625, 0.042044639587402344, 0.04440116882324219, 0.04675769805908203, 0.049114227294921875, 0.05147075653076172, 0.05382728576660156, 0.056183815002441406, 0.05854034423828125, 0.060896873474121094, 0.06325340270996094, 0.06560993194580078, 0.06796646118164062, 0.07032299041748047, 0.07267951965332031, 0.07503604888916016, 0.077392578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 7.0, 4.0, 6.0, 7.0, 9.0, 10.0, 4.0, 12.0, 21.0, 27.0, 36.0, 32.0, 37.0, 45.0, 69.0, 65.0, 95.0, 104.0, 92.0, 49.0, 56.0, 37.0, 25.0, 26.0, 21.0, 20.0, 18.0, 11.0, 7.0, 8.0, 5.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.063678741455078e-05, -2.963189035654068e-05, -2.862699329853058e-05, -2.7622096240520477e-05, -2.6617199182510376e-05, -2.5612302124500275e-05, -2.4607405066490173e-05, -2.3602508008480072e-05, -2.259761095046997e-05, -2.159271389245987e-05, -2.0587816834449768e-05, -1.9582919776439667e-05, -1.8578022718429565e-05, -1.7573125660419464e-05, -1.6568228602409363e-05, -1.556333154439926e-05, -1.455843448638916e-05, -1.3553537428379059e-05, -1.2548640370368958e-05, -1.1543743312358856e-05, -1.0538846254348755e-05, -9.533949196338654e-06, -8.529052138328552e-06, -7.524155080318451e-06, -6.51925802230835e-06, -5.514360964298248e-06, -4.509463906288147e-06, -3.5045668482780457e-06, -2.4996697902679443e-06, -1.494772732257843e-06, -4.898756742477417e-07, 5.150213837623596e-07, 1.519918441772461e-06, 2.5248154997825623e-06, 3.5297125577926636e-06, 4.534609615802765e-06, 5.539506673812866e-06, 6.5444037318229675e-06, 7.549300789833069e-06, 8.55419784784317e-06, 9.559094905853271e-06, 1.0563991963863373e-05, 1.1568889021873474e-05, 1.2573786079883575e-05, 1.3578683137893677e-05, 1.4583580195903778e-05, 1.558847725391388e-05, 1.659337431192398e-05, 1.7598271369934082e-05, 1.8603168427944183e-05, 1.9608065485954285e-05, 2.0612962543964386e-05, 2.1617859601974487e-05, 2.262275665998459e-05, 2.362765371799469e-05, 2.463255077600479e-05, 2.5637447834014893e-05, 2.6642344892024994e-05, 2.7647241950035095e-05, 2.8652139008045197e-05, 2.9657036066055298e-05, 3.06619331240654e-05, 3.16668301820755e-05, 3.26717272400856e-05, 3.36766242980957e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 9.0, 12.0, 16.0, 22.0, 29.0, 41.0, 58.0, 86.0, 143.0, 210.0, 382.0, 606.0, 1264.0, 2558.0, 6161.0, 18053.0, 105455.0, 822949.0, 66492.0, 14232.0, 5092.0, 2188.0, 1039.0, 549.0, 321.0, 202.0, 104.0, 83.0, 49.0, 36.0, 27.0, 20.0, 19.0, 12.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.072265625, -0.07022428512573242, -0.06818294525146484, -0.06614160537719727, -0.06410026550292969, -0.06205892562866211, -0.06001758575439453, -0.05797624588012695, -0.055934906005859375, -0.0538935661315918, -0.05185222625732422, -0.04981088638305664, -0.04776954650878906, -0.045728206634521484, -0.043686866760253906, -0.04164552688598633, -0.03960418701171875, -0.03756284713745117, -0.035521507263183594, -0.033480167388916016, -0.03143882751464844, -0.02939748764038086, -0.02735614776611328, -0.025314807891845703, -0.023273468017578125, -0.021232128143310547, -0.01919078826904297, -0.01714944839477539, -0.015108108520507812, -0.013066768646240234, -0.011025428771972656, -0.008984088897705078, -0.0069427490234375, -0.004901409149169922, -0.0028600692749023438, -0.0008187294006347656, 0.0012226104736328125, 0.0032639503479003906, 0.005305290222167969, 0.007346630096435547, 0.009387969970703125, 0.011429309844970703, 0.013470649719238281, 0.01551198959350586, 0.017553329467773438, 0.019594669342041016, 0.021636009216308594, 0.023677349090576172, 0.02571868896484375, 0.027760028839111328, 0.029801368713378906, 0.031842708587646484, 0.03388404846191406, 0.03592538833618164, 0.03796672821044922, 0.0400080680847168, 0.042049407958984375, 0.04409074783325195, 0.04613208770751953, 0.04817342758178711, 0.05021476745605469, 0.052256107330322266, 0.054297447204589844, 0.05633878707885742, 0.058380126953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 3.0, 5.0, 8.0, 6.0, 11.0, 9.0, 11.0, 19.0, 21.0, 45.0, 59.0, 86.0, 113.0, 144.0, 132.0, 94.0, 54.0, 47.0, 27.0, 17.0, 15.0, 13.0, 10.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.057373046875, -0.05580854415893555, -0.054244041442871094, -0.05267953872680664, -0.05111503601074219, -0.049550533294677734, -0.04798603057861328, -0.04642152786254883, -0.044857025146484375, -0.04329252243041992, -0.04172801971435547, -0.040163516998291016, -0.03859901428222656, -0.03703451156616211, -0.035470008850097656, -0.0339055061340332, -0.03234100341796875, -0.030776500701904297, -0.029211997985839844, -0.02764749526977539, -0.026082992553710938, -0.024518489837646484, -0.02295398712158203, -0.021389484405517578, -0.019824981689453125, -0.018260478973388672, -0.01669597625732422, -0.015131473541259766, -0.013566970825195312, -0.01200246810913086, -0.010437965393066406, -0.008873462677001953, -0.0073089599609375, -0.005744457244873047, -0.004179954528808594, -0.0026154518127441406, -0.0010509490966796875, 0.0005135536193847656, 0.0020780563354492188, 0.003642559051513672, 0.005207061767578125, 0.006771564483642578, 0.008336067199707031, 0.009900569915771484, 0.011465072631835938, 0.01302957534790039, 0.014594078063964844, 0.016158580780029297, 0.01772308349609375, 0.019287586212158203, 0.020852088928222656, 0.02241659164428711, 0.023981094360351562, 0.025545597076416016, 0.02711009979248047, 0.028674602508544922, 0.030239105224609375, 0.03180360794067383, 0.03336811065673828, 0.034932613372802734, 0.03649711608886719, 0.03806161880493164, 0.039626121520996094, 0.04119062423706055, 0.042755126953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 3.0, 2.0, 6.0, 19.0, 24.0, 62.0, 95.0, 189.0, 238.0, 133.0, 82.0, 46.0, 33.0, 22.0, 14.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0570756196975708, -1.025195837020874, -0.9933161735534668, -0.9614364504814148, -0.9295567274093628, -0.8976770043373108, -0.8657972812652588, -0.833917498588562, -0.8020378351211548, -0.7701581120491028, -0.7382783889770508, -0.7063986659049988, -0.6745189428329468, -0.6426392197608948, -0.6107594966888428, -0.578879714012146, -0.546999990940094, -0.515120267868042, -0.48324054479599, -0.451360821723938, -0.419481098651886, -0.387601375579834, -0.3557216227054596, -0.3238418996334076, -0.2919621765613556, -0.2600824534893036, -0.2282027304172516, -0.1963229924440384, -0.1644432693719864, -0.1325635462999344, -0.10068380832672119, -0.06880408525466919, -0.03692430257797241, -0.005044575780630112, 0.02683515101671219, 0.05871488153934479, 0.09059460461139679, 0.12247432768344879, 0.154354065656662, 0.186233788728714, 0.218113511800766, 0.249993234872818, 0.28187295794487, 0.3137527108192444, 0.3456324338912964, 0.3775121569633484, 0.4093918800354004, 0.4412716031074524, 0.4731513261795044, 0.5050310492515564, 0.5369107723236084, 0.5687904953956604, 0.6006702184677124, 0.6325499415397644, 0.6644296646118164, 0.6963094472885132, 0.7281891107559204, 0.7600688338279724, 0.7919485569000244, 0.8238282799720764, 0.8557080030441284, 0.8875877261161804, 0.9194674491882324, 0.9513472318649292, 0.9832269549369812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 4.0, 4.0, 7.0, 13.0, 18.0, 15.0, 13.0, 21.0, 29.0, 26.0, 36.0, 21.0, 42.0, 35.0, 40.0, 52.0, 89.0, 84.0, 76.0, 43.0, 45.0, 42.0, 19.0, 26.0, 29.0, 23.0, 26.0, 24.0, 15.0, 14.0, 11.0, 12.0, 9.0, 8.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.529944658279419, -0.5129480361938477, -0.495951384305954, -0.4789547324180603, -0.4619580805301666, -0.44496142864227295, -0.42796480655670166, -0.410968154668808, -0.3939715027809143, -0.37697485089302063, -0.35997822880744934, -0.34298157691955566, -0.325984925031662, -0.3089882731437683, -0.291991651058197, -0.27499499917030334, -0.25799837708473206, -0.24100174009799957, -0.2240050882101059, -0.2070084512233734, -0.19001179933547974, -0.17301516234874725, -0.15601852536201477, -0.1390218734741211, -0.12202523648738861, -0.10502859205007553, -0.08803194761276245, -0.07103531062602997, -0.05403866618871689, -0.03704202175140381, -0.020045384764671326, -0.003048740327358246, 0.013947904109954834, 0.030944546684622765, 0.047941189259290695, 0.06493782997131348, 0.08193447440862656, 0.09893111884593964, 0.11592775583267212, 0.1329244077205658, 0.14992104470729828, 0.16691768169403076, 0.18391433358192444, 0.20091097056865692, 0.2179076075553894, 0.23490425944328308, 0.25190091133117676, 0.26889753341674805, 0.2858941853046417, 0.3028908371925354, 0.3198874592781067, 0.33688411116600037, 0.35388076305389404, 0.37087738513946533, 0.387874037027359, 0.4048706889152527, 0.421867311000824, 0.43886396288871765, 0.45586058497428894, 0.4728572368621826, 0.4898538887500763, 0.50685054063797, 0.5238471627235413, 0.5408437848091125, 0.5578404664993286]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 15.0, 20.0, 24.0, 35.0, 65.0, 89.0, 146.0, 228.0, 324.0, 595.0, 1092.0, 2219.0, 5478.0, 17832.0, 125618.0, 3035971.0, 935339.0, 51075.0, 10743.0, 3697.0, 1627.0, 821.0, 448.0, 243.0, 171.0, 97.0, 66.0, 45.0, 37.0, 29.0, 22.0, 9.0, 13.0, 7.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.056060791015625, -0.05417966842651367, -0.052298545837402344, -0.050417423248291016, -0.04853630065917969, -0.04665517807006836, -0.04477405548095703, -0.0428929328918457, -0.041011810302734375, -0.03913068771362305, -0.03724956512451172, -0.03536844253540039, -0.03348731994628906, -0.031606197357177734, -0.029725074768066406, -0.027843952178955078, -0.02596282958984375, -0.024081707000732422, -0.022200584411621094, -0.020319461822509766, -0.018438339233398438, -0.01655721664428711, -0.014676094055175781, -0.012794971466064453, -0.010913848876953125, -0.009032726287841797, -0.007151603698730469, -0.005270481109619141, -0.0033893585205078125, -0.0015082359313964844, 0.00037288665771484375, 0.002254009246826172, 0.0041351318359375, 0.006016254425048828, 0.007897377014160156, 0.009778499603271484, 0.011659622192382812, 0.01354074478149414, 0.015421867370605469, 0.017302989959716797, 0.019184112548828125, 0.021065235137939453, 0.02294635772705078, 0.02482748031616211, 0.026708602905273438, 0.028589725494384766, 0.030470848083496094, 0.03235197067260742, 0.03423309326171875, 0.03611421585083008, 0.037995338439941406, 0.039876461029052734, 0.04175758361816406, 0.04363870620727539, 0.04551982879638672, 0.04740095138549805, 0.049282073974609375, 0.0511631965637207, 0.05304431915283203, 0.05492544174194336, 0.05680656433105469, 0.058687686920166016, 0.060568809509277344, 0.06244993209838867, 0.0643310546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 10.0, 7.0, 5.0, 11.0, 8.0, 8.0, 15.0, 20.0, 21.0, 15.0, 29.0, 30.0, 47.0, 48.0, 53.0, 53.0, 42.0, 65.0, 59.0, 65.0, 56.0, 50.0, 48.0, 41.0, 32.0, 27.0, 30.0, 21.0, 14.0, 17.0, 14.0, 4.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0257720947265625, -0.02491140365600586, -0.02405071258544922, -0.023190021514892578, -0.022329330444335938, -0.021468639373779297, -0.020607948303222656, -0.019747257232666016, -0.018886566162109375, -0.018025875091552734, -0.017165184020996094, -0.016304492950439453, -0.015443801879882812, -0.014583110809326172, -0.013722419738769531, -0.01286172866821289, -0.01200103759765625, -0.01114034652709961, -0.010279655456542969, -0.009418964385986328, -0.008558273315429688, -0.007697582244873047, -0.006836891174316406, -0.005976200103759766, -0.005115509033203125, -0.004254817962646484, -0.0033941268920898438, -0.002533435821533203, -0.0016727447509765625, -0.0008120536804199219, 4.863739013671875e-05, 0.0009093284606933594, 0.00177001953125, 0.0026307106018066406, 0.0034914016723632812, 0.004352092742919922, 0.0052127838134765625, 0.006073474884033203, 0.006934165954589844, 0.007794857025146484, 0.008655548095703125, 0.009516239166259766, 0.010376930236816406, 0.011237621307373047, 0.012098312377929688, 0.012959003448486328, 0.013819694519042969, 0.01468038558959961, 0.01554107666015625, 0.01640176773071289, 0.01726245880126953, 0.018123149871826172, 0.018983840942382812, 0.019844532012939453, 0.020705223083496094, 0.021565914154052734, 0.022426605224609375, 0.023287296295166016, 0.024147987365722656, 0.025008678436279297, 0.025869369506835938, 0.026730060577392578, 0.02759075164794922, 0.02845144271850586, 0.0293121337890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 16.0, 14.0, 24.0, 35.0, 61.0, 75.0, 103.0, 173.0, 412.0, 1811.0, 3844371.0, 344936.0, 1274.0, 403.0, 146.0, 131.0, 80.0, 64.0, 51.0, 25.0, 25.0, 13.0, 18.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4453125, -0.42992401123046875, -0.4145355224609375, -0.39914703369140625, -0.383758544921875, -0.36837005615234375, -0.3529815673828125, -0.33759307861328125, -0.32220458984375, -0.30681610107421875, -0.2914276123046875, -0.27603912353515625, -0.260650634765625, -0.24526214599609375, -0.2298736572265625, -0.21448516845703125, -0.1990966796875, -0.18370819091796875, -0.1683197021484375, -0.15293121337890625, -0.137542724609375, -0.12215423583984375, -0.1067657470703125, -0.09137725830078125, -0.07598876953125, -0.06060028076171875, -0.0452117919921875, -0.02982330322265625, -0.014434814453125, 0.00095367431640625, 0.0163421630859375, 0.03173065185546875, 0.047119140625, 0.06250762939453125, 0.0778961181640625, 0.09328460693359375, 0.108673095703125, 0.12406158447265625, 0.1394500732421875, 0.15483856201171875, 0.17022705078125, 0.18561553955078125, 0.2010040283203125, 0.21639251708984375, 0.231781005859375, 0.24716949462890625, 0.2625579833984375, 0.27794647216796875, 0.2933349609375, 0.30872344970703125, 0.3241119384765625, 0.33950042724609375, 0.354888916015625, 0.37027740478515625, 0.3856658935546875, 0.40105438232421875, 0.41644287109375, 0.43183135986328125, 0.4472198486328125, 0.46260833740234375, 0.477996826171875, 0.49338531494140625, 0.5087738037109375, 0.5241622924804688, 0.53955078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 16.0, 23.0, 39.0, 107.0, 405.0, 2056.0, 1095.0, 189.0, 83.0, 28.0, 14.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.08781242370605469, -0.08224105834960938, -0.07666969299316406, -0.07109832763671875, -0.06552696228027344, -0.059955596923828125, -0.05438423156738281, -0.0488128662109375, -0.04324150085449219, -0.037670135498046875, -0.03209877014160156, -0.02652740478515625, -0.020956039428710938, -0.015384674072265625, -0.009813308715820312, -0.004241943359375, 0.0013294219970703125, 0.006900787353515625, 0.012472152709960938, 0.01804351806640625, 0.023614883422851562, 0.029186248779296875, 0.03475761413574219, 0.0403289794921875, 0.04590034484863281, 0.051471710205078125, 0.05704307556152344, 0.06261444091796875, 0.06818580627441406, 0.07375717163085938, 0.07932853698730469, 0.08489990234375, 0.09047126770019531, 0.09604263305664062, 0.10161399841308594, 0.10718536376953125, 0.11275672912597656, 0.11832809448242188, 0.12389945983886719, 0.1294708251953125, 0.1350421905517578, 0.14061355590820312, 0.14618492126464844, 0.15175628662109375, 0.15732765197753906, 0.16289901733398438, 0.1684703826904297, 0.174041748046875, 0.1796131134033203, 0.18518447875976562, 0.19075584411621094, 0.19632720947265625, 0.20189857482910156, 0.20746994018554688, 0.2130413055419922, 0.2186126708984375, 0.2241840362548828, 0.22975540161132812, 0.23532676696777344, 0.24089813232421875, 0.24646949768066406, 0.2520408630371094, 0.2576122283935547, 0.26318359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 11.0, 19.0, 33.0, 95.0, 197.0, 282.0, 197.0, 82.0, 39.0, 11.0, 13.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7471466064453125, -0.6986462473869324, -0.6501458883285522, -0.6016455292701721, -0.553145170211792, -0.5046448111534119, -0.45614445209503174, -0.4076440930366516, -0.3591437339782715, -0.31064337491989136, -0.26214301586151123, -0.2136426568031311, -0.16514229774475098, -0.11664193868637085, -0.06814157962799072, -0.019641220569610596, 0.02885913848876953, 0.07735949754714966, 0.12585985660552979, 0.1743602156639099, 0.22286057472229004, 0.27136093378067017, 0.3198612928390503, 0.3683616518974304, 0.41686201095581055, 0.4653623700141907, 0.5138627290725708, 0.5623630881309509, 0.610863447189331, 0.6593638062477112, 0.7078641653060913, 0.7563645243644714, 0.8048648834228516, 0.8533652424812317, 0.9018656015396118, 0.9503659605979919, 0.9988663196563721, 1.0473666191101074, 1.0958670377731323, 1.1443674564361572, 1.1928677558898926, 1.241368055343628, 1.2898684740066528, 1.3383688926696777, 1.386869192123413, 1.4353694915771484, 1.4838699102401733, 1.5323703289031982, 1.5808706283569336, 1.629370927810669, 1.6778713464736938, 1.7263717651367188, 1.774872064590454, 1.8233723640441895, 1.8718727827072144, 1.9203732013702393, 1.9688735008239746, 2.01737380027771, 2.0658740997314453, 2.1143746376037598, 2.162874937057495, 2.2113752365112305, 2.259875774383545, 2.3083760738372803, 2.3568763732910156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 6.0, 9.0, 13.0, 22.0, 25.0, 27.0, 35.0, 36.0, 43.0, 54.0, 54.0, 54.0, 54.0, 52.0, 58.0, 55.0, 43.0, 53.0, 45.0, 35.0, 42.0, 32.0, 30.0, 28.0, 18.0, 19.0, 11.0, 9.0, 5.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.45279455184936523, -0.4397910237312317, -0.42678749561309814, -0.4137839674949646, -0.40078043937683105, -0.3877769112586975, -0.37477338314056396, -0.3617698550224304, -0.3487663269042969, -0.33576279878616333, -0.3227592706680298, -0.30975574254989624, -0.2967522144317627, -0.28374868631362915, -0.2707451581954956, -0.25774163007736206, -0.24473808705806732, -0.23173455893993378, -0.21873103082180023, -0.2057275027036667, -0.19272397458553314, -0.1797204315662384, -0.16671690344810486, -0.1537133753299713, -0.14070984721183777, -0.12770631909370422, -0.11470279097557068, -0.10169926285743713, -0.08869573473930359, -0.07569219917058945, -0.0626886710524559, -0.04968514293432236, -0.03668162226676941, -0.023678094148635864, -0.01067456416785717, 0.002328965812921524, 0.015332493931055069, 0.028336025774478912, 0.04133955389261246, 0.054343082010746, 0.06734661012887955, 0.08035013824701309, 0.09335366636514664, 0.10635720193386078, 0.11936073005199432, 0.13236425817012787, 0.1453677862882614, 0.15837131440639496, 0.1713748425245285, 0.18437837064266205, 0.1973818987607956, 0.21038542687892914, 0.22338895499706268, 0.23639249801635742, 0.24939602613449097, 0.2623995542526245, 0.27540308237075806, 0.2884066104888916, 0.30141013860702515, 0.3144136667251587, 0.32741719484329224, 0.3404207229614258, 0.3534242510795593, 0.36642777919769287, 0.3794313073158264]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 2.0, 7.0, 14.0, 24.0, 30.0, 49.0, 55.0, 99.0, 133.0, 204.0, 386.0, 647.0, 1072.0, 1996.0, 3758.0, 8045.0, 17641.0, 44543.0, 130616.0, 358496.0, 309646.0, 104462.0, 37040.0, 15113.0, 6828.0, 3423.0, 1731.0, 962.0, 564.0, 342.0, 219.0, 147.0, 82.0, 59.0, 31.0, 20.0, 19.0, 14.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0479736328125, -0.04612159729003906, -0.044269561767578125, -0.04241752624511719, -0.04056549072265625, -0.03871345520019531, -0.036861419677734375, -0.03500938415527344, -0.0331573486328125, -0.03130531311035156, -0.029453277587890625, -0.027601242065429688, -0.02574920654296875, -0.023897171020507812, -0.022045135498046875, -0.020193099975585938, -0.018341064453125, -0.016489028930664062, -0.014636993408203125, -0.012784957885742188, -0.01093292236328125, -0.009080886840820312, -0.007228851318359375, -0.0053768157958984375, -0.0035247802734375, -0.0016727447509765625, 0.000179290771484375, 0.0020313262939453125, 0.00388336181640625, 0.0057353973388671875, 0.007587432861328125, 0.009439468383789062, 0.01129150390625, 0.013143539428710938, 0.014995574951171875, 0.016847610473632812, 0.01869964599609375, 0.020551681518554688, 0.022403717041015625, 0.024255752563476562, 0.0261077880859375, 0.027959823608398438, 0.029811859130859375, 0.03166389465332031, 0.03351593017578125, 0.03536796569824219, 0.037220001220703125, 0.03907203674316406, 0.040924072265625, 0.04277610778808594, 0.044628143310546875, 0.04648017883300781, 0.04833221435546875, 0.05018424987792969, 0.052036285400390625, 0.05388832092285156, 0.0557403564453125, 0.05759239196777344, 0.059444427490234375, 0.06129646301269531, 0.06314849853515625, 0.06500053405761719, 0.06685256958007812, 0.06870460510253906, 0.070556640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 6.0, 6.0, 9.0, 13.0, 11.0, 14.0, 18.0, 26.0, 30.0, 18.0, 34.0, 26.0, 38.0, 46.0, 39.0, 46.0, 46.0, 42.0, 48.0, 48.0, 46.0, 34.0, 41.0, 41.0, 32.0, 27.0, 25.0, 32.0, 20.0, 23.0, 22.0, 13.0, 9.0, 10.0, 13.0, 8.0, 6.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.0307769775390625, -0.029875516891479492, -0.028974056243896484, -0.028072595596313477, -0.02717113494873047, -0.02626967430114746, -0.025368213653564453, -0.024466753005981445, -0.023565292358398438, -0.02266383171081543, -0.021762371063232422, -0.020860910415649414, -0.019959449768066406, -0.0190579891204834, -0.01815652847290039, -0.017255067825317383, -0.016353607177734375, -0.015452146530151367, -0.01455068588256836, -0.013649225234985352, -0.012747764587402344, -0.011846303939819336, -0.010944843292236328, -0.01004338264465332, -0.009141921997070312, -0.008240461349487305, -0.007339000701904297, -0.006437540054321289, -0.005536079406738281, -0.0046346187591552734, -0.0037331581115722656, -0.002831697463989258, -0.00193023681640625, -0.0010287761688232422, -0.00012731552124023438, 0.0007741451263427734, 0.0016756057739257812, 0.002577066421508789, 0.003478527069091797, 0.004379987716674805, 0.0052814483642578125, 0.00618290901184082, 0.007084369659423828, 0.007985830307006836, 0.008887290954589844, 0.009788751602172852, 0.01069021224975586, 0.011591672897338867, 0.012493133544921875, 0.013394594192504883, 0.01429605484008789, 0.015197515487670898, 0.016098976135253906, 0.017000436782836914, 0.017901897430419922, 0.01880335807800293, 0.019704818725585938, 0.020606279373168945, 0.021507740020751953, 0.02240920066833496, 0.02331066131591797, 0.024212121963500977, 0.025113582611083984, 0.026015043258666992, 0.02691650390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 12.0, 10.0, 13.0, 25.0, 15.0, 44.0, 77.0, 92.0, 155.0, 271.0, 529.0, 1326.0, 4033.0, 19946.0, 264103.0, 709735.0, 38667.0, 6142.0, 1797.0, 682.0, 322.0, 199.0, 111.0, 80.0, 51.0, 31.0, 18.0, 20.0, 10.0, 11.0, 4.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.1749267578125, -0.1693115234375, -0.1636962890625, -0.1580810546875, -0.1524658203125, -0.1468505859375, -0.1412353515625, -0.1356201171875, -0.1300048828125, -0.1243896484375, -0.1187744140625, -0.1131591796875, -0.1075439453125, -0.1019287109375, -0.0963134765625, -0.0906982421875, -0.0850830078125, -0.0794677734375, -0.0738525390625, -0.0682373046875, -0.0626220703125, -0.0570068359375, -0.0513916015625, -0.0457763671875, -0.0401611328125, -0.0345458984375, -0.0289306640625, -0.0233154296875, -0.0177001953125, -0.0120849609375, -0.0064697265625, -0.0008544921875, 0.0047607421875, 0.0103759765625, 0.0159912109375, 0.0216064453125, 0.0272216796875, 0.0328369140625, 0.0384521484375, 0.0440673828125, 0.0496826171875, 0.0552978515625, 0.0609130859375, 0.0665283203125, 0.0721435546875, 0.0777587890625, 0.0833740234375, 0.0889892578125, 0.0946044921875, 0.1002197265625, 0.1058349609375, 0.1114501953125, 0.1170654296875, 0.1226806640625, 0.1282958984375, 0.1339111328125, 0.1395263671875, 0.1451416015625, 0.1507568359375, 0.1563720703125, 0.1619873046875, 0.1676025390625, 0.1732177734375, 0.1788330078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 9.0, 7.0, 9.0, 12.0, 8.0, 16.0, 21.0, 17.0, 38.0, 27.0, 31.0, 38.0, 40.0, 45.0, 58.0, 53.0, 50.0, 50.0, 60.0, 53.0, 52.0, 41.0, 47.0, 30.0, 35.0, 36.0, 26.0, 13.0, 23.0, 8.0, 10.0, 8.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.1214599609375, -0.117431640625, -0.1134033203125, -0.109375, -0.1053466796875, -0.101318359375, -0.0972900390625, -0.09326171875, -0.0892333984375, -0.085205078125, -0.0811767578125, -0.0771484375, -0.0731201171875, -0.069091796875, -0.0650634765625, -0.06103515625, -0.0570068359375, -0.052978515625, -0.0489501953125, -0.044921875, -0.0408935546875, -0.036865234375, -0.0328369140625, -0.02880859375, -0.0247802734375, -0.020751953125, -0.0167236328125, -0.0126953125, -0.0086669921875, -0.004638671875, -0.0006103515625, 0.00341796875, 0.0074462890625, 0.011474609375, 0.0155029296875, 0.01953125, 0.0235595703125, 0.027587890625, 0.0316162109375, 0.03564453125, 0.0396728515625, 0.043701171875, 0.0477294921875, 0.0517578125, 0.0557861328125, 0.059814453125, 0.0638427734375, 0.06787109375, 0.0718994140625, 0.075927734375, 0.0799560546875, 0.083984375, 0.0880126953125, 0.092041015625, 0.0960693359375, 0.10009765625, 0.1041259765625, 0.108154296875, 0.1121826171875, 0.1162109375, 0.1202392578125, 0.124267578125, 0.1282958984375, 0.13232421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 15.0, 13.0, 13.0, 20.0, 31.0, 46.0, 54.0, 74.0, 100.0, 141.0, 204.0, 277.0, 432.0, 676.0, 1053.0, 1835.0, 3616.0, 7707.0, 22153.0, 93530.0, 707454.0, 158195.0, 30903.0, 10035.0, 4236.0, 2158.0, 1177.0, 771.0, 509.0, 332.0, 229.0, 149.0, 97.0, 80.0, 55.0, 45.0, 37.0, 23.0, 17.0, 12.0, 6.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.052886962890625, -0.051215171813964844, -0.04954338073730469, -0.04787158966064453, -0.046199798583984375, -0.04452800750732422, -0.04285621643066406, -0.041184425354003906, -0.03951263427734375, -0.037840843200683594, -0.03616905212402344, -0.03449726104736328, -0.032825469970703125, -0.03115367889404297, -0.029481887817382812, -0.027810096740722656, -0.0261383056640625, -0.024466514587402344, -0.022794723510742188, -0.02112293243408203, -0.019451141357421875, -0.01777935028076172, -0.016107559204101562, -0.014435768127441406, -0.01276397705078125, -0.011092185974121094, -0.009420394897460938, -0.007748603820800781, -0.006076812744140625, -0.004405021667480469, -0.0027332305908203125, -0.0010614395141601562, 0.0006103515625, 0.0022821426391601562, 0.0039539337158203125, 0.005625724792480469, 0.007297515869140625, 0.008969306945800781, 0.010641098022460938, 0.012312889099121094, 0.01398468017578125, 0.015656471252441406, 0.017328262329101562, 0.01900005340576172, 0.020671844482421875, 0.02234363555908203, 0.024015426635742188, 0.025687217712402344, 0.0273590087890625, 0.029030799865722656, 0.030702590942382812, 0.03237438201904297, 0.034046173095703125, 0.03571796417236328, 0.03738975524902344, 0.039061546325683594, 0.04073333740234375, 0.042405128479003906, 0.04407691955566406, 0.04574871063232422, 0.047420501708984375, 0.04909229278564453, 0.05076408386230469, 0.052435874938964844, 0.054107666015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 8.0, 9.0, 13.0, 23.0, 40.0, 69.0, 64.0, 84.0, 128.0, 106.0, 104.0, 80.0, 83.0, 52.0, 38.0, 28.0, 19.0, 16.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.141164779663086e-05, -3.0310824513435364e-05, -2.9210001230239868e-05, -2.8109177947044373e-05, -2.7008354663848877e-05, -2.590753138065338e-05, -2.4806708097457886e-05, -2.370588481426239e-05, -2.2605061531066895e-05, -2.15042382478714e-05, -2.0403414964675903e-05, -1.9302591681480408e-05, -1.8201768398284912e-05, -1.7100945115089417e-05, -1.600012183189392e-05, -1.4899298548698425e-05, -1.379847526550293e-05, -1.2697651982307434e-05, -1.1596828699111938e-05, -1.0496005415916443e-05, -9.395182132720947e-06, -8.294358849525452e-06, -7.193535566329956e-06, -6.0927122831344604e-06, -4.991888999938965e-06, -3.891065716743469e-06, -2.7902424335479736e-06, -1.689419150352478e-06, -5.885958671569824e-07, 5.122274160385132e-07, 1.6130506992340088e-06, 2.7138739824295044e-06, 3.814697265625e-06, 4.915520548820496e-06, 6.016343832015991e-06, 7.117167115211487e-06, 8.217990398406982e-06, 9.318813681602478e-06, 1.0419636964797974e-05, 1.152046024799347e-05, 1.2621283531188965e-05, 1.372210681438446e-05, 1.4822930097579956e-05, 1.592375338077545e-05, 1.7024576663970947e-05, 1.8125399947166443e-05, 1.922622323036194e-05, 2.0327046513557434e-05, 2.142786979675293e-05, 2.2528693079948425e-05, 2.362951636314392e-05, 2.4730339646339417e-05, 2.5831162929534912e-05, 2.6931986212730408e-05, 2.8032809495925903e-05, 2.91336327791214e-05, 3.0234456062316895e-05, 3.133527934551239e-05, 3.2436102628707886e-05, 3.353692591190338e-05, 3.463774919509888e-05, 3.573857247829437e-05, 3.683939576148987e-05, 3.7940219044685364e-05, 3.904104232788086e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 8.0, 4.0, 6.0, 12.0, 13.0, 29.0, 30.0, 48.0, 68.0, 104.0, 139.0, 186.0, 311.0, 473.0, 738.0, 1210.0, 2048.0, 3734.0, 6963.0, 14996.0, 38855.0, 137434.0, 614032.0, 152886.0, 42113.0, 15718.0, 7274.0, 3684.0, 2013.0, 1222.0, 746.0, 469.0, 316.0, 197.0, 134.0, 94.0, 72.0, 47.0, 44.0, 20.0, 21.0, 17.0, 6.0, 4.0, 4.0, 3.0, 0.0, 4.0, 0.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039703369140625, -0.03840303421020508, -0.037102699279785156, -0.035802364349365234, -0.03450202941894531, -0.03320169448852539, -0.03190135955810547, -0.030601024627685547, -0.029300689697265625, -0.028000354766845703, -0.02670001983642578, -0.02539968490600586, -0.024099349975585938, -0.022799015045166016, -0.021498680114746094, -0.020198345184326172, -0.01889801025390625, -0.017597675323486328, -0.016297340393066406, -0.014997005462646484, -0.013696670532226562, -0.01239633560180664, -0.011096000671386719, -0.009795665740966797, -0.008495330810546875, -0.007194995880126953, -0.005894660949707031, -0.004594326019287109, -0.0032939910888671875, -0.0019936561584472656, -0.0006933212280273438, 0.0006070137023925781, 0.0019073486328125, 0.003207683563232422, 0.004508018493652344, 0.005808353424072266, 0.0071086883544921875, 0.00840902328491211, 0.009709358215332031, 0.011009693145751953, 0.012310028076171875, 0.013610363006591797, 0.014910697937011719, 0.01621103286743164, 0.017511367797851562, 0.018811702728271484, 0.020112037658691406, 0.021412372589111328, 0.02271270751953125, 0.024013042449951172, 0.025313377380371094, 0.026613712310791016, 0.027914047241210938, 0.02921438217163086, 0.03051471710205078, 0.0318150520324707, 0.033115386962890625, 0.03441572189331055, 0.03571605682373047, 0.03701639175415039, 0.03831672668457031, 0.039617061614990234, 0.040917396545410156, 0.04221773147583008, 0.04351806640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 6.0, 15.0, 27.0, 39.0, 39.0, 53.0, 65.0, 89.0, 109.0, 104.0, 98.0, 82.0, 41.0, 55.0, 42.0, 30.0, 19.0, 20.0, 10.0, 10.0, 8.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0499267578125, -0.04828977584838867, -0.046652793884277344, -0.045015811920166016, -0.04337882995605469, -0.04174184799194336, -0.04010486602783203, -0.0384678840637207, -0.036830902099609375, -0.03519392013549805, -0.03355693817138672, -0.03191995620727539, -0.030282974243164062, -0.028645992279052734, -0.027009010314941406, -0.025372028350830078, -0.02373504638671875, -0.022098064422607422, -0.020461082458496094, -0.018824100494384766, -0.017187118530273438, -0.01555013656616211, -0.013913154602050781, -0.012276172637939453, -0.010639190673828125, -0.009002208709716797, -0.007365226745605469, -0.005728244781494141, -0.0040912628173828125, -0.0024542808532714844, -0.0008172988891601562, 0.0008196830749511719, 0.0024566650390625, 0.004093647003173828, 0.005730628967285156, 0.007367610931396484, 0.009004592895507812, 0.01064157485961914, 0.012278556823730469, 0.013915538787841797, 0.015552520751953125, 0.017189502716064453, 0.01882648468017578, 0.02046346664428711, 0.022100448608398438, 0.023737430572509766, 0.025374412536621094, 0.027011394500732422, 0.02864837646484375, 0.030285358428955078, 0.031922340393066406, 0.033559322357177734, 0.03519630432128906, 0.03683328628540039, 0.03847026824951172, 0.04010725021362305, 0.041744232177734375, 0.0433812141418457, 0.04501819610595703, 0.04665517807006836, 0.04829216003417969, 0.049929141998291016, 0.051566123962402344, 0.05320310592651367, 0.054840087890625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 15.0, 15.0, 39.0, 88.0, 192.0, 342.0, 155.0, 82.0, 33.0, 18.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2531659603118896, -2.2084152698516846, -2.1636648178100586, -2.1189141273498535, -2.0741634368896484, -2.0294129848480225, -1.9846622943878174, -1.9399117231369019, -1.8951611518859863, -1.8504105806350708, -1.8056598901748657, -1.7609093189239502, -1.7161587476730347, -1.6714081764221191, -1.626657485961914, -1.5819069147109985, -1.5371562242507935, -1.492405652999878, -1.4476549625396729, -1.4029043912887573, -1.3581538200378418, -1.3134031295776367, -1.2686525583267212, -1.2239019870758057, -1.1791512966156006, -1.134400725364685, -1.08965003490448, -1.0448994636535645, -1.000148892402649, -0.9553982615470886, -0.9106476306915283, -0.8658970594406128, -0.8211463689804077, -0.7763957381248474, -0.7316451668739319, -0.6868945360183716, -0.642143964767456, -0.5973933339118958, -0.5526427030563354, -0.5078921318054199, -0.4631415009498596, -0.4183908998966217, -0.3736402988433838, -0.3288896679878235, -0.28413906693458557, -0.23938846588134766, -0.19463783502578735, -0.14988723397254944, -0.10513663291931152, -0.06038602441549301, -0.0156354159116745, 0.02911520004272461, 0.07386580109596252, 0.11861640214920044, 0.16336703300476074, 0.20811763405799866, 0.2528682351112366, 0.2976188361644745, 0.3423694372177124, 0.3871200680732727, 0.4318706691265106, 0.47662127017974854, 0.5213719010353088, 0.5661225318908691, 0.6108731031417847]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 9.0, 9.0, 9.0, 7.0, 5.0, 7.0, 12.0, 27.0, 10.0, 24.0, 27.0, 32.0, 25.0, 32.0, 52.0, 44.0, 65.0, 86.0, 86.0, 64.0, 51.0, 42.0, 42.0, 25.0, 37.0, 23.0, 21.0, 27.0, 17.0, 19.0, 11.0, 11.0, 6.0, 10.0, 7.0, 6.0, 3.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5554711818695068, -0.5392701029777527, -0.5230690240859985, -0.5068679451942444, -0.4906668961048126, -0.47446581721305847, -0.4582647681236267, -0.44206368923187256, -0.4258626103401184, -0.40966153144836426, -0.3934604525566101, -0.37725940346717834, -0.3610583245754242, -0.34485724568367004, -0.3286561965942383, -0.31245511770248413, -0.29625403881073, -0.28005295991897583, -0.2638518810272217, -0.24765083193778992, -0.23144975304603577, -0.21524867415428162, -0.19904761016368866, -0.1828465461730957, -0.16664546728134155, -0.1504443883895874, -0.13424332439899445, -0.11804225295782089, -0.10184118151664734, -0.08564011007547379, -0.06943903863430023, -0.05323796719312668, -0.037036895751953125, -0.02083582431077957, -0.004634752869606018, 0.011566318571567535, 0.02776739001274109, 0.04396846145391464, 0.060169532895088196, 0.07637060433626175, 0.0925716757774353, 0.10877274721860886, 0.12497381865978241, 0.14117488265037537, 0.15737596154212952, 0.17357704043388367, 0.18977810442447662, 0.20597916841506958, 0.22218024730682373, 0.23838132619857788, 0.25458240509033203, 0.2707834541797638, 0.28698453307151794, 0.3031856119632721, 0.31938666105270386, 0.335587739944458, 0.35178881883621216, 0.3679898977279663, 0.38419097661972046, 0.4003920257091522, 0.41659310460090637, 0.4327941834926605, 0.4489952325820923, 0.46519631147384644, 0.4813973903656006]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 11.0, 12.0, 18.0, 18.0, 16.0, 22.0, 39.0, 55.0, 105.0, 151.0, 230.0, 361.0, 560.0, 975.0, 1887.0, 3867.0, 9744.0, 40109.0, 716576.0, 3252771.0, 136388.0, 18476.0, 6031.0, 2560.0, 1328.0, 723.0, 406.0, 272.0, 165.0, 111.0, 85.0, 58.0, 34.0, 25.0, 20.0, 16.0, 12.0, 10.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07086181640625, -0.06826210021972656, -0.06566238403320312, -0.06306266784667969, -0.06046295166015625, -0.05786323547363281, -0.055263519287109375, -0.05266380310058594, -0.0500640869140625, -0.04746437072753906, -0.044864654541015625, -0.04226493835449219, -0.03966522216796875, -0.03706550598144531, -0.034465789794921875, -0.03186607360839844, -0.029266357421875, -0.026666641235351562, -0.024066925048828125, -0.021467208862304688, -0.01886749267578125, -0.016267776489257812, -0.013668060302734375, -0.011068344116210938, -0.0084686279296875, -0.0058689117431640625, -0.003269195556640625, -0.0006694793701171875, 0.00193023681640625, 0.0045299530029296875, 0.007129669189453125, 0.009729385375976562, 0.0123291015625, 0.014928817749023438, 0.017528533935546875, 0.020128250122070312, 0.02272796630859375, 0.025327682495117188, 0.027927398681640625, 0.030527114868164062, 0.0331268310546875, 0.03572654724121094, 0.038326263427734375, 0.04092597961425781, 0.04352569580078125, 0.04612541198730469, 0.048725128173828125, 0.05132484436035156, 0.053924560546875, 0.05652427673339844, 0.059123992919921875, 0.06172370910644531, 0.06432342529296875, 0.06692314147949219, 0.06952285766601562, 0.07212257385253906, 0.0747222900390625, 0.07732200622558594, 0.07992172241210938, 0.08252143859863281, 0.08512115478515625, 0.08772087097167969, 0.09032058715820312, 0.09292030334472656, 0.09552001953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 7.0, 11.0, 18.0, 10.0, 18.0, 21.0, 32.0, 29.0, 25.0, 48.0, 49.0, 41.0, 38.0, 42.0, 51.0, 53.0, 52.0, 44.0, 57.0, 54.0, 35.0, 41.0, 29.0, 31.0, 30.0, 22.0, 11.0, 24.0, 13.0, 5.0, 11.0, 8.0, 3.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0303192138671875, -0.029388904571533203, -0.028458595275878906, -0.02752828598022461, -0.026597976684570312, -0.025667667388916016, -0.02473735809326172, -0.023807048797607422, -0.022876739501953125, -0.021946430206298828, -0.02101612091064453, -0.020085811614990234, -0.019155502319335938, -0.01822519302368164, -0.017294883728027344, -0.016364574432373047, -0.01543426513671875, -0.014503955841064453, -0.013573646545410156, -0.01264333724975586, -0.011713027954101562, -0.010782718658447266, -0.009852409362792969, -0.008922100067138672, -0.007991790771484375, -0.007061481475830078, -0.006131172180175781, -0.005200862884521484, -0.0042705535888671875, -0.0033402442932128906, -0.0024099349975585938, -0.0014796257019042969, -0.00054931640625, 0.0003809928894042969, 0.0013113021850585938, 0.0022416114807128906, 0.0031719207763671875, 0.004102230072021484, 0.005032539367675781, 0.005962848663330078, 0.006893157958984375, 0.007823467254638672, 0.008753776550292969, 0.009684085845947266, 0.010614395141601562, 0.01154470443725586, 0.012475013732910156, 0.013405323028564453, 0.01433563232421875, 0.015265941619873047, 0.016196250915527344, 0.01712656021118164, 0.018056869506835938, 0.018987178802490234, 0.01991748809814453, 0.020847797393798828, 0.021778106689453125, 0.022708415985107422, 0.02363872528076172, 0.024569034576416016, 0.025499343872070312, 0.02642965316772461, 0.027359962463378906, 0.028290271759033203, 0.0292205810546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 15.0, 8.0, 15.0, 35.0, 66.0, 132.0, 278.0, 780.0, 2698.0, 28912.0, 4119550.0, 37658.0, 2944.0, 707.0, 257.0, 126.0, 45.0, 23.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330322265625, -0.3191375732421875, -0.307952880859375, -0.2967681884765625, -0.28558349609375, -0.2743988037109375, -0.263214111328125, -0.2520294189453125, -0.2408447265625, -0.2296600341796875, -0.218475341796875, -0.2072906494140625, -0.19610595703125, -0.1849212646484375, -0.173736572265625, -0.1625518798828125, -0.1513671875, -0.1401824951171875, -0.128997802734375, -0.1178131103515625, -0.10662841796875, -0.0954437255859375, -0.084259033203125, -0.0730743408203125, -0.0618896484375, -0.0507049560546875, -0.039520263671875, -0.0283355712890625, -0.01715087890625, -0.0059661865234375, 0.005218505859375, 0.0164031982421875, 0.027587890625, 0.0387725830078125, 0.049957275390625, 0.0611419677734375, 0.07232666015625, 0.0835113525390625, 0.094696044921875, 0.1058807373046875, 0.1170654296875, 0.1282501220703125, 0.139434814453125, 0.1506195068359375, 0.16180419921875, 0.1729888916015625, 0.184173583984375, 0.1953582763671875, 0.20654296875, 0.2177276611328125, 0.228912353515625, 0.2400970458984375, 0.25128173828125, 0.2624664306640625, 0.273651123046875, 0.2848358154296875, 0.2960205078125, 0.3072052001953125, 0.318389892578125, 0.3295745849609375, 0.34075927734375, 0.3519439697265625, 0.363128662109375, 0.3743133544921875, 0.385498046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 7.0, 6.0, 17.0, 24.0, 40.0, 114.0, 432.0, 2008.0, 1071.0, 210.0, 71.0, 30.0, 24.0, 14.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2808341979980469, -0.27358245849609375, -0.2663307189941406, -0.2590789794921875, -0.2518272399902344, -0.24457550048828125, -0.23732376098632812, -0.230072021484375, -0.22282028198242188, -0.21556854248046875, -0.20831680297851562, -0.2010650634765625, -0.19381332397460938, -0.18656158447265625, -0.17930984497070312, -0.17205810546875, -0.16480636596679688, -0.15755462646484375, -0.15030288696289062, -0.1430511474609375, -0.13579940795898438, -0.12854766845703125, -0.12129592895507812, -0.114044189453125, -0.10679244995117188, -0.09954071044921875, -0.09228897094726562, -0.0850372314453125, -0.07778549194335938, -0.07053375244140625, -0.06328201293945312, -0.0560302734375, -0.048778533935546875, -0.04152679443359375, -0.034275054931640625, -0.0270233154296875, -0.019771575927734375, -0.01251983642578125, -0.005268096923828125, 0.001983642578125, 0.009235382080078125, 0.01648712158203125, 0.023738861083984375, 0.0309906005859375, 0.038242340087890625, 0.04549407958984375, 0.052745819091796875, 0.05999755859375, 0.06724929809570312, 0.07450103759765625, 0.08175277709960938, 0.0890045166015625, 0.09625625610351562, 0.10350799560546875, 0.11075973510742188, 0.118011474609375, 0.12526321411132812, 0.13251495361328125, 0.13976669311523438, 0.1470184326171875, 0.15427017211914062, 0.16152191162109375, 0.16877365112304688, 0.176025390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 14.0, 18.0, 43.0, 101.0, 187.0, 281.0, 205.0, 86.0, 31.0, 16.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.298693895339966, -2.2515151500701904, -2.204336643218994, -2.1571578979492188, -2.1099791526794434, -2.062800407409668, -2.0156216621398926, -1.9684431552886963, -1.921264410018921, -1.8740856647491455, -1.8269070386886597, -1.7797284126281738, -1.7325496673583984, -1.685370922088623, -1.6381922960281372, -1.5910136699676514, -1.543834924697876, -1.4966561794281006, -1.4494775533676147, -1.402298927307129, -1.3551201820373535, -1.3079414367675781, -1.2607628107070923, -1.2135841846466064, -1.166405439376831, -1.1192266941070557, -1.0720480680465698, -1.024869441986084, -0.9776906967163086, -0.930512011051178, -0.8833333253860474, -0.8361546397209167, -0.7889760732650757, -0.7417973875999451, -0.6946187019348145, -0.6474400162696838, -0.6002613306045532, -0.5530826449394226, -0.505903959274292, -0.4587252736091614, -0.41154658794403076, -0.36436790227890015, -0.31718921661376953, -0.2700105309486389, -0.2228318452835083, -0.17565315961837769, -0.12847447395324707, -0.08129578828811646, -0.03411710262298584, 0.013061583042144775, 0.06024026870727539, 0.107418954372406, 0.15459764003753662, 0.20177632570266724, 0.24895501136779785, 0.29613369703292847, 0.3433123826980591, 0.3904910683631897, 0.4376697540283203, 0.4848484396934509, 0.5320271253585815, 0.5792058110237122, 0.6263844966888428, 0.6735631823539734, 0.720741868019104]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 3.0, 7.0, 9.0, 14.0, 11.0, 8.0, 15.0, 17.0, 25.0, 26.0, 29.0, 42.0, 33.0, 35.0, 45.0, 31.0, 40.0, 40.0, 49.0, 40.0, 33.0, 51.0, 32.0, 36.0, 43.0, 37.0, 26.0, 25.0, 32.0, 20.0, 17.0, 17.0, 15.0, 10.0, 14.0, 11.0, 5.0, 12.0, 5.0, 1.0, 7.0, 4.0, 3.0, 0.0, 8.0, 1.0, 1.0, 5.0], "bins": [-0.4417431950569153, -0.42889025807380676, -0.41603735089302063, -0.4031844139099121, -0.390331506729126, -0.37747856974601746, -0.36462563276290894, -0.3517727255821228, -0.3389197885990143, -0.32606685161590576, -0.31321394443511963, -0.3003610074520111, -0.2875080704689026, -0.27465516328811646, -0.26180222630500793, -0.2489493042230606, -0.23609638214111328, -0.22324346005916595, -0.21039053797721863, -0.1975376009941101, -0.18468467891216278, -0.17183175683021545, -0.15897881984710693, -0.1461258977651596, -0.13327297568321228, -0.12042005360126495, -0.10756712406873703, -0.0947141945362091, -0.08186127245426178, -0.06900835037231445, -0.05615542083978653, -0.043302491307258606, -0.03044956922531128, -0.017596643418073654, -0.004743717610836029, 0.008109208196401596, 0.02096213400363922, 0.03381505608558655, 0.04666798561811447, 0.059520915150642395, 0.07237383723258972, 0.08522675931453705, 0.09807968884706497, 0.1109326183795929, 0.12378554046154022, 0.13663846254348755, 0.14949139952659607, 0.1623443216085434, 0.17519724369049072, 0.18805016577243805, 0.20090308785438538, 0.2137560248374939, 0.22660894691944122, 0.23946186900138855, 0.25231480598449707, 0.2651677131652832, 0.2780206501483917, 0.29087358713150024, 0.3037264943122864, 0.3165794312953949, 0.3294323682785034, 0.34228527545928955, 0.35513821244239807, 0.3679911494255066, 0.3808440566062927]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 11.0, 3.0, 20.0, 18.0, 25.0, 45.0, 69.0, 90.0, 150.0, 223.0, 335.0, 453.0, 769.0, 1400.0, 2415.0, 4149.0, 8011.0, 16150.0, 34809.0, 81997.0, 207319.0, 354188.0, 193605.0, 76337.0, 33219.0, 15436.0, 7555.0, 4049.0, 2211.0, 1343.0, 765.0, 467.0, 306.0, 209.0, 107.0, 89.0, 70.0, 42.0, 22.0, 18.0, 14.0, 9.0, 6.0, 10.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.053802490234375, -0.05224132537841797, -0.05068016052246094, -0.049118995666503906, -0.047557830810546875, -0.045996665954589844, -0.04443550109863281, -0.04287433624267578, -0.04131317138671875, -0.03975200653076172, -0.03819084167480469, -0.036629676818847656, -0.035068511962890625, -0.033507347106933594, -0.03194618225097656, -0.03038501739501953, -0.0288238525390625, -0.02726268768310547, -0.025701522827148438, -0.024140357971191406, -0.022579193115234375, -0.021018028259277344, -0.019456863403320312, -0.01789569854736328, -0.01633453369140625, -0.014773368835449219, -0.013212203979492188, -0.011651039123535156, -0.010089874267578125, -0.008528709411621094, -0.0069675445556640625, -0.005406379699707031, -0.00384521484375, -0.0022840499877929688, -0.0007228851318359375, 0.0008382797241210938, 0.002399444580078125, 0.003960609436035156, 0.0055217742919921875, 0.007082939147949219, 0.00864410400390625, 0.010205268859863281, 0.011766433715820312, 0.013327598571777344, 0.014888763427734375, 0.016449928283691406, 0.018011093139648438, 0.01957225799560547, 0.0211334228515625, 0.02269458770751953, 0.024255752563476562, 0.025816917419433594, 0.027378082275390625, 0.028939247131347656, 0.030500411987304688, 0.03206157684326172, 0.03362274169921875, 0.03518390655517578, 0.03674507141113281, 0.038306236267089844, 0.039867401123046875, 0.041428565979003906, 0.04298973083496094, 0.04455089569091797, 0.046112060546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 15.0, 19.0, 19.0, 17.0, 21.0, 27.0, 35.0, 32.0, 49.0, 52.0, 52.0, 48.0, 61.0, 44.0, 74.0, 51.0, 57.0, 56.0, 40.0, 32.0, 34.0, 29.0, 24.0, 21.0, 13.0, 10.0, 12.0, 10.0, 4.0, 5.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.039154052734375, -0.037824153900146484, -0.03649425506591797, -0.03516435623168945, -0.03383445739746094, -0.03250455856323242, -0.031174659729003906, -0.02984476089477539, -0.028514862060546875, -0.02718496322631836, -0.025855064392089844, -0.024525165557861328, -0.023195266723632812, -0.021865367889404297, -0.02053546905517578, -0.019205570220947266, -0.01787567138671875, -0.016545772552490234, -0.015215873718261719, -0.013885974884033203, -0.012556076049804688, -0.011226177215576172, -0.009896278381347656, -0.00856637954711914, -0.007236480712890625, -0.005906581878662109, -0.004576683044433594, -0.003246784210205078, -0.0019168853759765625, -0.0005869865417480469, 0.0007429122924804688, 0.0020728111267089844, 0.0034027099609375, 0.004732608795166016, 0.006062507629394531, 0.007392406463623047, 0.008722305297851562, 0.010052204132080078, 0.011382102966308594, 0.01271200180053711, 0.014041900634765625, 0.01537179946899414, 0.016701698303222656, 0.018031597137451172, 0.019361495971679688, 0.020691394805908203, 0.02202129364013672, 0.023351192474365234, 0.02468109130859375, 0.026010990142822266, 0.02734088897705078, 0.028670787811279297, 0.030000686645507812, 0.03133058547973633, 0.032660484313964844, 0.03399038314819336, 0.035320281982421875, 0.03665018081665039, 0.037980079650878906, 0.03930997848510742, 0.04063987731933594, 0.04196977615356445, 0.04329967498779297, 0.044629573822021484, 0.04595947265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 9.0, 4.0, 8.0, 13.0, 10.0, 18.0, 18.0, 32.0, 47.0, 57.0, 67.0, 108.0, 128.0, 189.0, 274.0, 502.0, 981.0, 2035.0, 5403.0, 19473.0, 105571.0, 733235.0, 144438.0, 24367.0, 6522.0, 2351.0, 1063.0, 522.0, 317.0, 239.0, 144.0, 114.0, 73.0, 47.0, 39.0, 39.0, 21.0, 25.0, 14.0, 13.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1192626953125, -0.11536216735839844, -0.11146163940429688, -0.10756111145019531, -0.10366058349609375, -0.09976005554199219, -0.09585952758789062, -0.09195899963378906, -0.0880584716796875, -0.08415794372558594, -0.08025741577148438, -0.07635688781738281, -0.07245635986328125, -0.06855583190917969, -0.06465530395507812, -0.06075477600097656, -0.056854248046875, -0.05295372009277344, -0.049053192138671875, -0.04515266418457031, -0.04125213623046875, -0.03735160827636719, -0.033451080322265625, -0.029550552368164062, -0.0256500244140625, -0.021749496459960938, -0.017848968505859375, -0.013948440551757812, -0.01004791259765625, -0.0061473846435546875, -0.002246856689453125, 0.0016536712646484375, 0.00555419921875, 0.009454727172851562, 0.013355255126953125, 0.017255783081054688, 0.02115631103515625, 0.025056838989257812, 0.028957366943359375, 0.03285789489746094, 0.0367584228515625, 0.04065895080566406, 0.044559478759765625, 0.04846000671386719, 0.05236053466796875, 0.05626106262207031, 0.060161590576171875, 0.06406211853027344, 0.067962646484375, 0.07186317443847656, 0.07576370239257812, 0.07966423034667969, 0.08356475830078125, 0.08746528625488281, 0.09136581420898438, 0.09526634216308594, 0.0991668701171875, 0.10306739807128906, 0.10696792602539062, 0.11086845397949219, 0.11476898193359375, 0.11866950988769531, 0.12257003784179688, 0.12647056579589844, 0.13037109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 7.0, 5.0, 7.0, 11.0, 10.0, 17.0, 9.0, 13.0, 20.0, 15.0, 19.0, 37.0, 41.0, 44.0, 52.0, 54.0, 49.0, 60.0, 62.0, 68.0, 60.0, 50.0, 39.0, 44.0, 27.0, 34.0, 22.0, 15.0, 21.0, 8.0, 17.0, 9.0, 8.0, 8.0, 8.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1744384765625, -0.16887664794921875, -0.1633148193359375, -0.15775299072265625, -0.152191162109375, -0.14662933349609375, -0.1410675048828125, -0.13550567626953125, -0.12994384765625, -0.12438201904296875, -0.1188201904296875, -0.11325836181640625, -0.107696533203125, -0.10213470458984375, -0.0965728759765625, -0.09101104736328125, -0.08544921875, -0.07988739013671875, -0.0743255615234375, -0.06876373291015625, -0.063201904296875, -0.05764007568359375, -0.0520782470703125, -0.04651641845703125, -0.04095458984375, -0.03539276123046875, -0.0298309326171875, -0.02426910400390625, -0.018707275390625, -0.01314544677734375, -0.0075836181640625, -0.00202178955078125, 0.0035400390625, 0.00910186767578125, 0.0146636962890625, 0.02022552490234375, 0.025787353515625, 0.03134918212890625, 0.0369110107421875, 0.04247283935546875, 0.04803466796875, 0.05359649658203125, 0.0591583251953125, 0.06472015380859375, 0.070281982421875, 0.07584381103515625, 0.0814056396484375, 0.08696746826171875, 0.092529296875, 0.09809112548828125, 0.1036529541015625, 0.10921478271484375, 0.114776611328125, 0.12033843994140625, 0.1259002685546875, 0.13146209716796875, 0.13702392578125, 0.14258575439453125, 0.1481475830078125, 0.15370941162109375, 0.159271240234375, 0.16483306884765625, 0.1703948974609375, 0.17595672607421875, 0.1815185546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 1.0, 16.0, 10.0, 16.0, 28.0, 47.0, 47.0, 59.0, 105.0, 137.0, 227.0, 321.0, 546.0, 1006.0, 1967.0, 4247.0, 11594.0, 41842.0, 599422.0, 329191.0, 38240.0, 10973.0, 4161.0, 1823.0, 958.0, 529.0, 333.0, 202.0, 132.0, 100.0, 75.0, 51.0, 36.0, 26.0, 24.0, 16.0, 12.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06787109375, -0.06593036651611328, -0.06398963928222656, -0.062048912048339844, -0.060108184814453125, -0.058167457580566406, -0.05622673034667969, -0.05428600311279297, -0.05234527587890625, -0.05040454864501953, -0.04846382141113281, -0.046523094177246094, -0.044582366943359375, -0.042641639709472656, -0.04070091247558594, -0.03876018524169922, -0.0368194580078125, -0.03487873077392578, -0.03293800354003906, -0.030997276306152344, -0.029056549072265625, -0.027115821838378906, -0.025175094604492188, -0.02323436737060547, -0.02129364013671875, -0.01935291290283203, -0.017412185668945312, -0.015471458435058594, -0.013530731201171875, -0.011590003967285156, -0.009649276733398438, -0.007708549499511719, -0.005767822265625, -0.0038270950317382812, -0.0018863677978515625, 5.435943603515625e-05, 0.001995086669921875, 0.003935813903808594, 0.0058765411376953125, 0.007817268371582031, 0.00975799560546875, 0.011698722839355469, 0.013639450073242188, 0.015580177307128906, 0.017520904541015625, 0.019461631774902344, 0.021402359008789062, 0.02334308624267578, 0.0252838134765625, 0.02722454071044922, 0.029165267944335938, 0.031105995178222656, 0.033046722412109375, 0.034987449645996094, 0.03692817687988281, 0.03886890411376953, 0.04080963134765625, 0.04275035858154297, 0.04469108581542969, 0.046631813049316406, 0.048572540283203125, 0.050513267517089844, 0.05245399475097656, 0.05439472198486328, 0.05633544921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 10.0, 7.0, 8.0, 13.0, 18.0, 19.0, 28.0, 34.0, 37.0, 55.0, 86.0, 97.0, 106.0, 89.0, 58.0, 73.0, 58.0, 45.0, 28.0, 23.0, 20.0, 25.0, 10.0, 6.0, 10.0, 6.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8967857360839844e-05, -2.8157606720924377e-05, -2.734735608100891e-05, -2.6537105441093445e-05, -2.572685480117798e-05, -2.4916604161262512e-05, -2.4106353521347046e-05, -2.329610288143158e-05, -2.2485852241516113e-05, -2.1675601601600647e-05, -2.086535096168518e-05, -2.0055100321769714e-05, -1.9244849681854248e-05, -1.8434599041938782e-05, -1.7624348402023315e-05, -1.681409776210785e-05, -1.6003847122192383e-05, -1.5193596482276917e-05, -1.438334584236145e-05, -1.3573095202445984e-05, -1.2762844562530518e-05, -1.1952593922615051e-05, -1.1142343282699585e-05, -1.0332092642784119e-05, -9.521842002868652e-06, -8.711591362953186e-06, -7.90134072303772e-06, -7.091090083122253e-06, -6.280839443206787e-06, -5.470588803291321e-06, -4.6603381633758545e-06, -3.850087523460388e-06, -3.039836883544922e-06, -2.2295862436294556e-06, -1.4193356037139893e-06, -6.09084963798523e-07, 2.0116567611694336e-07, 1.0114163160324097e-06, 1.821666955947876e-06, 2.6319175958633423e-06, 3.4421682357788086e-06, 4.252418875694275e-06, 5.062669515609741e-06, 5.8729201555252075e-06, 6.683170795440674e-06, 7.49342143535614e-06, 8.303672075271606e-06, 9.113922715187073e-06, 9.924173355102539e-06, 1.0734423995018005e-05, 1.1544674634933472e-05, 1.2354925274848938e-05, 1.3165175914764404e-05, 1.397542655467987e-05, 1.4785677194595337e-05, 1.5595927834510803e-05, 1.640617847442627e-05, 1.7216429114341736e-05, 1.8026679754257202e-05, 1.883693039417267e-05, 1.9647181034088135e-05, 2.04574316740036e-05, 2.1267682313919067e-05, 2.2077932953834534e-05, 2.288818359375e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 7.0, 9.0, 7.0, 13.0, 15.0, 14.0, 28.0, 40.0, 56.0, 101.0, 158.0, 231.0, 460.0, 865.0, 2056.0, 5419.0, 18091.0, 97708.0, 813505.0, 84319.0, 16444.0, 5062.0, 1990.0, 857.0, 455.0, 243.0, 123.0, 81.0, 49.0, 27.0, 31.0, 28.0, 12.0, 14.0, 7.0, 5.0, 7.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07171630859375, -0.06943702697753906, -0.06715774536132812, -0.06487846374511719, -0.06259918212890625, -0.06031990051269531, -0.058040618896484375, -0.05576133728027344, -0.0534820556640625, -0.05120277404785156, -0.048923492431640625, -0.04664421081542969, -0.04436492919921875, -0.04208564758300781, -0.039806365966796875, -0.03752708435058594, -0.035247802734375, -0.03296852111816406, -0.030689239501953125, -0.028409957885742188, -0.02613067626953125, -0.023851394653320312, -0.021572113037109375, -0.019292831420898438, -0.0170135498046875, -0.014734268188476562, -0.012454986572265625, -0.010175704956054688, -0.00789642333984375, -0.0056171417236328125, -0.003337860107421875, -0.0010585784912109375, 0.001220703125, 0.0034999847412109375, 0.005779266357421875, 0.008058547973632812, 0.01033782958984375, 0.012617111206054688, 0.014896392822265625, 0.017175674438476562, 0.0194549560546875, 0.021734237670898438, 0.024013519287109375, 0.026292800903320312, 0.02857208251953125, 0.030851364135742188, 0.033130645751953125, 0.03540992736816406, 0.037689208984375, 0.03996849060058594, 0.042247772216796875, 0.04452705383300781, 0.04680633544921875, 0.04908561706542969, 0.051364898681640625, 0.05364418029785156, 0.0559234619140625, 0.05820274353027344, 0.060482025146484375, 0.06276130676269531, 0.06504058837890625, 0.06731986999511719, 0.06959915161132812, 0.07187843322753906, 0.07415771484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 15.0, 17.0, 19.0, 22.0, 38.0, 29.0, 60.0, 69.0, 130.0, 174.0, 120.0, 91.0, 33.0, 37.0, 32.0, 19.0, 16.0, 15.0, 16.0, 5.0, 6.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045440673828125, -0.04342031478881836, -0.04139995574951172, -0.03937959671020508, -0.03735923767089844, -0.0353388786315918, -0.033318519592285156, -0.031298160552978516, -0.029277801513671875, -0.027257442474365234, -0.025237083435058594, -0.023216724395751953, -0.021196365356445312, -0.019176006317138672, -0.01715564727783203, -0.01513528823852539, -0.01311492919921875, -0.01109457015991211, -0.009074211120605469, -0.007053852081298828, -0.0050334930419921875, -0.003013134002685547, -0.0009927749633789062, 0.0010275840759277344, 0.003047943115234375, 0.005068302154541016, 0.007088661193847656, 0.009109020233154297, 0.011129379272460938, 0.013149738311767578, 0.015170097351074219, 0.01719045639038086, 0.0192108154296875, 0.02123117446899414, 0.02325153350830078, 0.025271892547607422, 0.027292251586914062, 0.029312610626220703, 0.031332969665527344, 0.033353328704833984, 0.035373687744140625, 0.037394046783447266, 0.039414405822753906, 0.04143476486206055, 0.04345512390136719, 0.04547548294067383, 0.04749584197998047, 0.04951620101928711, 0.05153656005859375, 0.05355691909790039, 0.05557727813720703, 0.05759763717651367, 0.05961799621582031, 0.06163835525512695, 0.0636587142944336, 0.06567907333374023, 0.06769943237304688, 0.06971979141235352, 0.07174015045166016, 0.0737605094909668, 0.07578086853027344, 0.07780122756958008, 0.07982158660888672, 0.08184194564819336, 0.0838623046875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 6.0, 7.0, 13.0, 10.0, 30.0, 53.0, 74.0, 98.0, 218.0, 253.0, 107.0, 56.0, 33.0, 21.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6746373176574707, -1.6383001804351807, -1.6019630432128906, -1.5656259059906006, -1.5292887687683105, -1.492951512336731, -1.456614375114441, -1.4202772378921509, -1.3839401006698608, -1.3476029634475708, -1.3112658262252808, -1.2749286890029907, -1.2385914325714111, -1.202254295349121, -1.165917158126831, -1.129580020904541, -1.093242883682251, -1.056905746459961, -1.020568609237671, -0.9842314124107361, -0.947894275188446, -0.911557137966156, -0.8752199411392212, -0.8388828039169312, -0.8025456666946411, -0.7662085294723511, -0.729871392250061, -0.6935341954231262, -0.6571970582008362, -0.6208599209785461, -0.5845227241516113, -0.5481855869293213, -0.5118483304977417, -0.47551119327545166, -0.43917402625083923, -0.4028368592262268, -0.36649972200393677, -0.33016258478164673, -0.2938254177570343, -0.2574882507324219, -0.22115111351013184, -0.1848139613866806, -0.14847680926322937, -0.11213965713977814, -0.0758025050163269, -0.03946535289287567, -0.0031282007694244385, 0.03320896625518799, 0.06954610347747803, 0.10588325560092926, 0.1422204077243805, 0.17855755984783173, 0.21489471197128296, 0.251231849193573, 0.2875690162181854, 0.32390618324279785, 0.3602433204650879, 0.39658045768737793, 0.43291762471199036, 0.4692547917366028, 0.5055919289588928, 0.5419290661811829, 0.5782662630081177, 0.6146034002304077, 0.6509405374526978]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 3.0, 10.0, 11.0, 16.0, 18.0, 15.0, 29.0, 26.0, 21.0, 31.0, 33.0, 48.0, 48.0, 77.0, 145.0, 94.0, 64.0, 47.0, 38.0, 37.0, 28.0, 27.0, 15.0, 23.0, 13.0, 16.0, 16.0, 11.0, 6.0, 10.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.05391526222229, -1.0260175466537476, -0.9981198310852051, -0.9702221155166626, -0.9423243403434753, -0.9144266247749329, -0.8865289092063904, -0.8586311936378479, -0.8307334184646606, -0.8028357028961182, -0.7749379873275757, -0.7470402717590332, -0.719142496585846, -0.6912447810173035, -0.663347065448761, -0.6354493498802185, -0.607551634311676, -0.5796539187431335, -0.5517562031745911, -0.5238584280014038, -0.49596071243286133, -0.46806299686431885, -0.44016528129577637, -0.4122675657272339, -0.384369820356369, -0.35647210478782654, -0.32857435941696167, -0.3006766438484192, -0.2727789282798767, -0.24488118290901184, -0.21698346734046936, -0.18908573687076569, -0.161188006401062, -0.13329027593135834, -0.10539255291223526, -0.07749482989311218, -0.04959709942340851, -0.021699368953704834, 0.0061983466148376465, 0.03409607708454132, 0.061993807554244995, 0.08989153802394867, 0.11778926104307175, 0.14568698406219482, 0.1735847145318985, 0.20148244500160217, 0.22938016057014465, 0.2572779059410095, 0.285175621509552, 0.3130733370780945, 0.34097108244895935, 0.36886879801750183, 0.3967665433883667, 0.4246642589569092, 0.45256197452545166, 0.48045969009399414, 0.5083574056625366, 0.5362551212310791, 0.5641528367996216, 0.5920505523681641, 0.6199483275413513, 0.6478460431098938, 0.6757437586784363, 0.7036414742469788, 0.731539249420166]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 12.0, 14.0, 21.0, 21.0, 29.0, 39.0, 61.0, 92.0, 119.0, 188.0, 378.0, 631.0, 1122.0, 2246.0, 5522.0, 21402.0, 348205.0, 3584278.0, 203936.0, 16594.0, 4750.0, 2072.0, 980.0, 548.0, 348.0, 221.0, 134.0, 90.0, 64.0, 40.0, 22.0, 22.0, 22.0, 12.0, 12.0, 7.0, 6.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.1143331527709961, -0.11080741882324219, -0.10728168487548828, -0.10375595092773438, -0.10023021697998047, -0.09670448303222656, -0.09317874908447266, -0.08965301513671875, -0.08612728118896484, -0.08260154724121094, -0.07907581329345703, -0.07555007934570312, -0.07202434539794922, -0.06849861145019531, -0.0649728775024414, -0.0614471435546875, -0.057921409606933594, -0.05439567565917969, -0.05086994171142578, -0.047344207763671875, -0.04381847381591797, -0.04029273986816406, -0.036767005920410156, -0.03324127197265625, -0.029715538024902344, -0.026189804077148438, -0.02266407012939453, -0.019138336181640625, -0.015612602233886719, -0.012086868286132812, -0.008561134338378906, -0.005035400390625, -0.0015096664428710938, 0.0020160675048828125, 0.005541801452636719, 0.009067535400390625, 0.012593269348144531, 0.016119003295898438, 0.019644737243652344, 0.02317047119140625, 0.026696205139160156, 0.030221939086914062, 0.03374767303466797, 0.037273406982421875, 0.04079914093017578, 0.04432487487792969, 0.047850608825683594, 0.0513763427734375, 0.054902076721191406, 0.05842781066894531, 0.06195354461669922, 0.06547927856445312, 0.06900501251220703, 0.07253074645996094, 0.07605648040771484, 0.07958221435546875, 0.08310794830322266, 0.08663368225097656, 0.09015941619873047, 0.09368515014648438, 0.09721088409423828, 0.10073661804199219, 0.1042623519897461, 0.1077880859375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 15.0, 21.0, 25.0, 26.0, 27.0, 31.0, 41.0, 68.0, 59.0, 64.0, 53.0, 63.0, 74.0, 64.0, 50.0, 62.0, 46.0, 40.0, 38.0, 24.0, 27.0, 13.0, 17.0, 7.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048828125, -0.047373294830322266, -0.04591846466064453, -0.0444636344909668, -0.04300880432128906, -0.04155397415161133, -0.040099143981933594, -0.03864431381225586, -0.037189483642578125, -0.03573465347290039, -0.034279823303222656, -0.03282499313354492, -0.03137016296386719, -0.029915332794189453, -0.02846050262451172, -0.027005672454833984, -0.02555084228515625, -0.024096012115478516, -0.02264118194580078, -0.021186351776123047, -0.019731521606445312, -0.018276691436767578, -0.016821861267089844, -0.01536703109741211, -0.013912200927734375, -0.01245737075805664, -0.011002540588378906, -0.009547710418701172, -0.008092880249023438, -0.006638050079345703, -0.005183219909667969, -0.0037283897399902344, -0.0022735595703125, -0.0008187294006347656, 0.0006361007690429688, 0.002090930938720703, 0.0035457611083984375, 0.005000591278076172, 0.006455421447753906, 0.00791025161743164, 0.009365081787109375, 0.01081991195678711, 0.012274742126464844, 0.013729572296142578, 0.015184402465820312, 0.016639232635498047, 0.01809406280517578, 0.019548892974853516, 0.02100372314453125, 0.022458553314208984, 0.02391338348388672, 0.025368213653564453, 0.026823043823242188, 0.028277873992919922, 0.029732704162597656, 0.03118753433227539, 0.032642364501953125, 0.03409719467163086, 0.035552024841308594, 0.03700685501098633, 0.03846168518066406, 0.0399165153503418, 0.04137134552001953, 0.042826175689697266, 0.044281005859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 23.0, 37.0, 81.0, 171.0, 352.0, 618.0, 9957.0, 4180469.0, 1669.0, 447.0, 246.0, 121.0, 44.0, 19.0, 12.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1442718505859375, -1.108856201171875, -1.0734405517578125, -1.03802490234375, -1.0026092529296875, -0.967193603515625, -0.9317779541015625, -0.8963623046875, -0.8609466552734375, -0.825531005859375, -0.7901153564453125, -0.75469970703125, -0.7192840576171875, -0.683868408203125, -0.6484527587890625, -0.613037109375, -0.5776214599609375, -0.542205810546875, -0.5067901611328125, -0.47137451171875, -0.4359588623046875, -0.400543212890625, -0.3651275634765625, -0.3297119140625, -0.2942962646484375, -0.258880615234375, -0.2234649658203125, -0.18804931640625, -0.1526336669921875, -0.117218017578125, -0.0818023681640625, -0.04638671875, -0.0109710693359375, 0.024444580078125, 0.0598602294921875, 0.09527587890625, 0.1306915283203125, 0.166107177734375, 0.2015228271484375, 0.2369384765625, 0.2723541259765625, 0.307769775390625, 0.3431854248046875, 0.37860107421875, 0.4140167236328125, 0.449432373046875, 0.4848480224609375, 0.520263671875, 0.5556793212890625, 0.591094970703125, 0.6265106201171875, 0.66192626953125, 0.6973419189453125, 0.732757568359375, 0.7681732177734375, 0.8035888671875, 0.8390045166015625, 0.874420166015625, 0.9098358154296875, 0.94525146484375, 0.9806671142578125, 1.016082763671875, 1.0514984130859375, 1.0869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 17.0, 40.0, 180.0, 1595.0, 1898.0, 246.0, 64.0, 21.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7666015625, -0.7521457672119141, -0.7376899719238281, -0.7232341766357422, -0.7087783813476562, -0.6943225860595703, -0.6798667907714844, -0.6654109954833984, -0.6509552001953125, -0.6364994049072266, -0.6220436096191406, -0.6075878143310547, -0.5931320190429688, -0.5786762237548828, -0.5642204284667969, -0.5497646331787109, -0.535308837890625, -0.5208530426025391, -0.5063972473144531, -0.4919414520263672, -0.47748565673828125, -0.4630298614501953, -0.4485740661621094, -0.43411827087402344, -0.4196624755859375, -0.40520668029785156, -0.3907508850097656, -0.3762950897216797, -0.36183929443359375, -0.3473834991455078, -0.3329277038574219, -0.31847190856933594, -0.30401611328125, -0.28956031799316406, -0.2751045227050781, -0.2606487274169922, -0.24619293212890625, -0.2317371368408203, -0.21728134155273438, -0.20282554626464844, -0.1883697509765625, -0.17391395568847656, -0.15945816040039062, -0.1450023651123047, -0.13054656982421875, -0.11609077453613281, -0.10163497924804688, -0.08717918395996094, -0.072723388671875, -0.05826759338378906, -0.043811798095703125, -0.029356002807617188, -0.01490020751953125, -0.0004444122314453125, 0.014011383056640625, 0.028467178344726562, 0.0429229736328125, 0.05737876892089844, 0.07183456420898438, 0.08629035949707031, 0.10074615478515625, 0.11520195007324219, 0.12965774536132812, 0.14411354064941406, 0.1585693359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 2.0, 1.0, 8.0, 7.0, 15.0, 19.0, 21.0, 40.0, 94.0, 163.0, 286.0, 193.0, 86.0, 33.0, 18.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4946515560150146, -3.4040281772613525, -3.3134047985076904, -3.2227814197540283, -3.132158041000366, -3.041534900665283, -2.950911521911621, -2.860288143157959, -2.769664764404297, -2.6790413856506348, -2.5884180068969727, -2.4977946281433105, -2.4071712493896484, -2.3165478706359863, -2.225924491882324, -2.135301351547241, -2.044677734375, -1.954054355621338, -1.8634309768676758, -1.7728075981140137, -1.6821843385696411, -1.591560959815979, -1.500937581062317, -1.4103143215179443, -1.3196909427642822, -1.2290675640106201, -1.138444185256958, -1.047820806503296, -0.9571975469589233, -0.8665741682052612, -0.7759507894515991, -0.6853274703025818, -0.5947041511535645, -0.5040807723999023, -0.413457453250885, -0.3228340744972229, -0.23221072554588318, -0.14158737659454346, -0.05096399784088135, 0.039659321308135986, 0.1302827000617981, 0.22090604901313782, 0.31152939796447754, 0.40215277671813965, 0.49277612566947937, 0.5833994746208191, 0.6740228533744812, 0.7646461725234985, 0.8552695512771606, 0.9458929300308228, 1.0365163087844849, 1.1271395683288574, 1.2177629470825195, 1.3083863258361816, 1.3990097045898438, 1.4896330833435059, 1.580256462097168, 1.67087984085083, 1.7615032196044922, 1.8521265983581543, 1.9427498579025269, 2.0333733558654785, 2.1239967346191406, 2.2146198749542236, 2.3052432537078857]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 8.0, 7.0, 4.0, 9.0, 15.0, 14.0, 30.0, 24.0, 21.0, 34.0, 54.0, 46.0, 46.0, 64.0, 62.0, 56.0, 60.0, 63.0, 48.0, 51.0, 32.0, 51.0, 32.0, 36.0, 21.0, 26.0, 18.0, 11.0, 10.0, 6.0, 8.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0613040924072266, -1.0201447010040283, -0.9789851903915405, -0.9378257393836975, -0.8966662883758545, -0.8555068969726562, -0.8143474459648132, -0.7731879949569702, -0.7320285439491272, -0.6908690929412842, -0.6497096419334412, -0.6085501909255981, -0.5673907995223999, -0.5262312889099121, -0.48507189750671387, -0.44391244649887085, -0.40275299549102783, -0.3615935444831848, -0.3204340934753418, -0.27927467226982117, -0.23811522126197815, -0.19695577025413513, -0.1557963341474533, -0.11463689804077148, -0.07347744703292847, -0.032318003475666046, 0.008841440081596375, 0.050000883638858795, 0.09116032719612122, 0.13231977820396423, 0.17347921431064606, 0.21463865041732788, 0.25579798221588135, 0.29695743322372437, 0.3381168842315674, 0.379276305437088, 0.42043575644493103, 0.46159520745277405, 0.5027546286582947, 0.5439140796661377, 0.5850735306739807, 0.6262329816818237, 0.6673924326896667, 0.7085518836975098, 0.749711275100708, 0.7908707857131958, 0.832030177116394, 0.8731896281242371, 0.9143490791320801, 0.9555085301399231, 0.9966679811477661, 1.0378273725509644, 1.0789868831634521, 1.1201462745666504, 1.1613057851791382, 1.2024651765823364, 1.2436246871948242, 1.2847840785980225, 1.3259435892105103, 1.3671029806137085, 1.4082624912261963, 1.4494218826293945, 1.4905813932418823, 1.5317407846450806, 1.5729001760482788]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 12.0, 25.0, 11.0, 26.0, 37.0, 67.0, 90.0, 122.0, 155.0, 230.0, 329.0, 451.0, 692.0, 1018.0, 1738.0, 2803.0, 5004.0, 9868.0, 21528.0, 55197.0, 186040.0, 486226.0, 179293.0, 54076.0, 21162.0, 9689.0, 4997.0, 2786.0, 1608.0, 1023.0, 693.0, 445.0, 344.0, 212.0, 155.0, 111.0, 77.0, 68.0, 40.0, 18.0, 20.0, 15.0, 16.0, 10.0, 7.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10028076171875, -0.09687995910644531, -0.09347915649414062, -0.09007835388183594, -0.08667755126953125, -0.08327674865722656, -0.07987594604492188, -0.07647514343261719, -0.0730743408203125, -0.06967353820800781, -0.06627273559570312, -0.06287193298339844, -0.05947113037109375, -0.05607032775878906, -0.052669525146484375, -0.04926872253417969, -0.045867919921875, -0.04246711730957031, -0.039066314697265625, -0.03566551208496094, -0.03226470947265625, -0.028863906860351562, -0.025463104248046875, -0.022062301635742188, -0.0186614990234375, -0.015260696411132812, -0.011859893798828125, -0.008459091186523438, -0.00505828857421875, -0.0016574859619140625, 0.001743316650390625, 0.0051441192626953125, 0.008544921875, 0.011945724487304688, 0.015346527099609375, 0.018747329711914062, 0.02214813232421875, 0.025548934936523438, 0.028949737548828125, 0.03235054016113281, 0.0357513427734375, 0.03915214538574219, 0.042552947998046875, 0.04595375061035156, 0.04935455322265625, 0.05275535583496094, 0.056156158447265625, 0.05955696105957031, 0.062957763671875, 0.06635856628417969, 0.06975936889648438, 0.07316017150878906, 0.07656097412109375, 0.07996177673339844, 0.08336257934570312, 0.08676338195800781, 0.0901641845703125, 0.09356498718261719, 0.09696578979492188, 0.10036659240722656, 0.10376739501953125, 0.10716819763183594, 0.11056900024414062, 0.11396980285644531, 0.11737060546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 5.0, 5.0, 13.0, 8.0, 9.0, 13.0, 13.0, 21.0, 16.0, 32.0, 26.0, 30.0, 26.0, 47.0, 42.0, 58.0, 47.0, 46.0, 60.0, 53.0, 57.0, 44.0, 47.0, 38.0, 38.0, 38.0, 26.0, 15.0, 20.0, 10.0, 21.0, 11.0, 8.0, 11.0, 9.0, 8.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06280517578125, -0.06068229675292969, -0.058559417724609375, -0.05643653869628906, -0.05431365966796875, -0.05219078063964844, -0.050067901611328125, -0.04794502258300781, -0.0458221435546875, -0.04369926452636719, -0.041576385498046875, -0.03945350646972656, -0.03733062744140625, -0.03520774841308594, -0.033084869384765625, -0.030961990356445312, -0.028839111328125, -0.026716232299804688, -0.024593353271484375, -0.022470474243164062, -0.02034759521484375, -0.018224716186523438, -0.016101837158203125, -0.013978958129882812, -0.0118560791015625, -0.009733200073242188, -0.007610321044921875, -0.0054874420166015625, -0.00336456298828125, -0.0012416839599609375, 0.000881195068359375, 0.0030040740966796875, 0.005126953125, 0.0072498321533203125, 0.009372711181640625, 0.011495590209960938, 0.01361846923828125, 0.015741348266601562, 0.017864227294921875, 0.019987106323242188, 0.0221099853515625, 0.024232864379882812, 0.026355743408203125, 0.028478622436523438, 0.03060150146484375, 0.03272438049316406, 0.034847259521484375, 0.03697013854980469, 0.039093017578125, 0.04121589660644531, 0.043338775634765625, 0.04546165466308594, 0.04758453369140625, 0.04970741271972656, 0.051830291748046875, 0.05395317077636719, 0.0560760498046875, 0.05819892883300781, 0.060321807861328125, 0.06244468688964844, 0.06456756591796875, 0.06669044494628906, 0.06881332397460938, 0.07093620300292969, 0.07305908203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 6.0, 2.0, 9.0, 7.0, 13.0, 17.0, 22.0, 25.0, 56.0, 74.0, 98.0, 170.0, 312.0, 554.0, 1373.0, 4868.0, 49796.0, 955268.0, 29729.0, 3753.0, 1130.0, 478.0, 266.0, 181.0, 99.0, 66.0, 50.0, 31.0, 24.0, 10.0, 14.0, 16.0, 5.0, 6.0, 1.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.496337890625, -0.4800224304199219, -0.46370697021484375, -0.4473915100097656, -0.4310760498046875, -0.4147605895996094, -0.39844512939453125, -0.3821296691894531, -0.365814208984375, -0.3494987487792969, -0.33318328857421875, -0.3168678283691406, -0.3005523681640625, -0.2842369079589844, -0.26792144775390625, -0.2516059875488281, -0.23529052734375, -0.21897506713867188, -0.20265960693359375, -0.18634414672851562, -0.1700286865234375, -0.15371322631835938, -0.13739776611328125, -0.12108230590820312, -0.104766845703125, -0.08845138549804688, -0.07213592529296875, -0.055820465087890625, -0.0395050048828125, -0.023189544677734375, -0.00687408447265625, 0.009441375732421875, 0.0257568359375, 0.042072296142578125, 0.05838775634765625, 0.07470321655273438, 0.0910186767578125, 0.10733413696289062, 0.12364959716796875, 0.13996505737304688, 0.156280517578125, 0.17259597778320312, 0.18891143798828125, 0.20522689819335938, 0.2215423583984375, 0.23785781860351562, 0.25417327880859375, 0.2704887390136719, 0.28680419921875, 0.3031196594238281, 0.31943511962890625, 0.3357505798339844, 0.3520660400390625, 0.3683815002441406, 0.38469696044921875, 0.4010124206542969, 0.417327880859375, 0.4336433410644531, 0.44995880126953125, 0.4662742614746094, 0.4825897216796875, 0.4989051818847656, 0.5152206420898438, 0.5315361022949219, 0.5478515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 5.0, 10.0, 8.0, 18.0, 22.0, 24.0, 28.0, 40.0, 56.0, 64.0, 63.0, 98.0, 84.0, 92.0, 72.0, 60.0, 56.0, 49.0, 26.0, 26.0, 23.0, 18.0, 13.0, 3.0, 11.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4537162780761719, -0.43795013427734375, -0.4221839904785156, -0.4064178466796875, -0.3906517028808594, -0.37488555908203125, -0.3591194152832031, -0.343353271484375, -0.3275871276855469, -0.31182098388671875, -0.2960548400878906, -0.2802886962890625, -0.2645225524902344, -0.24875640869140625, -0.23299026489257812, -0.21722412109375, -0.20145797729492188, -0.18569183349609375, -0.16992568969726562, -0.1541595458984375, -0.13839340209960938, -0.12262725830078125, -0.10686111450195312, -0.091094970703125, -0.07532882690429688, -0.05956268310546875, -0.043796539306640625, -0.0280303955078125, -0.012264251708984375, 0.00350189208984375, 0.019268035888671875, 0.0350341796875, 0.050800323486328125, 0.06656646728515625, 0.08233261108398438, 0.0980987548828125, 0.11386489868164062, 0.12963104248046875, 0.14539718627929688, 0.161163330078125, 0.17692947387695312, 0.19269561767578125, 0.20846176147460938, 0.2242279052734375, 0.23999404907226562, 0.25576019287109375, 0.2715263366699219, 0.28729248046875, 0.3030586242675781, 0.31882476806640625, 0.3345909118652344, 0.3503570556640625, 0.3661231994628906, 0.38188934326171875, 0.3976554870605469, 0.413421630859375, 0.4291877746582031, 0.44495391845703125, 0.4607200622558594, 0.4764862060546875, 0.4922523498535156, 0.5080184936523438, 0.5237846374511719, 0.53955078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 20.0, 18.0, 32.0, 73.0, 119.0, 271.0, 574.0, 1520.0, 4497.0, 22546.0, 899880.0, 105017.0, 9657.0, 2537.0, 930.0, 398.0, 200.0, 102.0, 63.0, 34.0, 23.0, 9.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15123748779296875, -0.1459808349609375, -0.14072418212890625, -0.135467529296875, -0.13021087646484375, -0.1249542236328125, -0.11969757080078125, -0.11444091796875, -0.10918426513671875, -0.1039276123046875, -0.09867095947265625, -0.093414306640625, -0.08815765380859375, -0.0829010009765625, -0.07764434814453125, -0.0723876953125, -0.06713104248046875, -0.0618743896484375, -0.05661773681640625, -0.051361083984375, -0.04610443115234375, -0.0408477783203125, -0.03559112548828125, -0.03033447265625, -0.02507781982421875, -0.0198211669921875, -0.01456451416015625, -0.009307861328125, -0.00405120849609375, 0.0012054443359375, 0.00646209716796875, 0.01171875, 0.01697540283203125, 0.0222320556640625, 0.02748870849609375, 0.032745361328125, 0.03800201416015625, 0.0432586669921875, 0.04851531982421875, 0.05377197265625, 0.05902862548828125, 0.0642852783203125, 0.06954193115234375, 0.074798583984375, 0.08005523681640625, 0.0853118896484375, 0.09056854248046875, 0.0958251953125, 0.10108184814453125, 0.1063385009765625, 0.11159515380859375, 0.116851806640625, 0.12210845947265625, 0.1273651123046875, 0.13262176513671875, 0.13787841796875, 0.14313507080078125, 0.1483917236328125, 0.15364837646484375, 0.158905029296875, 0.16416168212890625, 0.1694183349609375, 0.17467498779296875, 0.179931640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 15.0, 18.0, 21.0, 25.0, 32.0, 53.0, 107.0, 129.0, 153.0, 120.0, 88.0, 58.0, 41.0, 28.0, 23.0, 15.0, 12.0, 12.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68952751159668e-05, -3.550667315721512e-05, -3.411807119846344e-05, -3.272946923971176e-05, -3.134086728096008e-05, -2.9952265322208405e-05, -2.8563663363456726e-05, -2.7175061404705048e-05, -2.578645944595337e-05, -2.439785748720169e-05, -2.3009255528450012e-05, -2.1620653569698334e-05, -2.0232051610946655e-05, -1.8843449652194977e-05, -1.74548476934433e-05, -1.606624573469162e-05, -1.4677643775939941e-05, -1.3289041817188263e-05, -1.1900439858436584e-05, -1.0511837899684906e-05, -9.123235940933228e-06, -7.734633982181549e-06, -6.346032023429871e-06, -4.957430064678192e-06, -3.5688281059265137e-06, -2.180226147174835e-06, -7.916241884231567e-07, 5.969777703285217e-07, 1.9855797290802e-06, 3.3741816878318787e-06, 4.762783646583557e-06, 6.151385605335236e-06, 7.539987564086914e-06, 8.928589522838593e-06, 1.0317191481590271e-05, 1.170579344034195e-05, 1.3094395399093628e-05, 1.4482997357845306e-05, 1.5871599316596985e-05, 1.7260201275348663e-05, 1.8648803234100342e-05, 2.003740519285202e-05, 2.14260071516037e-05, 2.2814609110355377e-05, 2.4203211069107056e-05, 2.5591813027858734e-05, 2.6980414986610413e-05, 2.836901694536209e-05, 2.975761890411377e-05, 3.114622086286545e-05, 3.2534822821617126e-05, 3.3923424780368805e-05, 3.5312026739120483e-05, 3.670062869787216e-05, 3.808923065662384e-05, 3.947783261537552e-05, 4.08664345741272e-05, 4.2255036532878876e-05, 4.3643638491630554e-05, 4.503224045038223e-05, 4.642084240913391e-05, 4.780944436788559e-05, 4.919804632663727e-05, 5.0586648285388947e-05, 5.1975250244140625e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 10.0, 5.0, 12.0, 16.0, 22.0, 29.0, 49.0, 82.0, 155.0, 315.0, 659.0, 1737.0, 6466.0, 56793.0, 931168.0, 42566.0, 5593.0, 1601.0, 616.0, 245.0, 137.0, 95.0, 68.0, 27.0, 27.0, 13.0, 11.0, 5.0, 5.0, 9.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14697265625, -0.14229965209960938, -0.13762664794921875, -0.13295364379882812, -0.1282806396484375, -0.12360763549804688, -0.11893463134765625, -0.11426162719726562, -0.109588623046875, -0.10491561889648438, -0.10024261474609375, -0.09556961059570312, -0.0908966064453125, -0.08622360229492188, -0.08155059814453125, -0.07687759399414062, -0.07220458984375, -0.06753158569335938, -0.06285858154296875, -0.058185577392578125, -0.0535125732421875, -0.048839569091796875, -0.04416656494140625, -0.039493560791015625, -0.034820556640625, -0.030147552490234375, -0.02547454833984375, -0.020801544189453125, -0.0161285400390625, -0.011455535888671875, -0.00678253173828125, -0.002109527587890625, 0.0025634765625, 0.007236480712890625, 0.01190948486328125, 0.016582489013671875, 0.0212554931640625, 0.025928497314453125, 0.03060150146484375, 0.035274505615234375, 0.039947509765625, 0.044620513916015625, 0.04929351806640625, 0.053966522216796875, 0.0586395263671875, 0.06331253051757812, 0.06798553466796875, 0.07265853881835938, 0.07733154296875, 0.08200454711914062, 0.08667755126953125, 0.09135055541992188, 0.0960235595703125, 0.10069656372070312, 0.10536956787109375, 0.11004257202148438, 0.114715576171875, 0.11938858032226562, 0.12406158447265625, 0.12873458862304688, 0.1334075927734375, 0.13808059692382812, 0.14275360107421875, 0.14742660522460938, 0.152099609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 12.0, 7.0, 19.0, 16.0, 38.0, 42.0, 73.0, 115.0, 153.0, 159.0, 106.0, 67.0, 52.0, 29.0, 24.0, 24.0, 12.0, 7.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10614013671875, -0.10260581970214844, -0.09907150268554688, -0.09553718566894531, -0.09200286865234375, -0.08846855163574219, -0.08493423461914062, -0.08139991760253906, -0.0778656005859375, -0.07433128356933594, -0.07079696655273438, -0.06726264953613281, -0.06372833251953125, -0.06019401550292969, -0.056659698486328125, -0.05312538146972656, -0.049591064453125, -0.04605674743652344, -0.042522430419921875, -0.03898811340332031, -0.03545379638671875, -0.03191947937011719, -0.028385162353515625, -0.024850845336914062, -0.0213165283203125, -0.017782211303710938, -0.014247894287109375, -0.010713577270507812, -0.00717926025390625, -0.0036449432373046875, -0.000110626220703125, 0.0034236907958984375, 0.0069580078125, 0.010492324829101562, 0.014026641845703125, 0.017560958862304688, 0.02109527587890625, 0.024629592895507812, 0.028163909912109375, 0.03169822692871094, 0.0352325439453125, 0.03876686096191406, 0.042301177978515625, 0.04583549499511719, 0.04936981201171875, 0.05290412902832031, 0.056438446044921875, 0.05997276306152344, 0.063507080078125, 0.06704139709472656, 0.07057571411132812, 0.07411003112792969, 0.07764434814453125, 0.08117866516113281, 0.08471298217773438, 0.08824729919433594, 0.0917816162109375, 0.09531593322753906, 0.09885025024414062, 0.10238456726074219, 0.10591888427734375, 0.10945320129394531, 0.11298751831054688, 0.11652183532714844, 0.12005615234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 22.0, 50.0, 140.0, 549.0, 165.0, 45.0, 20.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.825005531311035, -6.671842575073242, -6.518679141998291, -6.365516185760498, -6.212352752685547, -6.059189796447754, -5.906026363372803, -5.75286340713501, -5.599699974060059, -5.446537017822266, -5.2933735847473145, -5.1402106285095215, -4.98704719543457, -4.833884239196777, -4.680720806121826, -4.527557849884033, -4.374394416809082, -4.221231460571289, -4.068068027496338, -3.914904832839966, -3.7617416381835938, -3.6085784435272217, -3.4554152488708496, -3.3022522926330566, -3.1490893363952637, -2.9959261417388916, -2.8427629470825195, -2.6895997524261475, -2.5364365577697754, -2.3832733631134033, -2.2301101684570312, -2.0769472122192383, -1.923783540725708, -1.770620346069336, -1.6174571514129639, -1.4642939567565918, -1.3111307621002197, -1.1579675674438477, -1.0048044919967651, -0.8516412973403931, -0.698478102684021, -0.5453149080276489, -0.39215174317359924, -0.23898857831954956, -0.08582538366317749, 0.06733781099319458, 0.22050094604492188, 0.37366414070129395, 0.526827335357666, 0.6799905300140381, 0.8331537246704102, 0.9863168597221375, 1.1394801139831543, 1.2926433086395264, 1.4458063840866089, 1.598969578742981, 1.752132773399353, 1.905295968055725, 2.0584590435028076, 2.2116222381591797, 2.3647854328155518, 2.517948627471924, 2.671111822128296, 2.824275016784668, 2.97743821144104]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 11.0, 9.0, 16.0, 17.0, 17.0, 24.0, 27.0, 31.0, 24.0, 40.0, 33.0, 49.0, 117.0, 214.0, 64.0, 28.0, 31.0, 25.0, 30.0, 27.0, 21.0, 18.0, 15.0, 15.0, 13.0, 9.0, 16.0, 8.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.399120330810547, -2.3268136978149414, -2.254506826400757, -2.1821999549865723, -2.109893321990967, -2.0375866889953613, -1.9652798175811768, -1.8929730653762817, -1.8206663131713867, -1.7483595609664917, -1.6760528087615967, -1.6037460565567017, -1.5314393043518066, -1.4591325521469116, -1.3868257999420166, -1.3145190477371216, -1.2422122955322266, -1.1699055433273315, -1.0975987911224365, -1.0252920389175415, -0.9529852867126465, -0.8806785345077515, -0.8083717823028564, -0.7360650300979614, -0.6637582778930664, -0.5914515256881714, -0.5191447734832764, -0.44683802127838135, -0.37453126907348633, -0.3022245168685913, -0.2299177646636963, -0.15761101245880127, -0.08530449867248535, -0.012997746467590332, 0.05930900573730469, 0.1316157579421997, 0.20392251014709473, 0.27622926235198975, 0.34853601455688477, 0.4208427667617798, 0.4931495189666748, 0.5654562711715698, 0.6377630233764648, 0.7100697755813599, 0.7823765277862549, 0.8546832799911499, 0.9269900321960449, 0.9992967844009399, 1.071603536605835, 1.14391028881073, 1.216217041015625, 1.28852379322052, 1.360830545425415, 1.43313729763031, 1.505444049835205, 1.5777508020401, 1.6500575542449951, 1.7223643064498901, 1.7946710586547852, 1.8669778108596802, 1.9392845630645752, 2.0115914344787598, 2.0838980674743652, 2.1562047004699707, 2.2285115718841553]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 6.0, 4.0, 17.0, 12.0, 26.0, 40.0, 53.0, 59.0, 82.0, 130.0, 180.0, 257.0, 413.0, 627.0, 996.0, 1722.0, 2918.0, 5516.0, 12986.0, 38604.0, 170862.0, 963096.0, 2280599.0, 555697.0, 108445.0, 29483.0, 10265.0, 4664.0, 2480.0, 1413.0, 919.0, 551.0, 337.0, 255.0, 173.0, 111.0, 87.0, 48.0, 40.0, 25.0, 29.0, 17.0, 8.0, 9.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0904541015625, -0.08726310729980469, -0.08407211303710938, -0.08088111877441406, -0.07769012451171875, -0.07449913024902344, -0.07130813598632812, -0.06811714172363281, -0.0649261474609375, -0.06173515319824219, -0.058544158935546875, -0.05535316467285156, -0.05216217041015625, -0.04897117614746094, -0.045780181884765625, -0.04258918762207031, -0.039398193359375, -0.03620719909667969, -0.033016204833984375, -0.029825210571289062, -0.02663421630859375, -0.023443222045898438, -0.020252227783203125, -0.017061233520507812, -0.0138702392578125, -0.010679244995117188, -0.007488250732421875, -0.0042972564697265625, -0.00110626220703125, 0.0020847320556640625, 0.005275726318359375, 0.008466720581054688, 0.01165771484375, 0.014848709106445312, 0.018039703369140625, 0.021230697631835938, 0.02442169189453125, 0.027612686157226562, 0.030803680419921875, 0.03399467468261719, 0.0371856689453125, 0.04037666320800781, 0.043567657470703125, 0.04675865173339844, 0.04994964599609375, 0.05314064025878906, 0.056331634521484375, 0.05952262878417969, 0.062713623046875, 0.06590461730957031, 0.06909561157226562, 0.07228660583496094, 0.07547760009765625, 0.07866859436035156, 0.08185958862304688, 0.08505058288574219, 0.0882415771484375, 0.09143257141113281, 0.09462356567382812, 0.09781455993652344, 0.10100555419921875, 0.10419654846191406, 0.10738754272460938, 0.11057853698730469, 0.11376953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 11.0, 4.0, 9.0, 8.0, 10.0, 15.0, 24.0, 26.0, 32.0, 41.0, 30.0, 60.0, 57.0, 53.0, 51.0, 67.0, 69.0, 69.0, 61.0, 38.0, 48.0, 39.0, 32.0, 20.0, 27.0, 17.0, 15.0, 14.0, 8.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08648681640625, -0.0839090347290039, -0.08133125305175781, -0.07875347137451172, -0.07617568969726562, -0.07359790802001953, -0.07102012634277344, -0.06844234466552734, -0.06586456298828125, -0.06328678131103516, -0.06070899963378906, -0.05813121795654297, -0.055553436279296875, -0.05297565460205078, -0.05039787292480469, -0.047820091247558594, -0.0452423095703125, -0.042664527893066406, -0.04008674621582031, -0.03750896453857422, -0.034931182861328125, -0.03235340118408203, -0.029775619506835938, -0.027197837829589844, -0.02462005615234375, -0.022042274475097656, -0.019464492797851562, -0.01688671112060547, -0.014308929443359375, -0.011731147766113281, -0.009153366088867188, -0.006575584411621094, -0.003997802734375, -0.0014200210571289062, 0.0011577606201171875, 0.0037355422973632812, 0.006313323974609375, 0.008891105651855469, 0.011468887329101562, 0.014046669006347656, 0.01662445068359375, 0.019202232360839844, 0.021780014038085938, 0.02435779571533203, 0.026935577392578125, 0.02951335906982422, 0.03209114074707031, 0.034668922424316406, 0.0372467041015625, 0.039824485778808594, 0.04240226745605469, 0.04498004913330078, 0.047557830810546875, 0.05013561248779297, 0.05271339416503906, 0.055291175842285156, 0.05786895751953125, 0.060446739196777344, 0.06302452087402344, 0.06560230255126953, 0.06818008422851562, 0.07075786590576172, 0.07333564758300781, 0.0759134292602539, 0.0784912109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 10.0, 6.0, 10.0, 13.0, 28.0, 42.0, 61.0, 96.0, 229.0, 587.0, 2466.0, 3820410.0, 367379.0, 1961.0, 483.0, 222.0, 110.0, 71.0, 31.0, 23.0, 15.0, 9.0, 11.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.264129638671875, -1.22454833984375, -1.184967041015625, -1.1453857421875, -1.105804443359375, -1.06622314453125, -1.026641845703125, -0.987060546875, -0.947479248046875, -0.90789794921875, -0.868316650390625, -0.8287353515625, -0.789154052734375, -0.74957275390625, -0.709991455078125, -0.67041015625, -0.630828857421875, -0.59124755859375, -0.551666259765625, -0.5120849609375, -0.472503662109375, -0.43292236328125, -0.393341064453125, -0.353759765625, -0.314178466796875, -0.27459716796875, -0.235015869140625, -0.1954345703125, -0.155853271484375, -0.11627197265625, -0.076690673828125, -0.037109375, 0.002471923828125, 0.04205322265625, 0.081634521484375, 0.1212158203125, 0.160797119140625, 0.20037841796875, 0.239959716796875, 0.279541015625, 0.319122314453125, 0.35870361328125, 0.398284912109375, 0.4378662109375, 0.477447509765625, 0.51702880859375, 0.556610107421875, 0.59619140625, 0.635772705078125, 0.67535400390625, 0.714935302734375, 0.7545166015625, 0.794097900390625, 0.83367919921875, 0.873260498046875, 0.912841796875, 0.952423095703125, 0.99200439453125, 1.031585693359375, 1.0711669921875, 1.110748291015625, 1.15032958984375, 1.189910888671875, 1.2294921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 33.0, 109.0, 433.0, 2218.0, 968.0, 226.0, 64.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.001953125, -0.973114013671875, -0.94427490234375, -0.915435791015625, -0.8865966796875, -0.857757568359375, -0.82891845703125, -0.800079345703125, -0.771240234375, -0.742401123046875, -0.71356201171875, -0.684722900390625, -0.6558837890625, -0.627044677734375, -0.59820556640625, -0.569366455078125, -0.54052734375, -0.511688232421875, -0.48284912109375, -0.454010009765625, -0.4251708984375, -0.396331787109375, -0.36749267578125, -0.338653564453125, -0.309814453125, -0.280975341796875, -0.25213623046875, -0.223297119140625, -0.1944580078125, -0.165618896484375, -0.13677978515625, -0.107940673828125, -0.0791015625, -0.050262451171875, -0.02142333984375, 0.007415771484375, 0.0362548828125, 0.065093994140625, 0.09393310546875, 0.122772216796875, 0.151611328125, 0.180450439453125, 0.20928955078125, 0.238128662109375, 0.2669677734375, 0.295806884765625, 0.32464599609375, 0.353485107421875, 0.38232421875, 0.411163330078125, 0.44000244140625, 0.468841552734375, 0.4976806640625, 0.526519775390625, 0.55535888671875, 0.584197998046875, 0.613037109375, 0.641876220703125, 0.67071533203125, 0.699554443359375, 0.7283935546875, 0.757232666015625, 0.78607177734375, 0.814910888671875, 0.84375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 8.0, 8.0, 25.0, 20.0, 36.0, 78.0, 134.0, 206.0, 182.0, 122.0, 71.0, 39.0, 19.0, 8.0, 11.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.041259765625, -3.939580202102661, -3.837900400161743, -3.7362208366394043, -3.6345412731170654, -3.5328617095947266, -3.4311819076538086, -3.3295023441314697, -3.227822780609131, -3.126143217086792, -3.024463415145874, -2.922783851623535, -2.8211042881011963, -2.7194247245788574, -2.6177449226379395, -2.5160653591156006, -2.4143855571746826, -2.3127059936523438, -2.211026191711426, -2.109346628189087, -2.007667064666748, -1.9059873819351196, -1.8043076992034912, -1.7026281356811523, -1.600948452949524, -1.4992687702178955, -1.3975892066955566, -1.2959095239639282, -1.1942298412322998, -1.092550277709961, -0.9908705949783325, -0.8891909718513489, -0.7875111103057861, -0.6858314871788025, -0.5841518640518188, -0.48247218132019043, -0.3807925581932068, -0.27911293506622314, -0.17743325233459473, -0.07575362920761108, 0.02592599391937256, 0.1276056319475174, 0.22928526997566223, 0.33096492290496826, 0.4326445460319519, 0.5343241691589355, 0.636003851890564, 0.7376834750175476, 0.8393630981445312, 0.9410427212715149, 1.0427223443984985, 1.144402027130127, 1.2460815906524658, 1.3477612733840942, 1.4494409561157227, 1.5511205196380615, 1.65280020236969, 1.7544798851013184, 1.8561594486236572, 1.9578391313552856, 2.059518814086914, 2.161198377609253, 2.262877941131592, 2.3645577430725098, 2.4662373065948486]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 8.0, 9.0, 11.0, 33.0, 33.0, 37.0, 50.0, 63.0, 56.0, 79.0, 91.0, 94.0, 70.0, 49.0, 46.0, 38.0, 53.0, 34.0, 30.0, 19.0, 20.0, 13.0, 16.0, 12.0, 9.0, 9.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.935934066772461, -1.8644180297851562, -1.792901873588562, -1.7213858366012573, -1.649869680404663, -1.5783536434173584, -1.5068376064300537, -1.435321569442749, -1.3638054132461548, -1.29228937625885, -1.2207732200622559, -1.1492571830749512, -1.0777411460876465, -1.0062249898910522, -0.9347089529037476, -0.8631928563117981, -0.7916767597198486, -0.7201606631278992, -0.6486445665359497, -0.577128529548645, -0.5056124329566956, -0.4340963363647461, -0.362580269575119, -0.29106420278549194, -0.21954810619354248, -0.1480320245027542, -0.07651594281196594, -0.004999861121177673, 0.0665162205696106, 0.13803231716156006, 0.20954838395118713, 0.2810644507408142, 0.35258054733276367, 0.42409664392471313, 0.4956127107143402, 0.5671287775039673, 0.6386448740959167, 0.7101609706878662, 0.7816770076751709, 0.8531931042671204, 0.9247092008590698, 0.9962252974510193, 1.0677413940429688, 1.1392574310302734, 1.2107734680175781, 1.2822896242141724, 1.353805661201477, 1.4253218173980713, 1.496837854385376, 1.5683538913726807, 1.639870047569275, 1.7113860845565796, 1.7829022407531738, 1.8544182777404785, 1.9259343147277832, 1.997450351715088, 2.0689663887023926, 2.1404824256896973, 2.211998462677002, 2.2835147380828857, 2.3550307750701904, 2.426546812057495, 2.4980628490448, 2.5695788860321045, 2.6410951614379883]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 14.0, 11.0, 23.0, 46.0, 64.0, 115.0, 193.0, 415.0, 893.0, 2108.0, 6254.0, 25017.0, 202503.0, 745525.0, 49359.0, 10341.0, 3252.0, 1233.0, 558.0, 275.0, 142.0, 93.0, 38.0, 28.0, 14.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26259803771972656, -0.2546882629394531, -0.2467784881591797, -0.23886871337890625, -0.2309589385986328, -0.22304916381835938, -0.21513938903808594, -0.2072296142578125, -0.19931983947753906, -0.19141006469726562, -0.1835002899169922, -0.17559051513671875, -0.1676807403564453, -0.15977096557617188, -0.15186119079589844, -0.143951416015625, -0.13604164123535156, -0.12813186645507812, -0.12022209167480469, -0.11231231689453125, -0.10440254211425781, -0.09649276733398438, -0.08858299255371094, -0.0806732177734375, -0.07276344299316406, -0.06485366821289062, -0.05694389343261719, -0.04903411865234375, -0.04112434387207031, -0.033214569091796875, -0.025304794311523438, -0.01739501953125, -0.009485244750976562, -0.001575469970703125, 0.0063343048095703125, 0.01424407958984375, 0.022153854370117188, 0.030063629150390625, 0.03797340393066406, 0.0458831787109375, 0.05379295349121094, 0.061702728271484375, 0.06961250305175781, 0.07752227783203125, 0.08543205261230469, 0.09334182739257812, 0.10125160217285156, 0.109161376953125, 0.11707115173339844, 0.12498092651367188, 0.1328907012939453, 0.14080047607421875, 0.1487102508544922, 0.15662002563476562, 0.16452980041503906, 0.1724395751953125, 0.18034934997558594, 0.18825912475585938, 0.1961688995361328, 0.20407867431640625, 0.2119884490966797, 0.21989822387695312, 0.22780799865722656, 0.2357177734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 11.0, 9.0, 17.0, 26.0, 24.0, 31.0, 22.0, 50.0, 61.0, 53.0, 67.0, 63.0, 75.0, 78.0, 47.0, 44.0, 54.0, 52.0, 31.0, 37.0, 37.0, 20.0, 14.0, 15.0, 6.0, 14.0, 3.0, 8.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1383056640625, -0.1346292495727539, -0.1309528350830078, -0.12727642059326172, -0.12360000610351562, -0.11992359161376953, -0.11624717712402344, -0.11257076263427734, -0.10889434814453125, -0.10521793365478516, -0.10154151916503906, -0.09786510467529297, -0.09418869018554688, -0.09051227569580078, -0.08683586120605469, -0.0831594467163086, -0.0794830322265625, -0.0758066177368164, -0.07213020324707031, -0.06845378875732422, -0.06477737426757812, -0.06110095977783203, -0.05742454528808594, -0.053748130798339844, -0.05007171630859375, -0.046395301818847656, -0.04271888732910156, -0.03904247283935547, -0.035366058349609375, -0.03168964385986328, -0.028013229370117188, -0.024336814880371094, -0.020660400390625, -0.016983985900878906, -0.013307571411132812, -0.009631156921386719, -0.005954742431640625, -0.0022783279418945312, 0.0013980865478515625, 0.005074501037597656, 0.00875091552734375, 0.012427330017089844, 0.016103744506835938, 0.01978015899658203, 0.023456573486328125, 0.02713298797607422, 0.030809402465820312, 0.034485816955566406, 0.0381622314453125, 0.041838645935058594, 0.04551506042480469, 0.04919147491455078, 0.052867889404296875, 0.05654430389404297, 0.06022071838378906, 0.06389713287353516, 0.06757354736328125, 0.07124996185302734, 0.07492637634277344, 0.07860279083251953, 0.08227920532226562, 0.08595561981201172, 0.08963203430175781, 0.0933084487915039, 0.09698486328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 4.0, 4.0, 9.0, 11.0, 33.0, 31.0, 27.0, 51.0, 86.0, 142.0, 326.0, 699.0, 2285.0, 11775.0, 837331.0, 183672.0, 8813.0, 1902.0, 602.0, 294.0, 145.0, 93.0, 61.0, 32.0, 31.0, 23.0, 16.0, 9.0, 7.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.28577423095703125, -0.2751617431640625, -0.26454925537109375, -0.253936767578125, -0.24332427978515625, -0.2327117919921875, -0.22209930419921875, -0.21148681640625, -0.20087432861328125, -0.1902618408203125, -0.17964935302734375, -0.169036865234375, -0.15842437744140625, -0.1478118896484375, -0.13719940185546875, -0.1265869140625, -0.11597442626953125, -0.1053619384765625, -0.09474945068359375, -0.084136962890625, -0.07352447509765625, -0.0629119873046875, -0.05229949951171875, -0.04168701171875, -0.03107452392578125, -0.0204620361328125, -0.00984954833984375, 0.000762939453125, 0.01137542724609375, 0.0219879150390625, 0.03260040283203125, 0.043212890625, 0.05382537841796875, 0.0644378662109375, 0.07505035400390625, 0.085662841796875, 0.09627532958984375, 0.1068878173828125, 0.11750030517578125, 0.12811279296875, 0.13872528076171875, 0.1493377685546875, 0.15995025634765625, 0.170562744140625, 0.18117523193359375, 0.1917877197265625, 0.20240020751953125, 0.2130126953125, 0.22362518310546875, 0.2342376708984375, 0.24485015869140625, 0.255462646484375, 0.26607513427734375, 0.2766876220703125, 0.28730010986328125, 0.29791259765625, 0.30852508544921875, 0.3191375732421875, 0.32975006103515625, 0.340362548828125, 0.35097503662109375, 0.3615875244140625, 0.37220001220703125, 0.3828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 5.0, 4.0, 6.0, 5.0, 12.0, 9.0, 15.0, 20.0, 24.0, 25.0, 33.0, 34.0, 61.0, 67.0, 89.0, 91.0, 73.0, 84.0, 57.0, 57.0, 33.0, 35.0, 27.0, 24.0, 21.0, 15.0, 11.0, 10.0, 13.0, 8.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.413818359375, -0.40030670166015625, -0.3867950439453125, -0.37328338623046875, -0.359771728515625, -0.34626007080078125, -0.3327484130859375, -0.31923675537109375, -0.30572509765625, -0.29221343994140625, -0.2787017822265625, -0.26519012451171875, -0.251678466796875, -0.23816680908203125, -0.2246551513671875, -0.21114349365234375, -0.1976318359375, -0.18412017822265625, -0.1706085205078125, -0.15709686279296875, -0.143585205078125, -0.13007354736328125, -0.1165618896484375, -0.10305023193359375, -0.08953857421875, -0.07602691650390625, -0.0625152587890625, -0.04900360107421875, -0.035491943359375, -0.02198028564453125, -0.0084686279296875, 0.00504302978515625, 0.0185546875, 0.03206634521484375, 0.0455780029296875, 0.05908966064453125, 0.072601318359375, 0.08611297607421875, 0.0996246337890625, 0.11313629150390625, 0.12664794921875, 0.14015960693359375, 0.1536712646484375, 0.16718292236328125, 0.180694580078125, 0.19420623779296875, 0.2077178955078125, 0.22122955322265625, 0.2347412109375, 0.24825286865234375, 0.2617645263671875, 0.27527618408203125, 0.288787841796875, 0.30229949951171875, 0.3158111572265625, 0.32932281494140625, 0.34283447265625, 0.35634613037109375, 0.3698577880859375, 0.38336944580078125, 0.396881103515625, 0.41039276123046875, 0.4239044189453125, 0.43741607666015625, 0.450927734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 1.0, 3.0, 7.0, 5.0, 4.0, 9.0, 8.0, 18.0, 17.0, 25.0, 46.0, 52.0, 86.0, 170.0, 341.0, 802.0, 2879.0, 23319.0, 995646.0, 20802.0, 2728.0, 802.0, 343.0, 180.0, 97.0, 53.0, 35.0, 25.0, 17.0, 15.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06268310546875, -0.059622764587402344, -0.05656242370605469, -0.05350208282470703, -0.050441741943359375, -0.04738140106201172, -0.04432106018066406, -0.041260719299316406, -0.03820037841796875, -0.035140037536621094, -0.03207969665527344, -0.02901935577392578, -0.025959014892578125, -0.02289867401123047, -0.019838333129882812, -0.016777992248535156, -0.0137176513671875, -0.010657310485839844, -0.0075969696044921875, -0.004536628723144531, -0.001476287841796875, 0.0015840530395507812, 0.0046443939208984375, 0.007704734802246094, 0.01076507568359375, 0.013825416564941406, 0.016885757446289062, 0.01994609832763672, 0.023006439208984375, 0.02606678009033203, 0.029127120971679688, 0.032187461853027344, 0.035247802734375, 0.038308143615722656, 0.04136848449707031, 0.04442882537841797, 0.047489166259765625, 0.05054950714111328, 0.05360984802246094, 0.056670188903808594, 0.05973052978515625, 0.0627908706665039, 0.06585121154785156, 0.06891155242919922, 0.07197189331054688, 0.07503223419189453, 0.07809257507324219, 0.08115291595458984, 0.0842132568359375, 0.08727359771728516, 0.09033393859863281, 0.09339427947998047, 0.09645462036132812, 0.09951496124267578, 0.10257530212402344, 0.1056356430053711, 0.10869598388671875, 0.1117563247680664, 0.11481666564941406, 0.11787700653076172, 0.12093734741210938, 0.12399768829345703, 0.1270580291748047, 0.13011837005615234, 0.1331787109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 5.0, 9.0, 6.0, 18.0, 8.0, 14.0, 14.0, 23.0, 24.0, 29.0, 36.0, 38.0, 50.0, 61.0, 49.0, 60.0, 56.0, 67.0, 61.0, 64.0, 56.0, 32.0, 33.0, 21.0, 20.0, 20.0, 14.0, 18.0, 16.0, 9.0, 12.0, 3.0, 11.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.537799835205078e-05, -1.4892779290676117e-05, -1.4407560229301453e-05, -1.3922341167926788e-05, -1.3437122106552124e-05, -1.295190304517746e-05, -1.2466683983802795e-05, -1.1981464922428131e-05, -1.1496245861053467e-05, -1.1011026799678802e-05, -1.0525807738304138e-05, -1.0040588676929474e-05, -9.55536961555481e-06, -9.070150554180145e-06, -8.584931492805481e-06, -8.099712431430817e-06, -7.614493370056152e-06, -7.129274308681488e-06, -6.644055247306824e-06, -6.1588361859321594e-06, -5.673617124557495e-06, -5.188398063182831e-06, -4.7031790018081665e-06, -4.217959940433502e-06, -3.732740879058838e-06, -3.2475218176841736e-06, -2.7623027563095093e-06, -2.277083694934845e-06, -1.7918646335601807e-06, -1.3066455721855164e-06, -8.21426510810852e-07, -3.3620744943618774e-07, 1.4901161193847656e-07, 6.342306733131409e-07, 1.1194497346878052e-06, 1.6046687960624695e-06, 2.089887857437134e-06, 2.575106918811798e-06, 3.0603259801864624e-06, 3.5455450415611267e-06, 4.030764102935791e-06, 4.515983164310455e-06, 5.00120222568512e-06, 5.486421287059784e-06, 5.971640348434448e-06, 6.4568594098091125e-06, 6.942078471183777e-06, 7.427297532558441e-06, 7.912516593933105e-06, 8.39773565530777e-06, 8.882954716682434e-06, 9.368173778057098e-06, 9.853392839431763e-06, 1.0338611900806427e-05, 1.0823830962181091e-05, 1.1309050023555756e-05, 1.179426908493042e-05, 1.2279488146305084e-05, 1.2764707207679749e-05, 1.3249926269054413e-05, 1.3735145330429077e-05, 1.4220364391803741e-05, 1.4705583453178406e-05, 1.519080251455307e-05, 1.5676021575927734e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 10.0, 15.0, 18.0, 22.0, 56.0, 85.0, 147.0, 286.0, 506.0, 1249.0, 3157.0, 11638.0, 317289.0, 696681.0, 11765.0, 3135.0, 1248.0, 587.0, 271.0, 159.0, 72.0, 48.0, 32.0, 22.0, 17.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0880126953125, -0.08563423156738281, -0.08325576782226562, -0.08087730407714844, -0.07849884033203125, -0.07612037658691406, -0.07374191284179688, -0.07136344909667969, -0.0689849853515625, -0.06660652160644531, -0.06422805786132812, -0.06184959411621094, -0.05947113037109375, -0.05709266662597656, -0.054714202880859375, -0.05233573913574219, -0.049957275390625, -0.04757881164550781, -0.045200347900390625, -0.04282188415527344, -0.04044342041015625, -0.03806495666503906, -0.035686492919921875, -0.03330802917480469, -0.0309295654296875, -0.028551101684570312, -0.026172637939453125, -0.023794174194335938, -0.02141571044921875, -0.019037246704101562, -0.016658782958984375, -0.014280319213867188, -0.01190185546875, -0.009523391723632812, -0.007144927978515625, -0.0047664642333984375, -0.00238800048828125, -9.5367431640625e-06, 0.002368927001953125, 0.0047473907470703125, 0.0071258544921875, 0.009504318237304688, 0.011882781982421875, 0.014261245727539062, 0.01663970947265625, 0.019018173217773438, 0.021396636962890625, 0.023775100708007812, 0.026153564453125, 0.028532028198242188, 0.030910491943359375, 0.03328895568847656, 0.03566741943359375, 0.03804588317871094, 0.040424346923828125, 0.04280281066894531, 0.0451812744140625, 0.04755973815917969, 0.049938201904296875, 0.05231666564941406, 0.05469512939453125, 0.05707359313964844, 0.059452056884765625, 0.06183052062988281, 0.064208984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 10.0, 22.0, 34.0, 53.0, 137.0, 425.0, 175.0, 66.0, 38.0, 15.0, 9.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1197509765625, -0.11656665802001953, -0.11338233947753906, -0.1101980209350586, -0.10701370239257812, -0.10382938385009766, -0.10064506530761719, -0.09746074676513672, -0.09427642822265625, -0.09109210968017578, -0.08790779113769531, -0.08472347259521484, -0.08153915405273438, -0.0783548355102539, -0.07517051696777344, -0.07198619842529297, -0.0688018798828125, -0.06561756134033203, -0.06243324279785156, -0.059248924255371094, -0.056064605712890625, -0.052880287170410156, -0.04969596862792969, -0.04651165008544922, -0.04332733154296875, -0.04014301300048828, -0.03695869445800781, -0.033774375915527344, -0.030590057373046875, -0.027405738830566406, -0.024221420288085938, -0.02103710174560547, -0.017852783203125, -0.014668464660644531, -0.011484146118164062, -0.008299827575683594, -0.005115509033203125, -0.0019311904907226562, 0.0012531280517578125, 0.004437446594238281, 0.00762176513671875, 0.010806083679199219, 0.013990402221679688, 0.017174720764160156, 0.020359039306640625, 0.023543357849121094, 0.026727676391601562, 0.02991199493408203, 0.0330963134765625, 0.03628063201904297, 0.03946495056152344, 0.042649269104003906, 0.045833587646484375, 0.049017906188964844, 0.05220222473144531, 0.05538654327392578, 0.05857086181640625, 0.06175518035888672, 0.06493949890136719, 0.06812381744384766, 0.07130813598632812, 0.0744924545288086, 0.07767677307128906, 0.08086109161376953, 0.08404541015625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 16.0, 32.0, 66.0, 338.0, 403.0, 63.0, 35.0, 24.0, 11.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.347710132598877, -1.2685073614120483, -1.1893044710159302, -1.1101016998291016, -1.0308988094329834, -0.9516960382461548, -0.8724932670593262, -0.7932904362678528, -0.7140876054763794, -0.634884774684906, -0.5556819438934326, -0.476479172706604, -0.3972763419151306, -0.3180735111236572, -0.23887071013450623, -0.15966790914535522, -0.08046507835388184, -0.0012622624635696411, 0.07794055342674255, 0.15714336931705475, 0.23634618520736694, 0.31554901599884033, 0.39475181698799133, 0.47395461797714233, 0.5531574487686157, 0.6323602795600891, 0.7115631103515625, 0.7907658815383911, 0.8699687123298645, 0.9491715431213379, 1.0283743143081665, 1.1075770854949951, 1.1867802143096924, 1.265982985496521, 1.3451858758926392, 1.4243886470794678, 1.503591537475586, 1.5827943086624146, 1.6619970798492432, 1.7411999702453613, 1.82040274143219, 1.8996055126190186, 1.9788084030151367, 2.058011293411255, 2.137213945388794, 2.216416835784912, 2.2956197261810303, 2.3748223781585693, 2.4540252685546875, 2.5332281589508057, 2.6124308109283447, 2.691633701324463, 2.770836591720581, 2.850039482116699, 2.9292421340942383, 3.0084450244903564, 3.0876479148864746, 3.1668508052825928, 3.246053457260132, 3.32525634765625, 3.404459238052368, 3.4836621284484863, 3.5628647804260254, 3.6420676708221436, 3.7212703227996826]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 10.0, 7.0, 11.0, 11.0, 18.0, 21.0, 10.0, 21.0, 25.0, 24.0, 30.0, 29.0, 245.0, 241.0, 31.0, 32.0, 45.0, 27.0, 30.0, 14.0, 13.0, 18.0, 12.0, 8.0, 12.0, 4.0, 7.0, 5.0, 11.0, 8.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3713531494140625, -1.3284969329833984, -1.2856407165527344, -1.2427845001220703, -1.1999282836914062, -1.1570720672607422, -1.1142158508300781, -1.071359634399414, -1.02850341796875, -0.9856472015380859, -0.9427909851074219, -0.8999347686767578, -0.8570785522460938, -0.8142223358154297, -0.7713661789894104, -0.7285099625587463, -0.685653805732727, -0.642797589302063, -0.5999413728713989, -0.5570851564407349, -0.5142289400100708, -0.4713727533817291, -0.42851656675338745, -0.3856603503227234, -0.3428041338920593, -0.29994791746139526, -0.2570917010307312, -0.21423551440238953, -0.17137929797172546, -0.1285230815410614, -0.08566689491271973, -0.042810678482055664, 4.553794860839844e-05, 0.042901746928691864, 0.08575795590877533, 0.1286141574382782, 0.17147037386894226, 0.21432659029960632, 0.257182776927948, 0.30003899335861206, 0.3428952097892761, 0.3857514262199402, 0.42860764265060425, 0.4714638292789459, 0.5143200159072876, 0.5571762323379517, 0.6000324487686157, 0.6428886651992798, 0.6857448816299438, 0.7286010980606079, 0.771457314491272, 0.814313530921936, 0.8571697473526001, 0.9000259637832642, 0.9428821206092834, 0.9857383370399475, 1.0285944938659668, 1.0714507102966309, 1.114306926727295, 1.157163143157959, 1.200019359588623, 1.242875576019287, 1.2857317924499512, 1.3285880088806152, 1.3714442253112793]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 8.0, 12.0, 27.0, 18.0, 47.0, 54.0, 71.0, 327.0, 171.0, 77.0, 56.0, 42.0, 28.0, 27.0, 11.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2008056640625, -0.19520187377929688, -0.18959808349609375, -0.18399429321289062, -0.1783905029296875, -0.17278671264648438, -0.16718292236328125, -0.16157913208007812, -0.155975341796875, -0.15037155151367188, -0.14476776123046875, -0.13916397094726562, -0.1335601806640625, -0.12795639038085938, -0.12235260009765625, -0.11674880981445312, -0.11114501953125, -0.10554122924804688, -0.09993743896484375, -0.09433364868164062, -0.0887298583984375, -0.08312606811523438, -0.07752227783203125, -0.07191848754882812, -0.066314697265625, -0.060710906982421875, -0.05510711669921875, -0.049503326416015625, -0.0438995361328125, -0.038295745849609375, -0.03269195556640625, -0.027088165283203125, -0.021484375, -0.015880584716796875, -0.01027679443359375, -0.004673004150390625, 0.0009307861328125, 0.006534576416015625, 0.01213836669921875, 0.017742156982421875, 0.023345947265625, 0.028949737548828125, 0.03455352783203125, 0.040157318115234375, 0.0457611083984375, 0.051364898681640625, 0.05696868896484375, 0.06257247924804688, 0.06817626953125, 0.07378005981445312, 0.07938385009765625, 0.08498764038085938, 0.0905914306640625, 0.09619522094726562, 0.10179901123046875, 0.10740280151367188, 0.113006591796875, 0.11861038208007812, 0.12421417236328125, 0.12981796264648438, 0.1354217529296875, 0.14102554321289062, 0.14662933349609375, 0.15223312377929688, 0.1578369140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 21.0, 8.0, 11.0, 20.0, 31.0, 50.0, 40.0, 55.0, 99.0, 170.0, 346.0, 634.0, 1542.0, 4928.0, 63582.0, 8304330.0, 8569.0, 2194.0, 901.0, 406.0, 205.0, 146.0, 82.0, 48.0, 57.0, 35.0, 30.0, 14.0, 12.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841816782951355, -0.8171857595443726, -0.7925547361373901, -0.7679237127304077, -0.7432927489280701, -0.7186617255210876, -0.6940307021141052, -0.6693996787071228, -0.6447687149047852, -0.6201376914978027, -0.5955066680908203, -0.5708756446838379, -0.5462446808815002, -0.5216136574745178, -0.4969826340675354, -0.472351610660553, -0.44772058725357056, -0.42308956384658813, -0.3984585702419281, -0.3738275468349457, -0.34919655323028564, -0.3245655298233032, -0.2999345064163208, -0.2753034830093384, -0.25067248940467834, -0.22604148089885712, -0.2014104723930359, -0.17677944898605347, -0.15214844048023224, -0.127517431974411, -0.10288640856742859, -0.07825540006160736, -0.05362439155578613, -0.028993379324674606, -0.00436236709356308, 0.020268648862838745, 0.04489965736865997, 0.0695306658744812, 0.09416168928146362, 0.11879269778728485, 0.14342370629310608, 0.1680547147989273, 0.19268572330474854, 0.21731674671173096, 0.24194775521755219, 0.2665787637233734, 0.29120978713035583, 0.31584078073501587, 0.3404718041419983, 0.3651028275489807, 0.38973382115364075, 0.41436484456062317, 0.4389958381652832, 0.4636268615722656, 0.48825788497924805, 0.5128889083862305, 0.5375199317932129, 0.5621509552001953, 0.5867819786071777, 0.6114130020141602, 0.6360439658164978, 0.6606749892234802, 0.6853060126304626, 0.7099370360374451, 0.7345679998397827]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 10.0, 2.0, 7.0, 1.0, 4.0, 9.0, 4.0, 6.0, 2.0, 2.0, 9.0, 4.0, 4.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.8215011954307556, -0.7937370538711548, -0.765972912311554, -0.7382087707519531, -0.7104446887969971, -0.6826804876327515, -0.6549164056777954, -0.6271522641181946, -0.5993881225585938, -0.5716239809989929, -0.5438598394393921, -0.5160956978797913, -0.4883315861225128, -0.460567444562912, -0.43280333280563354, -0.4050391912460327, -0.3772750496864319, -0.34951090812683105, -0.3217467665672302, -0.2939826548099518, -0.26621851325035095, -0.23845437169075012, -0.21069024503231049, -0.18292611837387085, -0.15516197681427002, -0.1273978352546692, -0.09963370859622955, -0.07186957448720932, -0.04410544037818909, -0.016341298818588257, 0.01142282783985138, 0.039186954498291016, 0.06695115566253662, 0.09471528977155685, 0.12247942388057709, 0.15024355053901672, 0.17800769209861755, 0.20577183365821838, 0.23353596031665802, 0.26130008697509766, 0.2890642285346985, 0.3168283700942993, 0.34459251165390015, 0.3723566234111786, 0.4001207649707794, 0.42788490653038025, 0.4556490182876587, 0.4834131598472595, 0.5111773014068604, 0.5389414429664612, 0.566705584526062, 0.5944697260856628, 0.6222338676452637, 0.6499979496002197, 0.6777620911598206, 0.7055262327194214, 0.7332903742790222, 0.761054515838623, 0.7888186573982239, 0.8165827989578247, 0.8443468809127808, 0.8721110820770264, 0.8998751640319824, 0.9276393055915833, 0.9554034471511841]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 9.0, 3.0, 6.0, 11.0, 10.0, 29.0, 38.0, 44.0, 62.0, 96.0, 123.0, 201.0, 353.0, 549.0, 996.0, 1704.0, 3678.0, 8134.0, 22030.0, 75637.0, 242926.0, 117024.0, 30139.0, 10424.0, 4325.0, 2281.0, 1221.0, 720.0, 428.0, 310.0, 205.0, 135.0, 107.0, 75.0, 50.0, 45.0, 28.0, 27.0, 23.0, 18.0, 8.0, 4.0, 5.0, 10.0, 0.0, 3.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6826171875, -0.6579360961914062, -0.6332550048828125, -0.6085739135742188, -0.583892822265625, -0.5592117309570312, -0.5345306396484375, -0.5098495483398438, -0.48516845703125, -0.46048736572265625, -0.4358062744140625, -0.41112518310546875, -0.386444091796875, -0.36176300048828125, -0.3370819091796875, -0.31240081787109375, -0.2877197265625, -0.26303863525390625, -0.2383575439453125, -0.21367645263671875, -0.188995361328125, -0.16431427001953125, -0.1396331787109375, -0.11495208740234375, -0.09027099609375, -0.06558990478515625, -0.0409088134765625, -0.01622772216796875, 0.008453369140625, 0.03313446044921875, 0.0578155517578125, 0.08249664306640625, 0.107177734375, 0.13185882568359375, 0.1565399169921875, 0.18122100830078125, 0.205902099609375, 0.23058319091796875, 0.2552642822265625, 0.27994537353515625, 0.30462646484375, 0.32930755615234375, 0.3539886474609375, 0.37866973876953125, 0.403350830078125, 0.42803192138671875, 0.4527130126953125, 0.47739410400390625, 0.5020751953125, 0.5267562866210938, 0.5514373779296875, 0.5761184692382812, 0.600799560546875, 0.6254806518554688, 0.6501617431640625, 0.6748428344726562, 0.69952392578125, 0.7242050170898438, 0.7488861083984375, 0.7735671997070312, 0.798248291015625, 0.8229293823242188, 0.8476104736328125, 0.8722915649414062, 0.89697265625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 7.0, 14.0, 19.0, 25.0, 31.0, 41.0, 50.0, 63.0, 81.0, 88.0, 81.0, 86.0, 81.0, 68.0, 52.0, 35.0, 32.0, 26.0, 25.0, 19.0, 12.0, 11.0, 8.0, 4.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13363265991210938, -0.12957000732421875, -0.12550735473632812, -0.1214447021484375, -0.11738204956054688, -0.11331939697265625, -0.10925674438476562, -0.105194091796875, -0.10113143920898438, -0.09706878662109375, -0.09300613403320312, -0.0889434814453125, -0.08488082885742188, -0.08081817626953125, -0.07675552368164062, -0.07269287109375, -0.06863021850585938, -0.06456756591796875, -0.060504913330078125, -0.0564422607421875, -0.052379608154296875, -0.04831695556640625, -0.044254302978515625, -0.040191650390625, -0.036128997802734375, -0.03206634521484375, -0.028003692626953125, -0.0239410400390625, -0.019878387451171875, -0.01581573486328125, -0.011753082275390625, -0.0076904296875, -0.003627777099609375, 0.00043487548828125, 0.004497528076171875, 0.0085601806640625, 0.012622833251953125, 0.01668548583984375, 0.020748138427734375, 0.024810791015625, 0.028873443603515625, 0.03293609619140625, 0.036998748779296875, 0.0410614013671875, 0.045124053955078125, 0.04918670654296875, 0.053249359130859375, 0.05731201171875, 0.061374664306640625, 0.06543731689453125, 0.06949996948242188, 0.0735626220703125, 0.07762527465820312, 0.08168792724609375, 0.08575057983398438, 0.089813232421875, 0.09387588500976562, 0.09793853759765625, 0.10200119018554688, 0.1060638427734375, 0.11012649536132812, 0.11418914794921875, 0.11825180053710938, 0.122314453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 13.0, 10.0, 29.0, 38.0, 48.0, 74.0, 62.0, 62.0, 41.0, 28.0, 16.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8406106233596802, -0.8140976428985596, -0.7875846028327942, -0.7610716223716736, -0.7345585823059082, -0.7080456018447876, -0.681532621383667, -0.6550195813179016, -0.628506600856781, -0.6019936203956604, -0.575480580329895, -0.5489675998687744, -0.522454559803009, -0.4959415793418884, -0.46942856907844543, -0.44291555881500244, -0.41640254855155945, -0.38988953828811646, -0.36337652802467346, -0.33686351776123047, -0.31035053730010986, -0.28383752703666687, -0.2573245167732239, -0.23081152141094208, -0.20429851114749908, -0.1777855008840561, -0.1512725055217743, -0.1247594952583313, -0.0982464924454689, -0.0717334896326065, -0.04522047936916351, -0.018707484006881714, 0.007805526256561279, 0.034318529069423676, 0.06083153560757637, 0.08734454214572906, 0.11385754495859146, 0.14037054777145386, 0.16688355803489685, 0.19339655339717865, 0.21990956366062164, 0.24642257392406464, 0.27293556928634644, 0.29944857954978943, 0.3259615898132324, 0.352474570274353, 0.3789876103401184, 0.405500590801239, 0.432013601064682, 0.458526611328125, 0.485039621591568, 0.511552631855011, 0.5380656123161316, 0.564578652381897, 0.5910916328430176, 0.6176046133041382, 0.6441176533699036, 0.6706306338310242, 0.6971436738967896, 0.7236566543579102, 0.7501696944236755, 0.7766826748847961, 0.8031957149505615, 0.8297086954116821, 0.8562216758728027]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 8.0, 14.0, 34.0, 61.0, 92.0, 98.0, 53.0, 42.0, 14.0, 9.0, 8.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6522510051727295, -0.6285818815231323, -0.6049128174781799, -0.5812436938285828, -0.5575746297836304, -0.5339055061340332, -0.510236382484436, -0.48656731843948364, -0.46289822459220886, -0.4392291307449341, -0.4155600368976593, -0.3918909430503845, -0.36822181940078735, -0.34455275535583496, -0.3208836317062378, -0.297214537858963, -0.27354544401168823, -0.24987635016441345, -0.22620725631713867, -0.2025381475687027, -0.17886905372142792, -0.15519995987415314, -0.13153085112571716, -0.10786175727844238, -0.0841926634311676, -0.060523565858602524, -0.036854468286037445, -0.013185366988182068, 0.010483726859092712, 0.03415282070636749, 0.05782192945480347, 0.08149102330207825, 0.10516011714935303, 0.1288292109966278, 0.1524983048439026, 0.17616741359233856, 0.19983650743961334, 0.22350560128688812, 0.2471747100353241, 0.2708438038825989, 0.29451289772987366, 0.31818199157714844, 0.3418510854244232, 0.365520179271698, 0.38918930292129517, 0.41285836696624756, 0.4365274906158447, 0.4601965844631195, 0.4838656783103943, 0.5075348019599915, 0.5312038660049438, 0.554872989654541, 0.5785420536994934, 0.6022111773490906, 0.625880241394043, 0.6495493650436401, 0.6732184886932373, 0.6968876123428345, 0.7205566763877869, 0.744225800037384, 0.7678948640823364, 0.7915639877319336, 0.8152331113815308, 0.8389021754264832, 0.8625712394714355]}, "train/train_runtime": 5180.8925, "train/train_samples_per_second": 5.508, "train/train_steps_per_second": 0.086, "train/total_flos": 0.0, "train/train_loss": 4.375692403904526, "eval/loss": 4.211044788360596, "eval/wer": 2.02631892106307, "eval/runtime": 1133.2799, "eval/samples_per_second": 2.331, "eval/steps_per_second": 0.292} \ No newline at end of file +{"train/loss": 4.3145, "train/learning_rate": 8.860000000000002e-06, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6620, "_timestamp": 1646065893, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 10.0, 27.0, 95.0, 154.0, 264.0, 230.0, 141.0, 62.0, 23.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.178123474121094, -22.747371673583984, -21.316619873046875, -19.885866165161133, -18.455114364624023, -17.024362564086914, -15.593609809875488, -14.162857055664062, -12.732105255126953, -11.301353454589844, -9.870600700378418, -8.439847946166992, -7.009096145629883, -5.578343868255615, -4.147591590881348, -2.716838836669922, -1.2860870361328125, 0.14466524124145508, 1.5754175186157227, 3.0061697959899902, 4.436922073364258, 5.867674350738525, 7.298426628112793, 8.729179382324219, 10.159931182861328, 11.590682983398438, 13.021435737609863, 14.452188491821289, 15.882940292358398, 17.313692092895508, 18.74444580078125, 20.17519760131836, 21.60594940185547, 23.036701202392578, 24.467453002929688, 25.89820671081543, 27.32895851135254, 28.75971031188965, 30.19046401977539, 31.6212158203125, 33.05196762084961, 34.48271942138672, 35.91347122192383, 37.34422302246094, 38.77497863769531, 40.20573043823242, 41.63648223876953, 43.06723403930664, 44.49798583984375, 45.92873764038086, 47.35948944091797, 48.79024124145508, 50.22099304199219, 51.65174865722656, 53.08250045776367, 54.51325225830078, 55.94400405883789, 57.374755859375, 58.80550765991211, 60.23625946044922, 61.667015075683594, 63.0977668762207, 64.52851867675781, 65.95927429199219, 67.39002227783203]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 11.0, 9.0, 15.0, 9.0, 9.0, 15.0, 24.0, 25.0, 24.0, 23.0, 30.0, 33.0, 34.0, 32.0, 38.0, 43.0, 44.0, 45.0, 47.0, 46.0, 42.0, 28.0, 37.0, 36.0, 36.0, 41.0, 22.0, 29.0, 35.0, 17.0, 22.0, 13.0, 11.0, 8.0, 15.0, 13.0, 9.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.37661361694336, -28.406328201293945, -27.4360408782959, -26.465755462646484, -25.495468139648438, -24.525182723999023, -23.55489730834961, -22.584609985351562, -21.61432456970215, -20.644039154052734, -19.673751831054688, -18.703466415405273, -17.733179092407227, -16.762893676757812, -15.792607307434082, -14.822320938110352, -13.852034568786621, -12.88174819946289, -11.91146183013916, -10.94117546081543, -9.970890045166016, -9.000603675842285, -8.030317306518555, -7.060031414031982, -6.089745044708252, -5.1194586753845215, -4.149172782897949, -3.1788864135742188, -2.2086002826690674, -1.238314151763916, -0.26802778244018555, 0.7022581100463867, 1.6725444793701172, 2.6428306102752686, 3.61311674118042, 4.58340311050415, 5.553689002990723, 6.523975372314453, 7.494261741638184, 8.464548110961914, 9.434833526611328, 10.405119895935059, 11.375406265258789, 12.345691680908203, 13.315978050231934, 14.286264419555664, 15.256550788879395, 16.226837158203125, 17.197124481201172, 18.167409896850586, 19.137697219848633, 20.107982635498047, 21.078269958496094, 22.048555374145508, 23.018840789794922, 23.98912811279297, 24.959413528442383, 25.929698944091797, 26.899986267089844, 27.870271682739258, 28.840559005737305, 29.81084442138672, 30.781131744384766, 31.75141716003418, 32.721702575683594]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 4.0, 9.0, 12.0, 10.0, 13.0, 14.0, 17.0, 11.0, 19.0, 31.0, 29.0, 29.0, 22.0, 29.0, 39.0, 46.0, 42.0, 38.0, 38.0, 37.0, 37.0, 39.0, 36.0, 41.0, 42.0, 46.0, 37.0, 34.0, 30.0, 27.0, 22.0, 20.0, 13.0, 18.0, 17.0, 10.0, 8.0, 5.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.94140625, -1.8817291259765625, -1.822052001953125, -1.7623748779296875, -1.70269775390625, -1.6430206298828125, -1.583343505859375, -1.5236663818359375, -1.4639892578125, -1.4043121337890625, -1.344635009765625, -1.2849578857421875, -1.22528076171875, -1.1656036376953125, -1.105926513671875, -1.0462493896484375, -0.986572265625, -0.9268951416015625, -0.867218017578125, -0.8075408935546875, -0.74786376953125, -0.6881866455078125, -0.628509521484375, -0.5688323974609375, -0.5091552734375, -0.4494781494140625, -0.389801025390625, -0.3301239013671875, -0.27044677734375, -0.2107696533203125, -0.151092529296875, -0.0914154052734375, -0.03173828125, 0.0279388427734375, 0.087615966796875, 0.1472930908203125, 0.20697021484375, 0.2666473388671875, 0.326324462890625, 0.3860015869140625, 0.4456787109375, 0.5053558349609375, 0.565032958984375, 0.6247100830078125, 0.68438720703125, 0.7440643310546875, 0.803741455078125, 0.8634185791015625, 0.923095703125, 0.9827728271484375, 1.042449951171875, 1.1021270751953125, 1.16180419921875, 1.2214813232421875, 1.281158447265625, 1.3408355712890625, 1.4005126953125, 1.4601898193359375, 1.519866943359375, 1.5795440673828125, 1.63922119140625, 1.6988983154296875, 1.758575439453125, 1.8182525634765625, 1.8779296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 13.0, 2.0, 18.0, 18.0, 21.0, 22.0, 39.0, 57.0, 112.0, 150.0, 185.0, 247.0, 378.0, 716.0, 1142.0, 2033.0, 3863.0, 9314.0, 30312.0, 185619.0, 1951480.0, 1788085.0, 174110.0, 28857.0, 8971.0, 3909.0, 1823.0, 1020.0, 612.0, 397.0, 256.0, 174.0, 100.0, 83.0, 48.0, 25.0, 24.0, 19.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8994140625, -5.708984375, -5.5185546875, -5.328125, -5.1376953125, -4.947265625, -4.7568359375, -4.56640625, -4.3759765625, -4.185546875, -3.9951171875, -3.8046875, -3.6142578125, -3.423828125, -3.2333984375, -3.04296875, -2.8525390625, -2.662109375, -2.4716796875, -2.28125, -2.0908203125, -1.900390625, -1.7099609375, -1.51953125, -1.3291015625, -1.138671875, -0.9482421875, -0.7578125, -0.5673828125, -0.376953125, -0.1865234375, 0.00390625, 0.1943359375, 0.384765625, 0.5751953125, 0.765625, 0.9560546875, 1.146484375, 1.3369140625, 1.52734375, 1.7177734375, 1.908203125, 2.0986328125, 2.2890625, 2.4794921875, 2.669921875, 2.8603515625, 3.05078125, 3.2412109375, 3.431640625, 3.6220703125, 3.8125, 4.0029296875, 4.193359375, 4.3837890625, 4.57421875, 4.7646484375, 4.955078125, 5.1455078125, 5.3359375, 5.5263671875, 5.716796875, 5.9072265625, 6.09765625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 12.0, 16.0, 54.0, 104.0, 267.0, 681.0, 1383.0, 907.0, 362.0, 150.0, 66.0, 31.0, 22.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.614990234375, -18.02685546875, -17.438720703125, -16.8505859375, -16.262451171875, -15.67431640625, -15.086181640625, -14.498046875, -13.909912109375, -13.32177734375, -12.733642578125, -12.1455078125, -11.557373046875, -10.96923828125, -10.381103515625, -9.79296875, -9.204833984375, -8.61669921875, -8.028564453125, -7.4404296875, -6.852294921875, -6.26416015625, -5.676025390625, -5.087890625, -4.499755859375, -3.91162109375, -3.323486328125, -2.7353515625, -2.147216796875, -1.55908203125, -0.970947265625, -0.3828125, 0.205322265625, 0.79345703125, 1.381591796875, 1.9697265625, 2.557861328125, 3.14599609375, 3.734130859375, 4.322265625, 4.910400390625, 5.49853515625, 6.086669921875, 6.6748046875, 7.262939453125, 7.85107421875, 8.439208984375, 9.02734375, 9.615478515625, 10.20361328125, 10.791748046875, 11.3798828125, 11.968017578125, 12.55615234375, 13.144287109375, 13.732421875, 14.320556640625, 14.90869140625, 15.496826171875, 16.0849609375, 16.673095703125, 17.26123046875, 17.849365234375, 18.4375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 2.0, 8.0, 26.0, 24.0, 58.0, 124.0, 257.0, 712.0, 2667.0, 79438.0, 4099747.0, 8932.0, 1416.0, 465.0, 193.0, 99.0, 46.0, 22.0, 11.0, 5.0, 7.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-53.03125, -51.43798828125, -49.8447265625, -48.25146484375, -46.658203125, -45.06494140625, -43.4716796875, -41.87841796875, -40.28515625, -38.69189453125, -37.0986328125, -35.50537109375, -33.912109375, -32.31884765625, -30.7255859375, -29.13232421875, -27.5390625, -25.94580078125, -24.3525390625, -22.75927734375, -21.166015625, -19.57275390625, -17.9794921875, -16.38623046875, -14.79296875, -13.19970703125, -11.6064453125, -10.01318359375, -8.419921875, -6.82666015625, -5.2333984375, -3.64013671875, -2.046875, -0.45361328125, 1.1396484375, 2.73291015625, 4.326171875, 5.91943359375, 7.5126953125, 9.10595703125, 10.69921875, 12.29248046875, 13.8857421875, 15.47900390625, 17.072265625, 18.66552734375, 20.2587890625, 21.85205078125, 23.4453125, 25.03857421875, 26.6318359375, 28.22509765625, 29.818359375, 31.41162109375, 33.0048828125, 34.59814453125, 36.19140625, 37.78466796875, 39.3779296875, 40.97119140625, 42.564453125, 44.15771484375, 45.7509765625, 47.34423828125, 48.9375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 84.0, 295.0, 382.0, 197.0, 40.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.72069549560547, -42.622344970703125, -40.523990631103516, -38.425636291503906, -36.32728576660156, -34.22893524169922, -32.13058090209961, -30.032228469848633, -27.933876037597656, -25.83552360534668, -23.737171173095703, -21.638818740844727, -19.54046630859375, -17.442113876342773, -15.343761444091797, -13.24540901184082, -11.147056579589844, -9.048704147338867, -6.950351715087891, -4.851999282836914, -2.7536468505859375, -0.6552944183349609, 1.4430580139160156, 3.541410446166992, 5.639762878417969, 7.738115310668945, 9.836467742919922, 11.934820175170898, 14.033172607421875, 16.13152503967285, 18.229877471923828, 20.328229904174805, 22.42657470703125, 24.524927139282227, 26.623279571533203, 28.72163200378418, 30.819984436035156, 32.9183349609375, 35.01668930053711, 37.11504364013672, 39.21339416503906, 41.311744689941406, 43.410099029541016, 45.508453369140625, 47.60680389404297, 49.70515441894531, 51.80350875854492, 53.90186309814453, 56.000213623046875, 58.09856414794922, 60.19691848754883, 62.29527282714844, 64.39362335205078, 66.49197387695312, 68.59033203125, 70.68868255615234, 72.78703308105469, 74.88538360595703, 76.98373413085938, 79.08209228515625, 81.1804428100586, 83.27879333496094, 85.37715148925781, 87.47550201416016, 89.5738525390625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 9.0, 9.0, 11.0, 10.0, 15.0, 18.0, 15.0, 21.0, 20.0, 28.0, 29.0, 38.0, 32.0, 45.0, 43.0, 37.0, 45.0, 42.0, 36.0, 42.0, 41.0, 44.0, 45.0, 37.0, 36.0, 26.0, 29.0, 35.0, 27.0, 26.0, 15.0, 14.0, 17.0, 12.0, 12.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-26.552268981933594, -25.800241470336914, -25.048215866088867, -24.296188354492188, -23.54416275024414, -22.79213523864746, -22.040109634399414, -21.288082122802734, -20.536056518554688, -19.784029006958008, -19.03200340270996, -18.27997589111328, -17.527950286865234, -16.775922775268555, -16.023897171020508, -15.271869659423828, -14.519843101501465, -13.767816543579102, -13.015789985656738, -12.263763427734375, -11.511736869812012, -10.759710311889648, -10.007682800292969, -9.255657196044922, -8.503629684448242, -7.751603126525879, -6.999576568603516, -6.247550010681152, -5.495523452758789, -4.743496894836426, -3.9914698600769043, -3.239443302154541, -2.487417221069336, -1.7353906631469727, -0.9833639860153198, -0.231337308883667, 0.5206892490386963, 1.2727158069610596, 2.024742603302002, 2.7767691612243652, 3.5287957191467285, 4.280822277069092, 5.032848834991455, 5.784875869750977, 6.53690242767334, 7.288928985595703, 8.040955543518066, 8.79298210144043, 9.545008659362793, 10.297035217285156, 11.04906177520752, 11.801088333129883, 12.553114891052246, 13.30514144897461, 14.057168960571289, 14.809194564819336, 15.561222076416016, 16.313249588012695, 17.065275192260742, 17.817302703857422, 18.56932830810547, 19.32135581970215, 20.073381423950195, 20.825408935546875, 21.577434539794922]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 12.0, 10.0, 16.0, 21.0, 11.0, 21.0, 34.0, 28.0, 24.0, 34.0, 39.0, 27.0, 36.0, 42.0, 36.0, 37.0, 40.0, 38.0, 46.0, 35.0, 32.0, 34.0, 35.0, 38.0, 24.0, 36.0, 21.0, 21.0, 29.0, 15.0, 15.0, 17.0, 13.0, 8.0, 3.0, 8.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-2.05859375, -1.99981689453125, -1.9410400390625, -1.88226318359375, -1.823486328125, -1.76470947265625, -1.7059326171875, -1.64715576171875, -1.58837890625, -1.52960205078125, -1.4708251953125, -1.41204833984375, -1.353271484375, -1.29449462890625, -1.2357177734375, -1.17694091796875, -1.1181640625, -1.05938720703125, -1.0006103515625, -0.94183349609375, -0.883056640625, -0.82427978515625, -0.7655029296875, -0.70672607421875, -0.64794921875, -0.58917236328125, -0.5303955078125, -0.47161865234375, -0.412841796875, -0.35406494140625, -0.2952880859375, -0.23651123046875, -0.177734375, -0.11895751953125, -0.0601806640625, -0.00140380859375, 0.057373046875, 0.11614990234375, 0.1749267578125, 0.23370361328125, 0.29248046875, 0.35125732421875, 0.4100341796875, 0.46881103515625, 0.527587890625, 0.58636474609375, 0.6451416015625, 0.70391845703125, 0.7626953125, 0.82147216796875, 0.8802490234375, 0.93902587890625, 0.997802734375, 1.05657958984375, 1.1153564453125, 1.17413330078125, 1.23291015625, 1.29168701171875, 1.3504638671875, 1.40924072265625, 1.468017578125, 1.52679443359375, 1.5855712890625, 1.64434814453125, 1.703125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 6.0, 14.0, 32.0, 34.0, 46.0, 94.0, 122.0, 174.0, 280.0, 417.0, 624.0, 912.0, 1427.0, 2162.0, 3216.0, 4891.0, 7381.0, 11625.0, 17769.0, 27845.0, 44022.0, 72039.0, 130516.0, 315714.0, 173819.0, 87581.0, 52980.0, 32995.0, 20735.0, 13597.0, 8827.0, 5644.0, 3731.0, 2473.0, 1619.0, 1094.0, 682.0, 459.0, 315.0, 222.0, 161.0, 87.0, 46.0, 47.0, 22.0, 19.0, 16.0, 13.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.41828155517578125, -0.4041900634765625, -0.39009857177734375, -0.376007080078125, -0.36191558837890625, -0.3478240966796875, -0.33373260498046875, -0.31964111328125, -0.30554962158203125, -0.2914581298828125, -0.27736663818359375, -0.263275146484375, -0.24918365478515625, -0.2350921630859375, -0.22100067138671875, -0.2069091796875, -0.19281768798828125, -0.1787261962890625, -0.16463470458984375, -0.150543212890625, -0.13645172119140625, -0.1223602294921875, -0.10826873779296875, -0.09417724609375, -0.08008575439453125, -0.0659942626953125, -0.05190277099609375, -0.037811279296875, -0.02371978759765625, -0.0096282958984375, 0.00446319580078125, 0.0185546875, 0.03264617919921875, 0.0467376708984375, 0.06082916259765625, 0.074920654296875, 0.08901214599609375, 0.1031036376953125, 0.11719512939453125, 0.13128662109375, 0.14537811279296875, 0.1594696044921875, 0.17356109619140625, 0.187652587890625, 0.20174407958984375, 0.2158355712890625, 0.22992706298828125, 0.2440185546875, 0.25811004638671875, 0.2722015380859375, 0.28629302978515625, 0.300384521484375, 0.31447601318359375, 0.3285675048828125, 0.34265899658203125, 0.35675048828125, 0.37084197998046875, 0.3849334716796875, 0.39902496337890625, 0.413116455078125, 0.42720794677734375, 0.4412994384765625, 0.45539093017578125, 0.469482421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 10.0, 8.0, 9.0, 7.0, 6.0, 17.0, 11.0, 13.0, 7.0, 21.0, 33.0, 27.0, 17.0, 31.0, 29.0, 37.0, 34.0, 32.0, 41.0, 30.0, 39.0, 30.0, 1053.0, 40.0, 41.0, 37.0, 27.0, 31.0, 38.0, 30.0, 26.0, 23.0, 23.0, 29.0, 22.0, 19.0, 16.0, 10.0, 14.0, 9.0, 10.0, 7.0, 13.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0], "bins": [-1.341796875, -1.3057785034179688, -1.2697601318359375, -1.2337417602539062, -1.197723388671875, -1.1617050170898438, -1.1256866455078125, -1.0896682739257812, -1.05364990234375, -1.0176315307617188, -0.9816131591796875, -0.9455947875976562, -0.909576416015625, -0.8735580444335938, -0.8375396728515625, -0.8015213012695312, -0.7655029296875, -0.7294845581054688, -0.6934661865234375, -0.6574478149414062, -0.621429443359375, -0.5854110717773438, -0.5493927001953125, -0.5133743286132812, -0.47735595703125, -0.44133758544921875, -0.4053192138671875, -0.36930084228515625, -0.333282470703125, -0.29726409912109375, -0.2612457275390625, -0.22522735595703125, -0.189208984375, -0.15319061279296875, -0.1171722412109375, -0.08115386962890625, -0.045135498046875, -0.00911712646484375, 0.0269012451171875, 0.06291961669921875, 0.09893798828125, 0.13495635986328125, 0.1709747314453125, 0.20699310302734375, 0.243011474609375, 0.27902984619140625, 0.3150482177734375, 0.35106658935546875, 0.3870849609375, 0.42310333251953125, 0.4591217041015625, 0.49514007568359375, 0.531158447265625, 0.5671768188476562, 0.6031951904296875, 0.6392135620117188, 0.67523193359375, 0.7112503051757812, 0.7472686767578125, 0.7832870483398438, 0.819305419921875, 0.8553237915039062, 0.8913421630859375, 0.9273605346679688, 0.96337890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 12.0, 23.0, 36.0, 46.0, 78.0, 154.0, 179.0, 267.0, 500.0, 668.0, 1040.0, 1735.0, 2635.0, 4244.0, 6796.0, 11103.0, 18051.0, 30982.0, 53147.0, 94262.0, 200786.0, 1379612.0, 124792.0, 67575.0, 38802.0, 22883.0, 14101.0, 8459.0, 5185.0, 3302.0, 2114.0, 1308.0, 775.0, 516.0, 302.0, 201.0, 148.0, 93.0, 66.0, 37.0, 31.0, 32.0, 13.0, 9.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.41304779052734375, -0.3978729248046875, -0.38269805908203125, -0.367523193359375, -0.35234832763671875, -0.3371734619140625, -0.32199859619140625, -0.30682373046875, -0.29164886474609375, -0.2764739990234375, -0.26129913330078125, -0.246124267578125, -0.23094940185546875, -0.2157745361328125, -0.20059967041015625, -0.1854248046875, -0.17024993896484375, -0.1550750732421875, -0.13990020751953125, -0.124725341796875, -0.10955047607421875, -0.0943756103515625, -0.07920074462890625, -0.06402587890625, -0.04885101318359375, -0.0336761474609375, -0.01850128173828125, -0.003326416015625, 0.01184844970703125, 0.0270233154296875, 0.04219818115234375, 0.057373046875, 0.07254791259765625, 0.0877227783203125, 0.10289764404296875, 0.118072509765625, 0.13324737548828125, 0.1484222412109375, 0.16359710693359375, 0.17877197265625, 0.19394683837890625, 0.2091217041015625, 0.22429656982421875, 0.239471435546875, 0.25464630126953125, 0.2698211669921875, 0.28499603271484375, 0.3001708984375, 0.31534576416015625, 0.3305206298828125, 0.34569549560546875, 0.360870361328125, 0.37604522705078125, 0.3912200927734375, 0.40639495849609375, 0.42156982421875, 0.43674468994140625, 0.4519195556640625, 0.46709442138671875, 0.482269287109375, 0.49744415283203125, 0.5126190185546875, 0.5277938842773438, 0.54296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 4.0, 12.0, 11.0, 13.0, 18.0, 29.0, 42.0, 46.0, 59.0, 75.0, 97.0, 127.0, 113.0, 88.0, 61.0, 50.0, 32.0, 26.0, 22.0, 12.0, 7.0, 10.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.000385284423828125, -0.0003730654716491699, -0.00036084651947021484, -0.00034862756729125977, -0.0003364086151123047, -0.0003241896629333496, -0.00031197071075439453, -0.00029975175857543945, -0.0002875328063964844, -0.0002753138542175293, -0.0002630949020385742, -0.00025087594985961914, -0.00023865699768066406, -0.00022643804550170898, -0.0002142190933227539, -0.00020200014114379883, -0.00018978118896484375, -0.00017756223678588867, -0.0001653432846069336, -0.00015312433242797852, -0.00014090538024902344, -0.00012868642807006836, -0.00011646747589111328, -0.0001042485237121582, -9.202957153320312e-05, -7.981061935424805e-05, -6.759166717529297e-05, -5.537271499633789e-05, -4.315376281738281e-05, -3.0934810638427734e-05, -1.8715858459472656e-05, -6.496906280517578e-06, 5.7220458984375e-06, 1.7940998077392578e-05, 3.0159950256347656e-05, 4.2378902435302734e-05, 5.459785461425781e-05, 6.681680679321289e-05, 7.903575897216797e-05, 9.125471115112305e-05, 0.00010347366333007812, 0.0001156926155090332, 0.00012791156768798828, 0.00014013051986694336, 0.00015234947204589844, 0.00016456842422485352, 0.0001767873764038086, 0.00018900632858276367, 0.00020122528076171875, 0.00021344423294067383, 0.0002256631851196289, 0.00023788213729858398, 0.00025010108947753906, 0.00026232004165649414, 0.0002745389938354492, 0.0002867579460144043, 0.0002989768981933594, 0.00031119585037231445, 0.00032341480255126953, 0.0003356337547302246, 0.0003478527069091797, 0.00036007165908813477, 0.00037229061126708984, 0.0003845095634460449, 0.000396728515625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 3.0, 6.0, 8.0, 10.0, 6.0, 14.0, 24.0, 12.0, 27.0, 32.0, 69.0, 76.0, 135.0, 165.0, 274.0, 439.0, 843.0, 61082.0, 982778.0, 1088.0, 519.0, 291.0, 172.0, 136.0, 86.0, 69.0, 45.0, 25.0, 19.0, 14.0, 13.0, 9.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 5.0, 1.0, 4.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006679534912109375, -0.006464958190917969, -0.0062503814697265625, -0.006035804748535156, -0.00582122802734375, -0.005606651306152344, -0.0053920745849609375, -0.005177497863769531, -0.004962921142578125, -0.004748344421386719, -0.0045337677001953125, -0.004319190979003906, -0.0041046142578125, -0.0038900375366210938, -0.0036754608154296875, -0.0034608840942382812, -0.003246307373046875, -0.0030317306518554688, -0.0028171539306640625, -0.0026025772094726562, -0.00238800048828125, -0.0021734237670898438, -0.0019588470458984375, -0.0017442703247070312, -0.001529693603515625, -0.0013151168823242188, -0.0011005401611328125, -0.0008859634399414062, -0.00067138671875, -0.00045680999755859375, -0.0002422332763671875, -2.765655517578125e-05, 0.000186920166015625, 0.00040149688720703125, 0.0006160736083984375, 0.0008306503295898438, 0.00104522705078125, 0.0012598037719726562, 0.0014743804931640625, 0.0016889572143554688, 0.001903533935546875, 0.0021181106567382812, 0.0023326873779296875, 0.0025472640991210938, 0.0027618408203125, 0.0029764175415039062, 0.0031909942626953125, 0.0034055709838867188, 0.003620147705078125, 0.0038347244262695312, 0.0040493011474609375, 0.004263877868652344, 0.00447845458984375, 0.004693031311035156, 0.0049076080322265625, 0.005122184753417969, 0.005336761474609375, 0.005551338195800781, 0.0057659149169921875, 0.005980491638183594, 0.006195068359375, 0.006409645080566406, 0.0066242218017578125, 0.006838798522949219, 0.007053375244140625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 41.0, 165.0, 369.0, 324.0, 81.0, 23.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012935695121996105, -0.00011844108666991815, -0.00010752522211987525, -9.660935029387474e-05, -8.569348574383184e-05, -7.477762119378895e-05, -6.386174936778843e-05, -5.2945884817745537e-05, -4.203002026770264e-05, -3.111415571765974e-05, -2.0198287529638037e-05, -9.282419341616333e-06, 1.633445208426565e-06, 1.2549309758469462e-05, 2.3465181584469974e-05, 3.438104613451287e-05, 4.529691068455577e-05, 5.6212775234598666e-05, 6.712863978464156e-05, 7.804451161064208e-05, 8.896037616068497e-05, 9.987624071072787e-05, 0.00011079211253672838, 0.00012170797708677128, 0.00013262384163681418, 0.0001435397134628147, 0.00015445557073689997, 0.00016537144256290048, 0.000176287314388901, 0.00018720317166298628, 0.0001981190434889868, 0.0002090349153149873, 0.00021995074348524213, 0.00023086661531124264, 0.00024178247258532792, 0.00025269834441132843, 0.0002636142016854137, 0.00027453008806332946, 0.00028544594533741474, 0.0002963618026115, 0.0003072776598855853, 0.0003181935171596706, 0.00032910940353758633, 0.0003400252608116716, 0.0003509411180857569, 0.00036185700446367264, 0.0003727728617377579, 0.0003836887190118432, 0.00039460460538975894, 0.00040552046266384423, 0.00041643634904175997, 0.00042735220631584525, 0.00043826806358993053, 0.0004491839208640158, 0.00046009980724193156, 0.00047101566451601684, 0.0004819315508939326, 0.0004928474081680179, 0.0005037632654421031, 0.0005146791227161884, 0.0005255950381979346, 0.0005365108954720199, 0.0005474267527461052, 0.0005583426100201905, 0.0005692584672942758]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 11.0, 7.0, 14.0, 22.0, 22.0, 22.0, 17.0, 22.0, 24.0, 24.0, 35.0, 43.0, 31.0, 36.0, 51.0, 53.0, 47.0, 31.0, 45.0, 28.0, 41.0, 35.0, 48.0, 29.0, 33.0, 30.0, 42.0, 21.0, 14.0, 22.0, 19.0, 21.0, 8.0, 8.0, 4.0, 6.0, 1.0, 7.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017070770263671875, -0.00016574375331401825, -0.00016077980399131775, -0.00015581585466861725, -0.00015085190534591675, -0.00014588795602321625, -0.00014092400670051575, -0.00013596005737781525, -0.00013099610805511475, -0.00012603215873241425, -0.00012106820940971375, -0.00011610426008701324, -0.00011114031076431274, -0.00010617636144161224, -0.00010121241211891174, -9.624846279621124e-05, -9.128451347351074e-05, -8.632056415081024e-05, -8.135661482810974e-05, -7.639266550540924e-05, -7.142871618270874e-05, -6.646476686000824e-05, -6.150081753730774e-05, -5.653686821460724e-05, -5.157291889190674e-05, -4.660896956920624e-05, -4.164502024650574e-05, -3.668107092380524e-05, -3.1717121601104736e-05, -2.6753172278404236e-05, -2.1789222955703735e-05, -1.6825273633003235e-05, -1.1861324310302734e-05, -6.897374987602234e-06, -1.9334256649017334e-06, 3.030523657798767e-06, 7.994472980499268e-06, 1.2958422303199768e-05, 1.792237162590027e-05, 2.288632094860077e-05, 2.785027027130127e-05, 3.281421959400177e-05, 3.777816891670227e-05, 4.274211823940277e-05, 4.770606756210327e-05, 5.267001688480377e-05, 5.763396620750427e-05, 6.259791553020477e-05, 6.756186485290527e-05, 7.252581417560577e-05, 7.748976349830627e-05, 8.245371282100677e-05, 8.741766214370728e-05, 9.238161146640778e-05, 9.734556078910828e-05, 0.00010230951011180878, 0.00010727345943450928, 0.00011223740875720978, 0.00011720135807991028, 0.00012216530740261078, 0.00012712925672531128, 0.00013209320604801178, 0.00013705715537071228, 0.00014202110469341278, 0.00014698505401611328]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 12.0, 10.0, 16.0, 21.0, 11.0, 21.0, 34.0, 28.0, 24.0, 34.0, 39.0, 27.0, 36.0, 42.0, 36.0, 37.0, 40.0, 38.0, 46.0, 35.0, 32.0, 34.0, 35.0, 38.0, 24.0, 36.0, 21.0, 21.0, 29.0, 15.0, 15.0, 17.0, 13.0, 8.0, 3.0, 8.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-2.05859375, -1.99981689453125, -1.9410400390625, -1.88226318359375, -1.823486328125, -1.76470947265625, -1.7059326171875, -1.64715576171875, -1.58837890625, -1.52960205078125, -1.4708251953125, -1.41204833984375, -1.353271484375, -1.29449462890625, -1.2357177734375, -1.17694091796875, -1.1181640625, -1.05938720703125, -1.0006103515625, -0.94183349609375, -0.883056640625, -0.82427978515625, -0.7655029296875, -0.70672607421875, -0.64794921875, -0.58917236328125, -0.5303955078125, -0.47161865234375, -0.412841796875, -0.35406494140625, -0.2952880859375, -0.23651123046875, -0.177734375, -0.11895751953125, -0.0601806640625, -0.00140380859375, 0.057373046875, 0.11614990234375, 0.1749267578125, 0.23370361328125, 0.29248046875, 0.35125732421875, 0.4100341796875, 0.46881103515625, 0.527587890625, 0.58636474609375, 0.6451416015625, 0.70391845703125, 0.7626953125, 0.82147216796875, 0.8802490234375, 0.93902587890625, 0.997802734375, 1.05657958984375, 1.1153564453125, 1.17413330078125, 1.23291015625, 1.29168701171875, 1.3504638671875, 1.40924072265625, 1.468017578125, 1.52679443359375, 1.5855712890625, 1.64434814453125, 1.703125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 12.0, 6.0, 13.0, 17.0, 18.0, 34.0, 34.0, 40.0, 76.0, 100.0, 92.0, 178.0, 203.0, 308.0, 383.0, 508.0, 779.0, 1022.0, 1590.0, 2285.0, 3571.0, 6127.0, 11608.0, 30470.0, 256039.0, 638337.0, 57605.0, 15852.0, 7805.0, 4511.0, 2798.0, 1735.0, 1229.0, 857.0, 611.0, 455.0, 309.0, 253.0, 164.0, 141.0, 87.0, 67.0, 62.0, 43.0, 29.0, 20.0, 21.0, 15.0, 12.0, 11.0, 5.0, 8.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.6038818359375, -9.285888671875, -8.9678955078125, -8.64990234375, -8.3319091796875, -8.013916015625, -7.6959228515625, -7.3779296875, -7.0599365234375, -6.741943359375, -6.4239501953125, -6.10595703125, -5.7879638671875, -5.469970703125, -5.1519775390625, -4.833984375, -4.5159912109375, -4.197998046875, -3.8800048828125, -3.56201171875, -3.2440185546875, -2.926025390625, -2.6080322265625, -2.2900390625, -1.9720458984375, -1.654052734375, -1.3360595703125, -1.01806640625, -0.7000732421875, -0.382080078125, -0.0640869140625, 0.25390625, 0.5718994140625, 0.889892578125, 1.2078857421875, 1.52587890625, 1.8438720703125, 2.161865234375, 2.4798583984375, 2.7978515625, 3.1158447265625, 3.433837890625, 3.7518310546875, 4.06982421875, 4.3878173828125, 4.705810546875, 5.0238037109375, 5.341796875, 5.6597900390625, 5.977783203125, 6.2957763671875, 6.61376953125, 6.9317626953125, 7.249755859375, 7.5677490234375, 7.8857421875, 8.2037353515625, 8.521728515625, 8.8397216796875, 9.15771484375, 9.4757080078125, 9.793701171875, 10.1116943359375, 10.4296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 4.0, 9.0, 9.0, 12.0, 9.0, 14.0, 15.0, 18.0, 18.0, 24.0, 27.0, 26.0, 27.0, 30.0, 37.0, 45.0, 69.0, 57.0, 110.0, 237.0, 1364.0, 244.0, 138.0, 73.0, 53.0, 44.0, 41.0, 43.0, 30.0, 30.0, 33.0, 24.0, 19.0, 18.0, 17.0, 14.0, 10.0, 5.0, 9.0, 8.0, 7.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.1015625, -4.93524169921875, -4.7689208984375, -4.60260009765625, -4.436279296875, -4.26995849609375, -4.1036376953125, -3.93731689453125, -3.77099609375, -3.60467529296875, -3.4383544921875, -3.27203369140625, -3.105712890625, -2.93939208984375, -2.7730712890625, -2.60675048828125, -2.4404296875, -2.27410888671875, -2.1077880859375, -1.94146728515625, -1.775146484375, -1.60882568359375, -1.4425048828125, -1.27618408203125, -1.10986328125, -0.94354248046875, -0.7772216796875, -0.61090087890625, -0.444580078125, -0.27825927734375, -0.1119384765625, 0.05438232421875, 0.220703125, 0.38702392578125, 0.5533447265625, 0.71966552734375, 0.885986328125, 1.05230712890625, 1.2186279296875, 1.38494873046875, 1.55126953125, 1.71759033203125, 1.8839111328125, 2.05023193359375, 2.216552734375, 2.38287353515625, 2.5491943359375, 2.71551513671875, 2.8818359375, 3.04815673828125, 3.2144775390625, 3.38079833984375, 3.547119140625, 3.71343994140625, 3.8797607421875, 4.04608154296875, 4.21240234375, 4.37872314453125, 4.5450439453125, 4.71136474609375, 4.877685546875, 5.04400634765625, 5.2103271484375, 5.37664794921875, 5.54296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 3.0, 4.0, 5.0, 10.0, 14.0, 14.0, 12.0, 14.0, 16.0, 14.0, 26.0, 38.0, 37.0, 47.0, 71.0, 100.0, 214.0, 483.0, 1904.0, 74589.0, 3056935.0, 9117.0, 1103.0, 364.0, 157.0, 101.0, 47.0, 46.0, 33.0, 25.0, 20.0, 23.0, 13.0, 17.0, 16.0, 10.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.40625, -23.695068359375, -22.98388671875, -22.272705078125, -21.5615234375, -20.850341796875, -20.13916015625, -19.427978515625, -18.716796875, -18.005615234375, -17.29443359375, -16.583251953125, -15.8720703125, -15.160888671875, -14.44970703125, -13.738525390625, -13.02734375, -12.316162109375, -11.60498046875, -10.893798828125, -10.1826171875, -9.471435546875, -8.76025390625, -8.049072265625, -7.337890625, -6.626708984375, -5.91552734375, -5.204345703125, -4.4931640625, -3.781982421875, -3.07080078125, -2.359619140625, -1.6484375, -0.937255859375, -0.22607421875, 0.485107421875, 1.1962890625, 1.907470703125, 2.61865234375, 3.329833984375, 4.041015625, 4.752197265625, 5.46337890625, 6.174560546875, 6.8857421875, 7.596923828125, 8.30810546875, 9.019287109375, 9.73046875, 10.441650390625, 11.15283203125, 11.864013671875, 12.5751953125, 13.286376953125, 13.99755859375, 14.708740234375, 15.419921875, 16.131103515625, 16.84228515625, 17.553466796875, 18.2646484375, 18.975830078125, 19.68701171875, 20.398193359375, 21.109375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 47.0, 963.0, 5.0, 4.0, 1.0, 1.0], "bins": [-219.2111053466797, -215.51856994628906, -211.82603454589844, -208.13348388671875, -204.44094848632812, -200.7484130859375, -197.05587768554688, -193.36334228515625, -189.67079162597656, -185.97825622558594, -182.2857208251953, -178.59317016601562, -174.900634765625, -171.20809936523438, -167.51556396484375, -163.82302856445312, -160.1304931640625, -156.43795776367188, -152.74542236328125, -149.05287170410156, -145.36033630371094, -141.6678009033203, -137.9752655029297, -134.28271484375, -130.59017944335938, -126.89764404296875, -123.2051010131836, -119.51256561279297, -115.82002258300781, -112.12748718261719, -108.43495178222656, -104.7424087524414, -101.04986572265625, -97.35733032226562, -93.66478729248047, -89.97225189208984, -86.27970886230469, -82.58717346191406, -78.89463806152344, -75.20209503173828, -71.50955200195312, -67.8170166015625, -64.12447357177734, -60.43193817138672, -56.73939514160156, -53.04685974121094, -49.35432052612305, -45.661781311035156, -41.969242095947266, -38.276702880859375, -34.584163665771484, -30.891626358032227, -27.199087142944336, -23.506547927856445, -19.814010620117188, -16.121471405029297, -12.428932189941406, -8.736392974853516, -5.043854713439941, -1.3513164520263672, 2.3412227630615234, 6.033761978149414, 9.726299285888672, 13.418838500976562, 17.111377716064453]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 3.0, 7.0, 9.0, 9.0, 14.0, 6.0, 15.0, 18.0, 19.0, 17.0, 30.0, 27.0, 32.0, 29.0, 35.0, 36.0, 40.0, 47.0, 39.0, 48.0, 32.0, 41.0, 39.0, 39.0, 51.0, 32.0, 35.0, 37.0, 28.0, 29.0, 19.0, 23.0, 21.0, 17.0, 16.0, 14.0, 14.0, 4.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.64004135131836, -20.046937942504883, -19.453834533691406, -18.860729217529297, -18.26762580871582, -17.674522399902344, -17.081418991088867, -16.48831558227539, -15.895210266113281, -15.302106857299805, -14.709002494812012, -14.115899085998535, -13.522794723510742, -12.929691314697266, -12.336587905883789, -11.743483543395996, -11.15038013458252, -10.557276725769043, -9.96417236328125, -9.371068954467773, -8.77796459197998, -8.184861183166504, -7.591757297515869, -6.998653411865234, -6.4055495262146, -5.812445640563965, -5.21934175491333, -4.626237869262695, -4.033134460449219, -3.440030336380005, -2.846926689147949, -2.2538228034973145, -1.6607189178466797, -1.067615032196045, -0.4745112657546997, 0.11859250068664551, 0.7116963863372803, 1.304800271987915, 1.8979039192199707, 2.4910078048706055, 3.0841116905212402, 3.677215576171875, 4.27031946182251, 4.8634233474731445, 5.456526756286621, 6.049631118774414, 6.642734527587891, 7.235838413238525, 7.82894229888916, 8.422045707702637, 9.01515007019043, 9.608253479003906, 10.2013578414917, 10.794461250305176, 11.387565612792969, 11.980669021606445, 12.573772430419922, 13.166875839233398, 13.759980201721191, 14.353083610534668, 14.946187973022461, 15.539291381835938, 16.132394790649414, 16.72549819946289, 17.318603515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 3.0, 7.0, 5.0, 9.0, 14.0, 13.0, 13.0, 15.0, 19.0, 16.0, 24.0, 19.0, 35.0, 28.0, 32.0, 23.0, 35.0, 47.0, 27.0, 45.0, 45.0, 42.0, 32.0, 45.0, 30.0, 38.0, 39.0, 29.0, 35.0, 27.0, 32.0, 30.0, 26.0, 16.0, 23.0, 11.0, 18.0, 16.0, 6.0, 7.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 5.0], "bins": [-2.314453125, -2.2505950927734375, -2.186737060546875, -2.1228790283203125, -2.05902099609375, -1.9951629638671875, -1.931304931640625, -1.8674468994140625, -1.8035888671875, -1.7397308349609375, -1.675872802734375, -1.6120147705078125, -1.54815673828125, -1.4842987060546875, -1.420440673828125, -1.3565826416015625, -1.292724609375, -1.2288665771484375, -1.165008544921875, -1.1011505126953125, -1.03729248046875, -0.9734344482421875, -0.909576416015625, -0.8457183837890625, -0.7818603515625, -0.7180023193359375, -0.654144287109375, -0.5902862548828125, -0.52642822265625, -0.4625701904296875, -0.398712158203125, -0.3348541259765625, -0.27099609375, -0.2071380615234375, -0.143280029296875, -0.0794219970703125, -0.01556396484375, 0.0482940673828125, 0.112152099609375, 0.1760101318359375, 0.2398681640625, 0.3037261962890625, 0.367584228515625, 0.4314422607421875, 0.49530029296875, 0.5591583251953125, 0.623016357421875, 0.6868743896484375, 0.750732421875, 0.8145904541015625, 0.878448486328125, 0.9423065185546875, 1.00616455078125, 1.0700225830078125, 1.133880615234375, 1.1977386474609375, 1.2615966796875, 1.3254547119140625, 1.389312744140625, 1.4531707763671875, 1.51702880859375, 1.5808868408203125, 1.644744873046875, 1.7086029052734375, 1.7724609375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 10.0, 15.0, 19.0, 22.0, 34.0, 42.0, 58.0, 85.0, 112.0, 166.0, 271.0, 403.0, 715.0, 1244.0, 2303.0, 4733.0, 10777.0, 29396.0, 152462.0, 2597760.0, 1273820.0, 82225.0, 20830.0, 8201.0, 3842.0, 1949.0, 1070.0, 630.0, 342.0, 229.0, 136.0, 96.0, 82.0, 44.0, 47.0, 26.0, 16.0, 14.0, 10.0, 7.0, 5.0, 2.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.140625, -9.8319091796875, -9.523193359375, -9.2144775390625, -8.90576171875, -8.5970458984375, -8.288330078125, -7.9796142578125, -7.6708984375, -7.3621826171875, -7.053466796875, -6.7447509765625, -6.43603515625, -6.1273193359375, -5.818603515625, -5.5098876953125, -5.201171875, -4.8924560546875, -4.583740234375, -4.2750244140625, -3.96630859375, -3.6575927734375, -3.348876953125, -3.0401611328125, -2.7314453125, -2.4227294921875, -2.114013671875, -1.8052978515625, -1.49658203125, -1.1878662109375, -0.879150390625, -0.5704345703125, -0.26171875, 0.0469970703125, 0.355712890625, 0.6644287109375, 0.97314453125, 1.2818603515625, 1.590576171875, 1.8992919921875, 2.2080078125, 2.5167236328125, 2.825439453125, 3.1341552734375, 3.44287109375, 3.7515869140625, 4.060302734375, 4.3690185546875, 4.677734375, 4.9864501953125, 5.295166015625, 5.6038818359375, 5.91259765625, 6.2213134765625, 6.530029296875, 6.8387451171875, 7.1474609375, 7.4561767578125, 7.764892578125, 8.0736083984375, 8.38232421875, 8.6910400390625, 8.999755859375, 9.3084716796875, 9.6171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 7.0, 21.0, 17.0, 28.0, 51.0, 66.0, 109.0, 166.0, 287.0, 453.0, 669.0, 723.0, 559.0, 346.0, 205.0, 127.0, 82.0, 47.0, 35.0, 21.0, 20.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.046875, -16.65234375, -16.2578125, -15.86328125, -15.46875, -15.07421875, -14.6796875, -14.28515625, -13.890625, -13.49609375, -13.1015625, -12.70703125, -12.3125, -11.91796875, -11.5234375, -11.12890625, -10.734375, -10.33984375, -9.9453125, -9.55078125, -9.15625, -8.76171875, -8.3671875, -7.97265625, -7.578125, -7.18359375, -6.7890625, -6.39453125, -6.0, -5.60546875, -5.2109375, -4.81640625, -4.421875, -4.02734375, -3.6328125, -3.23828125, -2.84375, -2.44921875, -2.0546875, -1.66015625, -1.265625, -0.87109375, -0.4765625, -0.08203125, 0.3125, 0.70703125, 1.1015625, 1.49609375, 1.890625, 2.28515625, 2.6796875, 3.07421875, 3.46875, 3.86328125, 4.2578125, 4.65234375, 5.046875, 5.44140625, 5.8359375, 6.23046875, 6.625, 7.01953125, 7.4140625, 7.80859375, 8.203125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 7.0, 11.0, 11.0, 18.0, 23.0, 38.0, 45.0, 71.0, 135.0, 198.0, 337.0, 767.0, 3103.0, 427449.0, 3752607.0, 7209.0, 1041.0, 448.0, 268.0, 122.0, 106.0, 72.0, 48.0, 41.0, 18.0, 21.0, 14.0, 9.0, 7.0, 10.0, 6.0, 0.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.53125, -35.27880859375, -34.0263671875, -32.77392578125, -31.521484375, -30.26904296875, -29.0166015625, -27.76416015625, -26.51171875, -25.25927734375, -24.0068359375, -22.75439453125, -21.501953125, -20.24951171875, -18.9970703125, -17.74462890625, -16.4921875, -15.23974609375, -13.9873046875, -12.73486328125, -11.482421875, -10.22998046875, -8.9775390625, -7.72509765625, -6.47265625, -5.22021484375, -3.9677734375, -2.71533203125, -1.462890625, -0.21044921875, 1.0419921875, 2.29443359375, 3.546875, 4.79931640625, 6.0517578125, 7.30419921875, 8.556640625, 9.80908203125, 11.0615234375, 12.31396484375, 13.56640625, 14.81884765625, 16.0712890625, 17.32373046875, 18.576171875, 19.82861328125, 21.0810546875, 22.33349609375, 23.5859375, 24.83837890625, 26.0908203125, 27.34326171875, 28.595703125, 29.84814453125, 31.1005859375, 32.35302734375, 33.60546875, 34.85791015625, 36.1103515625, 37.36279296875, 38.615234375, 39.86767578125, 41.1201171875, 42.37255859375, 43.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 11.0, 464.0, 523.0, 20.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.7997131347656, -285.41876220703125, -280.03778076171875, -274.6568298339844, -269.27587890625, -263.8949279785156, -258.51397705078125, -253.13299560546875, -247.75204467773438, -242.37109375, -236.99012756347656, -231.60916137695312, -226.22821044921875, -220.84725952148438, -215.46629333496094, -210.0853271484375, -204.70437622070312, -199.32342529296875, -193.9424591064453, -188.56149291992188, -183.1805419921875, -177.79959106445312, -172.4186248779297, -167.03765869140625, -161.65670776367188, -156.2757568359375, -150.89479064941406, -145.51382446289062, -140.13287353515625, -134.75192260742188, -129.37095642089844, -123.98999786376953, -118.60903930664062, -113.22808074951172, -107.84712219238281, -102.4661636352539, -97.085205078125, -91.7042465209961, -86.32328796386719, -80.94232940673828, -75.56137084960938, -70.18041229248047, -64.79945373535156, -59.418495178222656, -54.03753662109375, -48.656578063964844, -43.27561950683594, -37.89466094970703, -32.51370620727539, -27.132747650146484, -21.751789093017578, -16.370830535888672, -10.989871978759766, -5.608913421630859, -0.22795486450195312, 5.153003692626953, 10.53396224975586, 15.914920806884766, 21.295879364013672, 26.676837921142578, 32.057796478271484, 37.43875503540039, 42.8197135925293, 48.2006721496582, 53.58163070678711]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 11.0, 11.0, 9.0, 13.0, 17.0, 20.0, 27.0, 21.0, 24.0, 24.0, 35.0, 33.0, 39.0, 36.0, 37.0, 41.0, 28.0, 28.0, 40.0, 42.0, 36.0, 45.0, 31.0, 31.0, 39.0, 34.0, 33.0, 26.0, 31.0, 23.0, 23.0, 17.0, 20.0, 5.0, 20.0, 3.0, 6.0, 5.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.058658599853516, -26.214746475219727, -25.370832443237305, -24.526920318603516, -23.683006286621094, -22.839094161987305, -21.995182037353516, -21.151268005371094, -20.307353973388672, -19.463441848754883, -18.61952781677246, -17.775615692138672, -16.93170166015625, -16.08778953552246, -15.243876457214355, -14.39996337890625, -13.556051254272461, -12.712138175964355, -11.86822509765625, -11.024312973022461, -10.180398941040039, -9.33648681640625, -8.492573738098145, -7.648660659790039, -6.804747581481934, -5.960834503173828, -5.116921424865723, -4.273008823394775, -3.42909574508667, -2.5851826667785645, -1.7412700653076172, -0.8973569869995117, -0.05344200134277344, 0.7904709577560425, 1.6343839168548584, 2.4782967567443848, 3.3222098350524902, 4.166122913360596, 5.010035514831543, 5.853948593139648, 6.697861671447754, 7.541774749755859, 8.385687828063965, 9.22960090637207, 10.07351303100586, 10.917427062988281, 11.76133918762207, 12.605252265930176, 13.449165344238281, 14.293078422546387, 15.136991500854492, 15.980903625488281, 16.824817657470703, 17.668729782104492, 18.51264190673828, 19.356555938720703, 20.200469970703125, 21.044382095336914, 21.888296127319336, 22.732208251953125, 23.576122283935547, 24.420034408569336, 25.263946533203125, 26.107860565185547, 26.951772689819336]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 2.0, 4.0, 5.0, 11.0, 10.0, 5.0, 10.0, 12.0, 17.0, 17.0, 17.0, 22.0, 20.0, 24.0, 28.0, 29.0, 42.0, 34.0, 34.0, 41.0, 42.0, 34.0, 47.0, 37.0, 52.0, 34.0, 37.0, 36.0, 31.0, 28.0, 30.0, 30.0, 26.0, 25.0, 24.0, 18.0, 19.0, 13.0, 11.0, 10.0, 5.0, 8.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.24609375, -2.181304931640625, -2.11651611328125, -2.051727294921875, -1.9869384765625, -1.922149658203125, -1.85736083984375, -1.792572021484375, -1.727783203125, -1.662994384765625, -1.59820556640625, -1.533416748046875, -1.4686279296875, -1.403839111328125, -1.33905029296875, -1.274261474609375, -1.20947265625, -1.144683837890625, -1.07989501953125, -1.015106201171875, -0.9503173828125, -0.885528564453125, -0.82073974609375, -0.755950927734375, -0.691162109375, -0.626373291015625, -0.56158447265625, -0.496795654296875, -0.4320068359375, -0.367218017578125, -0.30242919921875, -0.237640380859375, -0.1728515625, -0.108062744140625, -0.04327392578125, 0.021514892578125, 0.0863037109375, 0.151092529296875, 0.21588134765625, 0.280670166015625, 0.345458984375, 0.410247802734375, 0.47503662109375, 0.539825439453125, 0.6046142578125, 0.669403076171875, 0.73419189453125, 0.798980712890625, 0.86376953125, 0.928558349609375, 0.99334716796875, 1.058135986328125, 1.1229248046875, 1.187713623046875, 1.25250244140625, 1.317291259765625, 1.382080078125, 1.446868896484375, 1.51165771484375, 1.576446533203125, 1.6412353515625, 1.706024169921875, 1.77081298828125, 1.835601806640625, 1.900390625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 3.0, 6.0, 9.0, 14.0, 13.0, 22.0, 63.0, 69.0, 102.0, 132.0, 226.0, 271.0, 447.0, 662.0, 912.0, 1372.0, 1982.0, 2945.0, 4372.0, 6579.0, 9531.0, 14358.0, 21764.0, 33290.0, 52876.0, 88529.0, 175046.0, 311703.0, 125894.0, 69565.0, 42643.0, 27583.0, 18408.0, 12008.0, 8117.0, 5503.0, 3718.0, 2518.0, 1712.0, 1150.0, 784.0, 524.0, 368.0, 236.0, 189.0, 122.0, 84.0, 42.0, 34.0, 23.0, 12.0, 17.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4677734375, -0.45281982421875, -0.4378662109375, -0.42291259765625, -0.407958984375, -0.39300537109375, -0.3780517578125, -0.36309814453125, -0.34814453125, -0.33319091796875, -0.3182373046875, -0.30328369140625, -0.288330078125, -0.27337646484375, -0.2584228515625, -0.24346923828125, -0.228515625, -0.21356201171875, -0.1986083984375, -0.18365478515625, -0.168701171875, -0.15374755859375, -0.1387939453125, -0.12384033203125, -0.10888671875, -0.09393310546875, -0.0789794921875, -0.06402587890625, -0.049072265625, -0.03411865234375, -0.0191650390625, -0.00421142578125, 0.0107421875, 0.02569580078125, 0.0406494140625, 0.05560302734375, 0.070556640625, 0.08551025390625, 0.1004638671875, 0.11541748046875, 0.13037109375, 0.14532470703125, 0.1602783203125, 0.17523193359375, 0.190185546875, 0.20513916015625, 0.2200927734375, 0.23504638671875, 0.25, 0.26495361328125, 0.2799072265625, 0.29486083984375, 0.309814453125, 0.32476806640625, 0.3397216796875, 0.35467529296875, 0.36962890625, 0.38458251953125, 0.3995361328125, 0.41448974609375, 0.429443359375, 0.44439697265625, 0.4593505859375, 0.47430419921875, 0.4892578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 6.0, 5.0, 7.0, 4.0, 8.0, 5.0, 7.0, 15.0, 22.0, 19.0, 15.0, 14.0, 16.0, 17.0, 32.0, 27.0, 39.0, 29.0, 26.0, 35.0, 42.0, 31.0, 32.0, 44.0, 1063.0, 28.0, 35.0, 28.0, 30.0, 36.0, 33.0, 36.0, 25.0, 22.0, 27.0, 28.0, 22.0, 14.0, 20.0, 10.0, 13.0, 8.0, 13.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0], "bins": [-1.2431640625, -1.206146240234375, -1.16912841796875, -1.132110595703125, -1.0950927734375, -1.058074951171875, -1.02105712890625, -0.984039306640625, -0.947021484375, -0.910003662109375, -0.87298583984375, -0.835968017578125, -0.7989501953125, -0.761932373046875, -0.72491455078125, -0.687896728515625, -0.65087890625, -0.613861083984375, -0.57684326171875, -0.539825439453125, -0.5028076171875, -0.465789794921875, -0.42877197265625, -0.391754150390625, -0.354736328125, -0.317718505859375, -0.28070068359375, -0.243682861328125, -0.2066650390625, -0.169647216796875, -0.13262939453125, -0.095611572265625, -0.05859375, -0.021575927734375, 0.01544189453125, 0.052459716796875, 0.0894775390625, 0.126495361328125, 0.16351318359375, 0.200531005859375, 0.237548828125, 0.274566650390625, 0.31158447265625, 0.348602294921875, 0.3856201171875, 0.422637939453125, 0.45965576171875, 0.496673583984375, 0.53369140625, 0.570709228515625, 0.60772705078125, 0.644744873046875, 0.6817626953125, 0.718780517578125, 0.75579833984375, 0.792816162109375, 0.829833984375, 0.866851806640625, 0.90386962890625, 0.940887451171875, 0.9779052734375, 1.014923095703125, 1.05194091796875, 1.088958740234375, 1.1259765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 6.0, 12.0, 20.0, 29.0, 30.0, 63.0, 77.0, 93.0, 147.0, 194.0, 359.0, 525.0, 789.0, 1124.0, 1755.0, 2523.0, 4083.0, 6355.0, 9453.0, 15274.0, 24430.0, 40491.0, 68891.0, 125947.0, 1382406.0, 184782.0, 90943.0, 52180.0, 31306.0, 18981.0, 11890.0, 7520.0, 4814.0, 3105.0, 2102.0, 1384.0, 919.0, 692.0, 467.0, 291.0, 204.0, 142.0, 107.0, 63.0, 44.0, 34.0, 30.0, 14.0, 14.0, 13.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.466064453125, -0.4509010314941406, -0.43573760986328125, -0.4205741882324219, -0.4054107666015625, -0.3902473449707031, -0.37508392333984375, -0.3599205017089844, -0.344757080078125, -0.3295936584472656, -0.31443023681640625, -0.2992668151855469, -0.2841033935546875, -0.2689399719238281, -0.25377655029296875, -0.23861312866210938, -0.22344970703125, -0.20828628540039062, -0.19312286376953125, -0.17795944213867188, -0.1627960205078125, -0.14763259887695312, -0.13246917724609375, -0.11730575561523438, -0.102142333984375, -0.08697891235351562, -0.07181549072265625, -0.056652069091796875, -0.0414886474609375, -0.026325225830078125, -0.01116180419921875, 0.004001617431640625, 0.0191650390625, 0.034328460693359375, 0.04949188232421875, 0.06465530395507812, 0.0798187255859375, 0.09498214721679688, 0.11014556884765625, 0.12530899047851562, 0.140472412109375, 0.15563583374023438, 0.17079925537109375, 0.18596267700195312, 0.2011260986328125, 0.21628952026367188, 0.23145294189453125, 0.24661636352539062, 0.26177978515625, 0.2769432067871094, 0.29210662841796875, 0.3072700500488281, 0.3224334716796875, 0.3375968933105469, 0.35276031494140625, 0.3679237365722656, 0.383087158203125, 0.3982505798339844, 0.41341400146484375, 0.4285774230957031, 0.4437408447265625, 0.4589042663574219, 0.47406768798828125, 0.4892311096191406, 0.50439453125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 5.0, 14.0, 21.0, 24.0, 24.0, 42.0, 63.0, 69.0, 79.0, 108.0, 99.0, 90.0, 73.0, 63.0, 57.0, 30.0, 35.0, 25.0, 17.0, 12.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005121231079101562, -0.0004980526864528656, -0.00048398226499557495, -0.0004699118435382843, -0.00045584142208099365, -0.000441771000623703, -0.00042770057916641235, -0.0004136301577091217, -0.00039955973625183105, -0.0003854893147945404, -0.00037141889333724976, -0.0003573484718799591, -0.00034327805042266846, -0.0003292076289653778, -0.00031513720750808716, -0.0003010667860507965, -0.00028699636459350586, -0.0002729259431362152, -0.00025885552167892456, -0.0002447851002216339, -0.00023071467876434326, -0.0002166442573070526, -0.00020257383584976196, -0.0001885034143924713, -0.00017443299293518066, -0.00016036257147789001, -0.00014629215002059937, -0.00013222172856330872, -0.00011815130710601807, -0.00010408088564872742, -9.001046419143677e-05, -7.594004273414612e-05, -6.186962127685547e-05, -4.779919981956482e-05, -3.372877836227417e-05, -1.965835690498352e-05, -5.587935447692871e-06, 8.482486009597778e-06, 2.2552907466888428e-05, 3.662332892417908e-05, 5.0693750381469727e-05, 6.476417183876038e-05, 7.883459329605103e-05, 9.290501475334167e-05, 0.00010697543621063232, 0.00012104585766792297, 0.00013511627912521362, 0.00014918670058250427, 0.00016325712203979492, 0.00017732754349708557, 0.00019139796495437622, 0.00020546838641166687, 0.00021953880786895752, 0.00023360922932624817, 0.0002476796507835388, 0.00026175007224082947, 0.0002758204936981201, 0.00028989091515541077, 0.0003039613366127014, 0.00031803175806999207, 0.0003321021795272827, 0.00034617260098457336, 0.000360243022441864, 0.00037431344389915466, 0.0003883838653564453]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 14.0, 18.0, 40.0, 53.0, 78.0, 107.0, 143.0, 267.0, 709.0, 249744.0, 795750.0, 751.0, 321.0, 173.0, 119.0, 64.0, 38.0, 45.0, 27.0, 18.0, 15.0, 11.0, 11.0, 5.0, 4.0, 4.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009918212890625, -0.009608626365661621, -0.009299039840698242, -0.008989453315734863, -0.008679866790771484, -0.008370280265808105, -0.008060693740844727, -0.007751107215881348, -0.007441520690917969, -0.00713193416595459, -0.006822347640991211, -0.006512761116027832, -0.006203174591064453, -0.005893588066101074, -0.005584001541137695, -0.005274415016174316, -0.0049648284912109375, -0.004655241966247559, -0.00434565544128418, -0.004036068916320801, -0.003726482391357422, -0.003416895866394043, -0.003107309341430664, -0.002797722816467285, -0.0024881362915039062, -0.0021785497665405273, -0.0018689632415771484, -0.0015593767166137695, -0.0012497901916503906, -0.0009402036666870117, -0.0006306171417236328, -0.0003210306167602539, -1.1444091796875e-05, 0.0002981424331665039, 0.0006077289581298828, 0.0009173154830932617, 0.0012269020080566406, 0.0015364885330200195, 0.0018460750579833984, 0.0021556615829467773, 0.0024652481079101562, 0.002774834632873535, 0.003084421157836914, 0.003394007682800293, 0.003703594207763672, 0.004013180732727051, 0.00432276725769043, 0.004632353782653809, 0.0049419403076171875, 0.005251526832580566, 0.005561113357543945, 0.005870699882507324, 0.006180286407470703, 0.006489872932434082, 0.006799459457397461, 0.00710904598236084, 0.007418632507324219, 0.007728219032287598, 0.008037805557250977, 0.008347392082214355, 0.008656978607177734, 0.008966565132141113, 0.009276151657104492, 0.009585738182067871, 0.00989532470703125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 22.0, 94.0, 296.0, 387.0, 170.0, 38.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006656274199485779, -0.0006498635630123317, -0.0006340997642837465, -0.0006183359073475003, -0.0006025721086189151, -0.0005868082516826689, -0.0005710444529540837, -0.0005552805960178375, -0.0005395167972892523, -0.0005237529403530061, -0.0005079891416244209, -0.0004922252846881747, -0.0004764614859595895, -0.0004606976290233433, -0.0004449338011909276, -0.0004291699733585119, -0.00041340611642226577, -0.00039764228858985007, -0.00038187846075743437, -0.00036611463292501867, -0.00035035080509260297, -0.0003345869481563568, -0.0003188231203239411, -0.0003030592924915254, -0.0002872954646591097, -0.000271531636826694, -0.0002557678089942783, -0.00024000396660994738, -0.00022424013877753168, -0.00020847631094511598, -0.00019271246856078506, -0.00017694864072836936, -0.0001611847837921232, -0.0001454209559597075, -0.0001296571281272918, -0.00011389328574296087, -9.812945791054517e-05, -8.236563007812947e-05, -6.660179496975616e-05, -5.083795986138284e-05, -3.507413202896714e-05, -1.9310300558572635e-05, -3.546469088178128e-06, 1.2217362382216379e-05, 2.7981193852610886e-05, 4.3745021685026586e-05, 5.95088567933999e-05, 7.527269190177321e-05, 9.103651973418891e-05, 0.00010680034756660461, 0.00012256417539902031, 0.00013832801778335124, 0.00015409184561576694, 0.00016985567344818264, 0.00018561951583251357, 0.00020138334366492927, 0.00021714717149734497, 0.00023291099932976067, 0.00024867482716217637, 0.00026443865499459207, 0.00028020248282700777, 0.00029596633976325393, 0.00031173016759566963, 0.00032749399542808533, 0.00034325782326050103]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 14.0, 13.0, 14.0, 23.0, 29.0, 40.0, 24.0, 32.0, 31.0, 33.0, 35.0, 41.0, 44.0, 39.0, 52.0, 47.0, 43.0, 37.0, 48.0, 42.0, 41.0, 45.0, 33.0, 24.0, 25.0, 17.0, 21.0, 19.0, 17.0, 15.0, 18.0, 6.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019800662994384766, -0.00019209552556276321, -0.00018618442118167877, -0.00018027331680059433, -0.0001743622124195099, -0.00016845110803842545, -0.000162540003657341, -0.00015662889927625656, -0.00015071779489517212, -0.00014480669051408768, -0.00013889558613300323, -0.0001329844817519188, -0.00012707337737083435, -0.00012116227298974991, -0.00011525116860866547, -0.00010934006422758102, -0.00010342895984649658, -9.751785546541214e-05, -9.16067510843277e-05, -8.569564670324326e-05, -7.978454232215881e-05, -7.387343794107437e-05, -6.796233355998993e-05, -6.205122917890549e-05, -5.6140124797821045e-05, -5.02290204167366e-05, -4.431791603565216e-05, -3.840681165456772e-05, -3.2495707273483276e-05, -2.6584602892398834e-05, -2.0673498511314392e-05, -1.476239413022995e-05, -8.851289749145508e-06, -2.9401853680610657e-06, 2.9709190130233765e-06, 8.882023394107819e-06, 1.479312777519226e-05, 2.0704232156276703e-05, 2.6615336537361145e-05, 3.252644091844559e-05, 3.843754529953003e-05, 4.434864968061447e-05, 5.0259754061698914e-05, 5.6170858442783356e-05, 6.20819628238678e-05, 6.799306720495224e-05, 7.390417158603668e-05, 7.981527596712112e-05, 8.572638034820557e-05, 9.163748472929001e-05, 9.754858911037445e-05, 0.00010345969349145889, 0.00010937079787254333, 0.00011528190225362778, 0.00012119300663471222, 0.00012710411101579666, 0.0001330152153968811, 0.00013892631977796555, 0.00014483742415905, 0.00015074852854013443, 0.00015665963292121887, 0.00016257073730230331, 0.00016848184168338776, 0.0001743929460644722, 0.00018030405044555664]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 2.0, 4.0, 5.0, 11.0, 10.0, 5.0, 10.0, 12.0, 17.0, 17.0, 17.0, 22.0, 20.0, 24.0, 28.0, 29.0, 42.0, 34.0, 34.0, 41.0, 42.0, 34.0, 47.0, 37.0, 52.0, 34.0, 37.0, 36.0, 31.0, 28.0, 30.0, 30.0, 26.0, 25.0, 24.0, 18.0, 19.0, 13.0, 11.0, 10.0, 5.0, 8.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.24609375, -2.181304931640625, -2.11651611328125, -2.051727294921875, -1.9869384765625, -1.922149658203125, -1.85736083984375, -1.792572021484375, -1.727783203125, -1.662994384765625, -1.59820556640625, -1.533416748046875, -1.4686279296875, -1.403839111328125, -1.33905029296875, -1.274261474609375, -1.20947265625, -1.144683837890625, -1.07989501953125, -1.015106201171875, -0.9503173828125, -0.885528564453125, -0.82073974609375, -0.755950927734375, -0.691162109375, -0.626373291015625, -0.56158447265625, -0.496795654296875, -0.4320068359375, -0.367218017578125, -0.30242919921875, -0.237640380859375, -0.1728515625, -0.108062744140625, -0.04327392578125, 0.021514892578125, 0.0863037109375, 0.151092529296875, 0.21588134765625, 0.280670166015625, 0.345458984375, 0.410247802734375, 0.47503662109375, 0.539825439453125, 0.6046142578125, 0.669403076171875, 0.73419189453125, 0.798980712890625, 0.86376953125, 0.928558349609375, 0.99334716796875, 1.058135986328125, 1.1229248046875, 1.187713623046875, 1.25250244140625, 1.317291259765625, 1.382080078125, 1.446868896484375, 1.51165771484375, 1.576446533203125, 1.6412353515625, 1.706024169921875, 1.77081298828125, 1.835601806640625, 1.900390625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 11.0, 8.0, 8.0, 16.0, 22.0, 26.0, 28.0, 57.0, 77.0, 91.0, 152.0, 196.0, 300.0, 491.0, 735.0, 1340.0, 2391.0, 4972.0, 10795.0, 26071.0, 67104.0, 180994.0, 358462.0, 240334.0, 91825.0, 34587.0, 14164.0, 6149.0, 2951.0, 1621.0, 924.0, 545.0, 337.0, 237.0, 170.0, 116.0, 61.0, 49.0, 47.0, 26.0, 19.0, 11.0, 21.0, 8.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.427734375, -2.348541259765625, -2.26934814453125, -2.190155029296875, -2.1109619140625, -2.031768798828125, -1.95257568359375, -1.873382568359375, -1.794189453125, -1.714996337890625, -1.63580322265625, -1.556610107421875, -1.4774169921875, -1.398223876953125, -1.31903076171875, -1.239837646484375, -1.16064453125, -1.081451416015625, -1.00225830078125, -0.923065185546875, -0.8438720703125, -0.764678955078125, -0.68548583984375, -0.606292724609375, -0.527099609375, -0.447906494140625, -0.36871337890625, -0.289520263671875, -0.2103271484375, -0.131134033203125, -0.05194091796875, 0.027252197265625, 0.1064453125, 0.185638427734375, 0.26483154296875, 0.344024658203125, 0.4232177734375, 0.502410888671875, 0.58160400390625, 0.660797119140625, 0.739990234375, 0.819183349609375, 0.89837646484375, 0.977569580078125, 1.0567626953125, 1.135955810546875, 1.21514892578125, 1.294342041015625, 1.37353515625, 1.452728271484375, 1.53192138671875, 1.611114501953125, 1.6903076171875, 1.769500732421875, 1.84869384765625, 1.927886962890625, 2.007080078125, 2.086273193359375, 2.16546630859375, 2.244659423828125, 2.3238525390625, 2.403045654296875, 2.48223876953125, 2.561431884765625, 2.640625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 10.0, 11.0, 5.0, 15.0, 11.0, 11.0, 15.0, 8.0, 22.0, 21.0, 23.0, 32.0, 30.0, 40.0, 36.0, 34.0, 47.0, 44.0, 81.0, 191.0, 1484.0, 290.0, 122.0, 72.0, 50.0, 36.0, 31.0, 31.0, 32.0, 27.0, 24.0, 24.0, 27.0, 17.0, 16.0, 12.0, 12.0, 7.0, 13.0, 8.0, 8.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-7.12890625, -6.91741943359375, -6.7059326171875, -6.49444580078125, -6.282958984375, -6.07147216796875, -5.8599853515625, -5.64849853515625, -5.43701171875, -5.22552490234375, -5.0140380859375, -4.80255126953125, -4.591064453125, -4.37957763671875, -4.1680908203125, -3.95660400390625, -3.7451171875, -3.53363037109375, -3.3221435546875, -3.11065673828125, -2.899169921875, -2.68768310546875, -2.4761962890625, -2.26470947265625, -2.05322265625, -1.84173583984375, -1.6302490234375, -1.41876220703125, -1.207275390625, -0.99578857421875, -0.7843017578125, -0.57281494140625, -0.361328125, -0.14984130859375, 0.0616455078125, 0.27313232421875, 0.484619140625, 0.69610595703125, 0.9075927734375, 1.11907958984375, 1.33056640625, 1.54205322265625, 1.7535400390625, 1.96502685546875, 2.176513671875, 2.38800048828125, 2.5994873046875, 2.81097412109375, 3.0224609375, 3.23394775390625, 3.4454345703125, 3.65692138671875, 3.868408203125, 4.07989501953125, 4.2913818359375, 4.50286865234375, 4.71435546875, 4.92584228515625, 5.1373291015625, 5.34881591796875, 5.560302734375, 5.77178955078125, 5.9832763671875, 6.19476318359375, 6.40625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 4.0, 5.0, 10.0, 16.0, 13.0, 11.0, 22.0, 13.0, 26.0, 30.0, 30.0, 43.0, 59.0, 87.0, 116.0, 226.0, 434.0, 1501.0, 18089.0, 2853192.0, 266078.0, 3944.0, 809.0, 303.0, 181.0, 105.0, 63.0, 60.0, 43.0, 33.0, 24.0, 23.0, 9.0, 16.0, 16.0, 16.0, 9.0, 7.0, 7.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-13.9765625, -13.5069580078125, -13.037353515625, -12.5677490234375, -12.09814453125, -11.6285400390625, -11.158935546875, -10.6893310546875, -10.2197265625, -9.7501220703125, -9.280517578125, -8.8109130859375, -8.34130859375, -7.8717041015625, -7.402099609375, -6.9324951171875, -6.462890625, -5.9932861328125, -5.523681640625, -5.0540771484375, -4.58447265625, -4.1148681640625, -3.645263671875, -3.1756591796875, -2.7060546875, -2.2364501953125, -1.766845703125, -1.2972412109375, -0.82763671875, -0.3580322265625, 0.111572265625, 0.5811767578125, 1.05078125, 1.5203857421875, 1.989990234375, 2.4595947265625, 2.92919921875, 3.3988037109375, 3.868408203125, 4.3380126953125, 4.8076171875, 5.2772216796875, 5.746826171875, 6.2164306640625, 6.68603515625, 7.1556396484375, 7.625244140625, 8.0948486328125, 8.564453125, 9.0340576171875, 9.503662109375, 9.9732666015625, 10.44287109375, 10.9124755859375, 11.382080078125, 11.8516845703125, 12.3212890625, 12.7908935546875, 13.260498046875, 13.7301025390625, 14.19970703125, 14.6693115234375, 15.138916015625, 15.6085205078125, 16.078125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 58.0, 509.0, 403.0, 40.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.01401901245117, -45.538883209228516, -44.06374740600586, -42.58860778808594, -41.11347198486328, -39.638336181640625, -38.16320037841797, -36.68806457519531, -35.212928771972656, -33.73779296875, -32.262657165527344, -30.787519454956055, -29.3123836517334, -27.83724594116211, -26.362110137939453, -24.886974334716797, -23.411836624145508, -21.93670082092285, -20.461563110351562, -18.986427307128906, -17.51129150390625, -16.036155700683594, -14.561017990112305, -13.085882186889648, -11.610745429992676, -10.135608673095703, -8.660472869873047, -7.185336112976074, -5.71019983291626, -4.235063552856445, -2.7599267959594727, -1.2847909927368164, 0.19034576416015625, 1.6654821634292603, 3.1406185626983643, 4.615755081176758, 6.090891361236572, 7.566027641296387, 9.04116439819336, 10.516300201416016, 11.991436958312988, 13.466573715209961, 14.941709518432617, 16.416847229003906, 17.891983032226562, 19.36711883544922, 20.842254638671875, 22.31739044189453, 23.79252815246582, 25.267663955688477, 26.742801666259766, 28.217937469482422, 29.693073272705078, 31.168209075927734, 32.643348693847656, 34.11848449707031, 35.59362030029297, 37.068756103515625, 38.54389190673828, 40.01902770996094, 41.49416732788086, 42.969303131103516, 44.44443893432617, 45.91957473754883, 47.394710540771484]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 4.0, 7.0, 16.0, 15.0, 20.0, 11.0, 22.0, 15.0, 24.0, 24.0, 28.0, 43.0, 38.0, 35.0, 39.0, 40.0, 33.0, 57.0, 38.0, 48.0, 30.0, 32.0, 50.0, 34.0, 39.0, 33.0, 21.0, 31.0, 18.0, 21.0, 22.0, 15.0, 14.0, 13.0, 9.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.036022186279297, -19.33404541015625, -18.632070541381836, -17.93009376525879, -17.228116989135742, -16.526142120361328, -15.824165344238281, -15.12218952178955, -14.42021369934082, -13.71823787689209, -13.016261100769043, -12.314285278320312, -11.612309455871582, -10.910333633422852, -10.208356857299805, -9.506381034851074, -8.804404258728027, -8.102428436279297, -7.400452136993408, -6.6984758377075195, -5.996500015258789, -5.2945237159729, -4.592547416687012, -3.8905715942382812, -3.1885952949523926, -2.486619234085083, -1.7846430540084839, -1.0826668739318848, -0.3806908130645752, 0.3212852478027344, 1.023261547088623, 1.7252373695373535, 2.427213668823242, 3.1291897296905518, 3.8311657905578613, 4.53314208984375, 5.2351179122924805, 5.937094211578369, 6.639070510864258, 7.341046333312988, 8.043022155761719, 8.74499797821045, 9.446974754333496, 10.148950576782227, 10.850926399230957, 11.552902221679688, 12.254878997802734, 12.956854820251465, 13.658831596374512, 14.360807418823242, 15.062784194946289, 15.76476001739502, 16.46673583984375, 17.168712615966797, 17.870689392089844, 18.572664260864258, 19.274641036987305, 19.97661781311035, 20.678592681884766, 21.380569458007812, 22.08254623413086, 22.784521102905273, 23.48649787902832, 24.188472747802734, 24.89044952392578]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 7.0, 7.0, 9.0, 7.0, 7.0, 10.0, 24.0, 20.0, 16.0, 27.0, 21.0, 17.0, 32.0, 38.0, 35.0, 27.0, 42.0, 45.0, 36.0, 51.0, 40.0, 43.0, 33.0, 42.0, 30.0, 43.0, 23.0, 30.0, 37.0, 29.0, 23.0, 36.0, 16.0, 12.0, 18.0, 9.0, 14.0, 11.0, 3.0, 4.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.287109375, -2.218719482421875, -2.15032958984375, -2.081939697265625, -2.0135498046875, -1.945159912109375, -1.87677001953125, -1.808380126953125, -1.739990234375, -1.671600341796875, -1.60321044921875, -1.534820556640625, -1.4664306640625, -1.398040771484375, -1.32965087890625, -1.261260986328125, -1.19287109375, -1.124481201171875, -1.05609130859375, -0.987701416015625, -0.9193115234375, -0.850921630859375, -0.78253173828125, -0.714141845703125, -0.645751953125, -0.577362060546875, -0.50897216796875, -0.440582275390625, -0.3721923828125, -0.303802490234375, -0.23541259765625, -0.167022705078125, -0.0986328125, -0.030242919921875, 0.03814697265625, 0.106536865234375, 0.1749267578125, 0.243316650390625, 0.31170654296875, 0.380096435546875, 0.448486328125, 0.516876220703125, 0.58526611328125, 0.653656005859375, 0.7220458984375, 0.790435791015625, 0.85882568359375, 0.927215576171875, 0.99560546875, 1.063995361328125, 1.13238525390625, 1.200775146484375, 1.2691650390625, 1.337554931640625, 1.40594482421875, 1.474334716796875, 1.542724609375, 1.611114501953125, 1.67950439453125, 1.747894287109375, 1.8162841796875, 1.884674072265625, 1.95306396484375, 2.021453857421875, 2.08984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 9.0, 6.0, 10.0, 17.0, 15.0, 20.0, 32.0, 33.0, 58.0, 70.0, 101.0, 171.0, 299.0, 550.0, 1208.0, 4214.0, 23852.0, 268217.0, 2564993.0, 1231429.0, 84415.0, 10376.0, 2254.0, 813.0, 437.0, 199.0, 129.0, 86.0, 62.0, 42.0, 36.0, 30.0, 12.0, 12.0, 14.0, 14.0, 7.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3359375, -7.1187744140625, -6.901611328125, -6.6844482421875, -6.46728515625, -6.2501220703125, -6.032958984375, -5.8157958984375, -5.5986328125, -5.3814697265625, -5.164306640625, -4.9471435546875, -4.72998046875, -4.5128173828125, -4.295654296875, -4.0784912109375, -3.861328125, -3.6441650390625, -3.427001953125, -3.2098388671875, -2.99267578125, -2.7755126953125, -2.558349609375, -2.3411865234375, -2.1240234375, -1.9068603515625, -1.689697265625, -1.4725341796875, -1.25537109375, -1.0382080078125, -0.821044921875, -0.6038818359375, -0.38671875, -0.1695556640625, 0.047607421875, 0.2647705078125, 0.48193359375, 0.6990966796875, 0.916259765625, 1.1334228515625, 1.3505859375, 1.5677490234375, 1.784912109375, 2.0020751953125, 2.21923828125, 2.4364013671875, 2.653564453125, 2.8707275390625, 3.087890625, 3.3050537109375, 3.522216796875, 3.7393798828125, 3.95654296875, 4.1737060546875, 4.390869140625, 4.6080322265625, 4.8251953125, 5.0423583984375, 5.259521484375, 5.4766845703125, 5.69384765625, 5.9110107421875, 6.128173828125, 6.3453369140625, 6.5625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 15.0, 16.0, 25.0, 32.0, 49.0, 69.0, 122.0, 164.0, 241.0, 307.0, 419.0, 507.0, 547.0, 443.0, 307.0, 250.0, 149.0, 114.0, 95.0, 54.0, 52.0, 27.0, 19.0, 14.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.390625, -11.11346435546875, -10.8363037109375, -10.55914306640625, -10.281982421875, -10.00482177734375, -9.7276611328125, -9.45050048828125, -9.17333984375, -8.89617919921875, -8.6190185546875, -8.34185791015625, -8.064697265625, -7.78753662109375, -7.5103759765625, -7.23321533203125, -6.9560546875, -6.67889404296875, -6.4017333984375, -6.12457275390625, -5.847412109375, -5.57025146484375, -5.2930908203125, -5.01593017578125, -4.73876953125, -4.46160888671875, -4.1844482421875, -3.90728759765625, -3.630126953125, -3.35296630859375, -3.0758056640625, -2.79864501953125, -2.521484375, -2.24432373046875, -1.9671630859375, -1.69000244140625, -1.412841796875, -1.13568115234375, -0.8585205078125, -0.58135986328125, -0.30419921875, -0.02703857421875, 0.2501220703125, 0.52728271484375, 0.804443359375, 1.08160400390625, 1.3587646484375, 1.63592529296875, 1.9130859375, 2.19024658203125, 2.4674072265625, 2.74456787109375, 3.021728515625, 3.29888916015625, 3.5760498046875, 3.85321044921875, 4.13037109375, 4.40753173828125, 4.6846923828125, 4.96185302734375, 5.239013671875, 5.51617431640625, 5.7933349609375, 6.07049560546875, 6.34765625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 7.0, 8.0, 15.0, 29.0, 25.0, 28.0, 56.0, 79.0, 117.0, 196.0, 353.0, 856.0, 4504.0, 241963.0, 3889173.0, 53028.0, 2395.0, 630.0, 262.0, 177.0, 120.0, 74.0, 55.0, 40.0, 24.0, 26.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.674560546875, -14.86474609375, -14.054931640625, -13.2451171875, -12.435302734375, -11.62548828125, -10.815673828125, -10.005859375, -9.196044921875, -8.38623046875, -7.576416015625, -6.7666015625, -5.956787109375, -5.14697265625, -4.337158203125, -3.52734375, -2.717529296875, -1.90771484375, -1.097900390625, -0.2880859375, 0.521728515625, 1.33154296875, 2.141357421875, 2.951171875, 3.760986328125, 4.57080078125, 5.380615234375, 6.1904296875, 7.000244140625, 7.81005859375, 8.619873046875, 9.4296875, 10.239501953125, 11.04931640625, 11.859130859375, 12.6689453125, 13.478759765625, 14.28857421875, 15.098388671875, 15.908203125, 16.718017578125, 17.52783203125, 18.337646484375, 19.1474609375, 19.957275390625, 20.76708984375, 21.576904296875, 22.38671875, 23.196533203125, 24.00634765625, 24.816162109375, 25.6259765625, 26.435791015625, 27.24560546875, 28.055419921875, 28.865234375, 29.675048828125, 30.48486328125, 31.294677734375, 32.1044921875, 32.914306640625, 33.72412109375, 34.533935546875, 35.34375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 30.0, 85.0, 171.0, 259.0, 232.0, 139.0, 60.0, 20.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.64305114746094, -80.0042495727539, -78.36544799804688, -76.72663879394531, -75.08783721923828, -73.44903564453125, -71.81023406982422, -70.17143249511719, -68.53262329101562, -66.8938217163086, -65.25502014160156, -63.616214752197266, -61.97740936279297, -60.33860778808594, -58.699806213378906, -57.061004638671875, -55.422203063964844, -53.78340148925781, -52.144596099853516, -50.505794525146484, -48.86698913574219, -47.228187561035156, -45.589385986328125, -43.950584411621094, -42.3117790222168, -40.672977447509766, -39.03417205810547, -37.39537048339844, -35.756568908691406, -34.11776351928711, -32.47896194458008, -30.840158462524414, -29.201351165771484, -27.56254768371582, -25.923744201660156, -24.284942626953125, -22.64613914489746, -21.007335662841797, -19.368534088134766, -17.7297306060791, -16.090927124023438, -14.452123641967773, -12.813321113586426, -11.174518585205078, -9.535715103149414, -7.89691162109375, -6.258109092712402, -4.619306564331055, -2.9805030822753906, -1.3417000770568848, 0.2971029281616211, 1.935905933380127, 3.574708938598633, 5.213512420654297, 6.8523149490356445, 8.491117477416992, 10.129920959472656, 11.76872444152832, 13.407526969909668, 15.046329498291016, 16.68513298034668, 18.323936462402344, 19.962738037109375, 21.60154151916504, 23.240345001220703]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 12.0, 14.0, 12.0, 18.0, 17.0, 15.0, 15.0, 25.0, 34.0, 26.0, 36.0, 45.0, 39.0, 38.0, 34.0, 41.0, 39.0, 52.0, 29.0, 51.0, 38.0, 34.0, 38.0, 27.0, 35.0, 23.0, 30.0, 23.0, 24.0, 17.0, 18.0, 11.0, 19.0, 17.0, 17.0, 8.0, 2.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.884597778320312, -25.114299774169922, -24.34400177001953, -23.57370376586914, -22.803407669067383, -22.033109664916992, -21.2628116607666, -20.49251365661621, -19.722217559814453, -18.951919555664062, -18.181621551513672, -17.41132354736328, -16.641027450561523, -15.870729446411133, -15.100431442260742, -14.330133438110352, -13.559835433959961, -12.78953742980957, -12.019240379333496, -11.248942375183105, -10.478645324707031, -9.70834732055664, -8.93804931640625, -8.16775131225586, -7.397454261779785, -6.627156734466553, -5.85685920715332, -5.08656120300293, -4.316263675689697, -3.545966148376465, -2.775668144226074, -2.005370616912842, -1.2350730895996094, -0.4647754430770874, 0.30552220344543457, 1.075819969177246, 1.8461174964904785, 2.616415023803711, 3.3867130279541016, 4.157010555267334, 4.927308082580566, 5.697605609893799, 6.467903137207031, 7.238201141357422, 8.008499145507812, 8.778796195983887, 9.549094200134277, 10.319391250610352, 11.089689254760742, 11.859987258911133, 12.630284309387207, 13.400582313537598, 14.170879364013672, 14.941177368164062, 15.711475372314453, 16.481773376464844, 17.252071380615234, 18.022369384765625, 18.792667388916016, 19.562965393066406, 20.333261489868164, 21.103559494018555, 21.873857498168945, 22.644155502319336, 23.414451599121094]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 11.0, 18.0, 17.0, 16.0, 26.0, 17.0, 29.0, 27.0, 30.0, 26.0, 32.0, 25.0, 31.0, 32.0, 35.0, 52.0, 45.0, 38.0, 46.0, 29.0, 28.0, 38.0, 35.0, 26.0, 37.0, 25.0, 22.0, 16.0, 23.0, 23.0, 19.0, 14.0, 12.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.142578125, -2.0771484375, -2.01171875, -1.9462890625, -1.880859375, -1.8154296875, -1.75, -1.6845703125, -1.619140625, -1.5537109375, -1.48828125, -1.4228515625, -1.357421875, -1.2919921875, -1.2265625, -1.1611328125, -1.095703125, -1.0302734375, -0.96484375, -0.8994140625, -0.833984375, -0.7685546875, -0.703125, -0.6376953125, -0.572265625, -0.5068359375, -0.44140625, -0.3759765625, -0.310546875, -0.2451171875, -0.1796875, -0.1142578125, -0.048828125, 0.0166015625, 0.08203125, 0.1474609375, 0.212890625, 0.2783203125, 0.34375, 0.4091796875, 0.474609375, 0.5400390625, 0.60546875, 0.6708984375, 0.736328125, 0.8017578125, 0.8671875, 0.9326171875, 0.998046875, 1.0634765625, 1.12890625, 1.1943359375, 1.259765625, 1.3251953125, 1.390625, 1.4560546875, 1.521484375, 1.5869140625, 1.65234375, 1.7177734375, 1.783203125, 1.8486328125, 1.9140625, 1.9794921875, 2.044921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 0.0, 8.0, 8.0, 12.0, 28.0, 43.0, 52.0, 78.0, 67.0, 149.0, 214.0, 303.0, 449.0, 602.0, 918.0, 1290.0, 1835.0, 2572.0, 3776.0, 5451.0, 7865.0, 11103.0, 16003.0, 22976.0, 33099.0, 48983.0, 74074.0, 122274.0, 275982.0, 154242.0, 85526.0, 55614.0, 37714.0, 25923.0, 18035.0, 12540.0, 8620.0, 6081.0, 4283.0, 2990.0, 2037.0, 1488.0, 1006.0, 626.0, 486.0, 373.0, 252.0, 158.0, 123.0, 73.0, 56.0, 35.0, 26.0, 15.0, 15.0, 3.0, 4.0, 2.0, 2.0, 4.0], "bins": [-0.43408203125, -0.4207916259765625, -0.407501220703125, -0.3942108154296875, -0.38092041015625, -0.3676300048828125, -0.354339599609375, -0.3410491943359375, -0.3277587890625, -0.3144683837890625, -0.301177978515625, -0.2878875732421875, -0.27459716796875, -0.2613067626953125, -0.248016357421875, -0.2347259521484375, -0.221435546875, -0.2081451416015625, -0.194854736328125, -0.1815643310546875, -0.16827392578125, -0.1549835205078125, -0.141693115234375, -0.1284027099609375, -0.1151123046875, -0.1018218994140625, -0.088531494140625, -0.0752410888671875, -0.06195068359375, -0.0486602783203125, -0.035369873046875, -0.0220794677734375, -0.0087890625, 0.0045013427734375, 0.017791748046875, 0.0310821533203125, 0.04437255859375, 0.0576629638671875, 0.070953369140625, 0.0842437744140625, 0.0975341796875, 0.1108245849609375, 0.124114990234375, 0.1374053955078125, 0.15069580078125, 0.1639862060546875, 0.177276611328125, 0.1905670166015625, 0.203857421875, 0.2171478271484375, 0.230438232421875, 0.2437286376953125, 0.25701904296875, 0.2703094482421875, 0.283599853515625, 0.2968902587890625, 0.3101806640625, 0.3234710693359375, 0.336761474609375, 0.3500518798828125, 0.36334228515625, 0.3766326904296875, 0.389923095703125, 0.4032135009765625, 0.41650390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 10.0, 17.0, 17.0, 10.0, 17.0, 20.0, 15.0, 29.0, 37.0, 32.0, 39.0, 40.0, 46.0, 50.0, 42.0, 50.0, 1066.0, 44.0, 52.0, 38.0, 41.0, 41.0, 33.0, 40.0, 29.0, 28.0, 26.0, 12.0, 17.0, 8.0, 16.0, 15.0, 8.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5205078125, -1.4700469970703125, -1.419586181640625, -1.3691253662109375, -1.31866455078125, -1.2682037353515625, -1.217742919921875, -1.1672821044921875, -1.1168212890625, -1.0663604736328125, -1.015899658203125, -0.9654388427734375, -0.91497802734375, -0.8645172119140625, -0.814056396484375, -0.7635955810546875, -0.713134765625, -0.6626739501953125, -0.612213134765625, -0.5617523193359375, -0.51129150390625, -0.4608306884765625, -0.410369873046875, -0.3599090576171875, -0.3094482421875, -0.2589874267578125, -0.208526611328125, -0.1580657958984375, -0.10760498046875, -0.0571441650390625, -0.006683349609375, 0.0437774658203125, 0.09423828125, 0.1446990966796875, 0.195159912109375, 0.2456207275390625, 0.29608154296875, 0.3465423583984375, 0.397003173828125, 0.4474639892578125, 0.4979248046875, 0.5483856201171875, 0.598846435546875, 0.6493072509765625, 0.69976806640625, 0.7502288818359375, 0.800689697265625, 0.8511505126953125, 0.901611328125, 0.9520721435546875, 1.002532958984375, 1.0529937744140625, 1.10345458984375, 1.1539154052734375, 1.204376220703125, 1.2548370361328125, 1.3052978515625, 1.3557586669921875, 1.406219482421875, 1.4566802978515625, 1.50714111328125, 1.5576019287109375, 1.608062744140625, 1.6585235595703125, 1.708984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 10.0, 8.0, 23.0, 31.0, 47.0, 69.0, 135.0, 161.0, 260.0, 436.0, 705.0, 1048.0, 1789.0, 2989.0, 5023.0, 8514.0, 14697.0, 26479.0, 49534.0, 99318.0, 256068.0, 1390665.0, 113411.0, 56340.0, 29762.0, 16383.0, 9382.0, 5355.0, 3346.0, 1882.0, 1207.0, 713.0, 501.0, 269.0, 180.0, 141.0, 72.0, 57.0, 42.0, 21.0, 16.0, 13.0, 9.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6962890625, -0.6758651733398438, -0.6554412841796875, -0.6350173950195312, -0.614593505859375, -0.5941696166992188, -0.5737457275390625, -0.5533218383789062, -0.53289794921875, -0.5124740600585938, -0.4920501708984375, -0.47162628173828125, -0.451202392578125, -0.43077850341796875, -0.4103546142578125, -0.38993072509765625, -0.3695068359375, -0.34908294677734375, -0.3286590576171875, -0.30823516845703125, -0.287811279296875, -0.26738739013671875, -0.2469635009765625, -0.22653961181640625, -0.20611572265625, -0.18569183349609375, -0.1652679443359375, -0.14484405517578125, -0.124420166015625, -0.10399627685546875, -0.0835723876953125, -0.06314849853515625, -0.042724609375, -0.02230072021484375, -0.0018768310546875, 0.01854705810546875, 0.038970947265625, 0.05939483642578125, 0.0798187255859375, 0.10024261474609375, 0.12066650390625, 0.14109039306640625, 0.1615142822265625, 0.18193817138671875, 0.202362060546875, 0.22278594970703125, 0.2432098388671875, 0.26363372802734375, 0.2840576171875, 0.30448150634765625, 0.3249053955078125, 0.34532928466796875, 0.365753173828125, 0.38617706298828125, 0.4066009521484375, 0.42702484130859375, 0.44744873046875, 0.46787261962890625, 0.4882965087890625, 0.5087203979492188, 0.529144287109375, 0.5495681762695312, 0.5699920654296875, 0.5904159545898438, 0.61083984375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 11.0, 10.0, 13.0, 20.0, 28.0, 27.0, 39.0, 41.0, 57.0, 65.0, 74.0, 89.0, 95.0, 87.0, 70.0, 39.0, 40.0, 25.0, 29.0, 16.0, 23.0, 16.0, 9.0, 12.0, 7.0, 13.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0003712177276611328, -0.00035952404141426086, -0.0003478303551673889, -0.00033613666892051697, -0.000324442982673645, -0.00031274929642677307, -0.0003010556101799011, -0.0002893619239330292, -0.0002776682376861572, -0.0002659745514392853, -0.00025428086519241333, -0.00024258717894554138, -0.00023089349269866943, -0.00021919980645179749, -0.00020750612020492554, -0.0001958124339580536, -0.00018411874771118164, -0.0001724250614643097, -0.00016073137521743774, -0.0001490376889705658, -0.00013734400272369385, -0.0001256503164768219, -0.00011395663022994995, -0.000102262943983078, -9.056925773620605e-05, -7.88755714893341e-05, -6.718188524246216e-05, -5.548819899559021e-05, -4.379451274871826e-05, -3.2100826501846313e-05, -2.0407140254974365e-05, -8.713454008102417e-06, 2.9802322387695312e-06, 1.467391848564148e-05, 2.6367604732513428e-05, 3.8061290979385376e-05, 4.9754977226257324e-05, 6.144866347312927e-05, 7.314234972000122e-05, 8.483603596687317e-05, 9.652972221374512e-05, 0.00010822340846061707, 0.00011991709470748901, 0.00013161078095436096, 0.0001433044672012329, 0.00015499815344810486, 0.0001666918396949768, 0.00017838552594184875, 0.0001900792121887207, 0.00020177289843559265, 0.0002134665846824646, 0.00022516027092933655, 0.0002368539571762085, 0.00024854764342308044, 0.0002602413296699524, 0.00027193501591682434, 0.0002836287021636963, 0.00029532238841056824, 0.0003070160746574402, 0.00031870976090431213, 0.0003304034471511841, 0.00034209713339805603, 0.000353790819644928, 0.0003654845058917999, 0.0003771781921386719]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 6.0, 11.0, 9.0, 28.0, 27.0, 35.0, 42.0, 46.0, 76.0, 112.0, 148.0, 269.0, 580.0, 4417.0, 1032769.0, 8476.0, 562.0, 312.0, 190.0, 101.0, 81.0, 47.0, 49.0, 35.0, 31.0, 22.0, 11.0, 9.0, 9.0, 6.0, 7.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00824737548828125, -0.00799405574798584, -0.00774073600769043, -0.0074874162673950195, -0.007234096527099609, -0.006980776786804199, -0.006727457046508789, -0.006474137306213379, -0.006220817565917969, -0.005967497825622559, -0.0057141780853271484, -0.005460858345031738, -0.005207538604736328, -0.004954218864440918, -0.004700899124145508, -0.004447579383850098, -0.0041942596435546875, -0.003940939903259277, -0.003687620162963867, -0.003434300422668457, -0.003180980682373047, -0.0029276609420776367, -0.0026743412017822266, -0.0024210214614868164, -0.0021677017211914062, -0.001914381980895996, -0.001661062240600586, -0.0014077425003051758, -0.0011544227600097656, -0.0009011030197143555, -0.0006477832794189453, -0.00039446353912353516, -0.000141143798828125, 0.00011217594146728516, 0.0003654956817626953, 0.0006188154220581055, 0.0008721351623535156, 0.0011254549026489258, 0.001378774642944336, 0.001632094383239746, 0.0018854141235351562, 0.0021387338638305664, 0.0023920536041259766, 0.0026453733444213867, 0.002898693084716797, 0.003152012825012207, 0.003405332565307617, 0.0036586523056030273, 0.0039119720458984375, 0.004165291786193848, 0.004418611526489258, 0.004671931266784668, 0.004925251007080078, 0.005178570747375488, 0.0054318904876708984, 0.005685210227966309, 0.005938529968261719, 0.006191849708557129, 0.006445169448852539, 0.006698489189147949, 0.006951808929443359, 0.0072051286697387695, 0.00745844841003418, 0.00771176815032959, 0.007965087890625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 10.0, 158.0, 583.0, 241.0, 21.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011593077797442675, -0.0011284862412139773, -0.0010976645862683654, -0.0010668430477380753, -0.0010360213927924633, -0.0010051998542621732, -0.0009743782575242221, -0.0009435566607862711, -0.0009127350640483201, -0.000881913467310369, -0.000851091870572418, -0.0008202702738344669, -0.0007894487353041768, -0.0007586270803585649, -0.0007278055418282747, -0.0006969839450903237, -0.0006661623483523726, -0.0006353407516144216, -0.0006045191548764706, -0.0005736975581385195, -0.0005428759614005685, -0.0005120544228702784, -0.0004812328261323273, -0.0004504112293943763, -0.00041958963265642524, -0.0003887680359184742, -0.00035794643918052316, -0.0003271248715464026, -0.00029630327480845153, -0.0002654816780705005, -0.00023466009588446468, -0.00020383851369842887, -0.00017301685875281692, -0.00014219526201486588, -0.00011137367982883006, -8.055209036683664e-05, -4.973050090484321e-05, -1.890890416689217e-05, 1.1912678019143641e-05, 4.273426020517945e-05, 7.355585694313049e-05, 0.00010437744640512392, 0.00013519903586711735, 0.00016602061805315316, 0.0001968422147911042, 0.00022766381152905524, 0.0002584853791631758, 0.00028930697590112686, 0.0003201285726390779, 0.00035095016937702894, 0.00038177176611498, 0.00041259333374910057, 0.0004434149304870516, 0.00047423652722500265, 0.0005050580948591232, 0.0005358796915970743, 0.0005667012883350253, 0.0005975228850729764, 0.0006283444818109274, 0.0006591660785488784, 0.0006899876752868295, 0.0007208092138171196, 0.0007516308105550706, 0.0007824524072930217, 0.0008132740040309727]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 7.0, 5.0, 6.0, 7.0, 18.0, 13.0, 13.0, 20.0, 12.0, 25.0, 16.0, 27.0, 32.0, 36.0, 30.0, 28.0, 28.0, 42.0, 28.0, 41.0, 36.0, 32.0, 34.0, 31.0, 39.0, 37.0, 30.0, 28.0, 42.0, 26.0, 27.0, 17.0, 34.0, 22.0, 16.0, 16.0, 9.0, 14.0, 17.0, 13.0, 12.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00016307830810546875, -0.00015824567526578903, -0.00015341304242610931, -0.0001485804095864296, -0.00014374777674674988, -0.00013891514390707016, -0.00013408251106739044, -0.00012924987822771072, -0.000124417245388031, -0.00011958461254835129, -0.00011475197970867157, -0.00010991934686899185, -0.00010508671402931213, -0.00010025408118963242, -9.54214483499527e-05, -9.058881551027298e-05, -8.575618267059326e-05, -8.092354983091354e-05, -7.609091699123383e-05, -7.125828415155411e-05, -6.642565131187439e-05, -6.159301847219467e-05, -5.6760385632514954e-05, -5.1927752792835236e-05, -4.709511995315552e-05, -4.22624871134758e-05, -3.742985427379608e-05, -3.2597221434116364e-05, -2.7764588594436646e-05, -2.2931955754756927e-05, -1.809932291507721e-05, -1.3266690075397491e-05, -8.434057235717773e-06, -3.6014243960380554e-06, 1.2312084436416626e-06, 6.063841283321381e-06, 1.0896474123001099e-05, 1.5729106962680817e-05, 2.0561739802360535e-05, 2.5394372642040253e-05, 3.022700548171997e-05, 3.505963832139969e-05, 3.989227116107941e-05, 4.4724904000759125e-05, 4.955753684043884e-05, 5.439016968011856e-05, 5.922280251979828e-05, 6.4055435359478e-05, 6.888806819915771e-05, 7.372070103883743e-05, 7.855333387851715e-05, 8.338596671819687e-05, 8.821859955787659e-05, 9.30512323975563e-05, 9.788386523723602e-05, 0.00010271649807691574, 0.00010754913091659546, 0.00011238176375627518, 0.0001172143965959549, 0.00012204702943563461, 0.00012687966227531433, 0.00013171229511499405, 0.00013654492795467377, 0.00014137756079435349, 0.0001462101936340332]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 11.0, 18.0, 17.0, 16.0, 26.0, 17.0, 29.0, 27.0, 30.0, 26.0, 32.0, 25.0, 31.0, 32.0, 35.0, 52.0, 45.0, 38.0, 46.0, 29.0, 28.0, 38.0, 35.0, 26.0, 37.0, 25.0, 22.0, 16.0, 23.0, 23.0, 19.0, 14.0, 12.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.142578125, -2.0771484375, -2.01171875, -1.9462890625, -1.880859375, -1.8154296875, -1.75, -1.6845703125, -1.619140625, -1.5537109375, -1.48828125, -1.4228515625, -1.357421875, -1.2919921875, -1.2265625, -1.1611328125, -1.095703125, -1.0302734375, -0.96484375, -0.8994140625, -0.833984375, -0.7685546875, -0.703125, -0.6376953125, -0.572265625, -0.5068359375, -0.44140625, -0.3759765625, -0.310546875, -0.2451171875, -0.1796875, -0.1142578125, -0.048828125, 0.0166015625, 0.08203125, 0.1474609375, 0.212890625, 0.2783203125, 0.34375, 0.4091796875, 0.474609375, 0.5400390625, 0.60546875, 0.6708984375, 0.736328125, 0.8017578125, 0.8671875, 0.9326171875, 0.998046875, 1.0634765625, 1.12890625, 1.1943359375, 1.259765625, 1.3251953125, 1.390625, 1.4560546875, 1.521484375, 1.5869140625, 1.65234375, 1.7177734375, 1.783203125, 1.8486328125, 1.9140625, 1.9794921875, 2.044921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 12.0, 11.0, 11.0, 19.0, 24.0, 31.0, 51.0, 61.0, 69.0, 101.0, 154.0, 230.0, 317.0, 465.0, 827.0, 1326.0, 2415.0, 4772.0, 9359.0, 20803.0, 51395.0, 152519.0, 423922.0, 246403.0, 77311.0, 29198.0, 12910.0, 6183.0, 3048.0, 1653.0, 998.0, 658.0, 376.0, 277.0, 200.0, 120.0, 106.0, 60.0, 38.0, 36.0, 22.0, 26.0, 14.0, 5.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.474609375, -2.39654541015625, -2.3184814453125, -2.24041748046875, -2.162353515625, -2.08428955078125, -2.0062255859375, -1.92816162109375, -1.85009765625, -1.77203369140625, -1.6939697265625, -1.61590576171875, -1.537841796875, -1.45977783203125, -1.3817138671875, -1.30364990234375, -1.2255859375, -1.14752197265625, -1.0694580078125, -0.99139404296875, -0.913330078125, -0.83526611328125, -0.7572021484375, -0.67913818359375, -0.60107421875, -0.52301025390625, -0.4449462890625, -0.36688232421875, -0.288818359375, -0.21075439453125, -0.1326904296875, -0.05462646484375, 0.0234375, 0.10150146484375, 0.1795654296875, 0.25762939453125, 0.335693359375, 0.41375732421875, 0.4918212890625, 0.56988525390625, 0.64794921875, 0.72601318359375, 0.8040771484375, 0.88214111328125, 0.960205078125, 1.03826904296875, 1.1163330078125, 1.19439697265625, 1.2724609375, 1.35052490234375, 1.4285888671875, 1.50665283203125, 1.584716796875, 1.66278076171875, 1.7408447265625, 1.81890869140625, 1.89697265625, 1.97503662109375, 2.0531005859375, 2.13116455078125, 2.209228515625, 2.28729248046875, 2.3653564453125, 2.44342041015625, 2.521484375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 3.0, 3.0, 9.0, 6.0, 10.0, 13.0, 17.0, 19.0, 28.0, 24.0, 32.0, 35.0, 55.0, 44.0, 59.0, 54.0, 114.0, 432.0, 1519.0, 123.0, 50.0, 55.0, 53.0, 50.0, 38.0, 33.0, 29.0, 31.0, 28.0, 26.0, 8.0, 8.0, 9.0, 10.0, 3.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.7147216796875, -7.429443359375, -7.1441650390625, -6.85888671875, -6.5736083984375, -6.288330078125, -6.0030517578125, -5.7177734375, -5.4324951171875, -5.147216796875, -4.8619384765625, -4.57666015625, -4.2913818359375, -4.006103515625, -3.7208251953125, -3.435546875, -3.1502685546875, -2.864990234375, -2.5797119140625, -2.29443359375, -2.0091552734375, -1.723876953125, -1.4385986328125, -1.1533203125, -0.8680419921875, -0.582763671875, -0.2974853515625, -0.01220703125, 0.2730712890625, 0.558349609375, 0.8436279296875, 1.12890625, 1.4141845703125, 1.699462890625, 1.9847412109375, 2.27001953125, 2.5552978515625, 2.840576171875, 3.1258544921875, 3.4111328125, 3.6964111328125, 3.981689453125, 4.2669677734375, 4.55224609375, 4.8375244140625, 5.122802734375, 5.4080810546875, 5.693359375, 5.9786376953125, 6.263916015625, 6.5491943359375, 6.83447265625, 7.1197509765625, 7.405029296875, 7.6903076171875, 7.9755859375, 8.2608642578125, 8.546142578125, 8.8314208984375, 9.11669921875, 9.4019775390625, 9.687255859375, 9.9725341796875, 10.2578125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 18.0, 12.0, 8.0, 12.0, 23.0, 32.0, 41.0, 57.0, 55.0, 79.0, 117.0, 191.0, 348.0, 1101.0, 11049.0, 2046745.0, 1075322.0, 8569.0, 948.0, 378.0, 171.0, 109.0, 65.0, 59.0, 44.0, 36.0, 21.0, 21.0, 12.0, 10.0, 10.0, 17.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.6875, -16.210205078125, -15.73291015625, -15.255615234375, -14.7783203125, -14.301025390625, -13.82373046875, -13.346435546875, -12.869140625, -12.391845703125, -11.91455078125, -11.437255859375, -10.9599609375, -10.482666015625, -10.00537109375, -9.528076171875, -9.05078125, -8.573486328125, -8.09619140625, -7.618896484375, -7.1416015625, -6.664306640625, -6.18701171875, -5.709716796875, -5.232421875, -4.755126953125, -4.27783203125, -3.800537109375, -3.3232421875, -2.845947265625, -2.36865234375, -1.891357421875, -1.4140625, -0.936767578125, -0.45947265625, 0.017822265625, 0.4951171875, 0.972412109375, 1.44970703125, 1.927001953125, 2.404296875, 2.881591796875, 3.35888671875, 3.836181640625, 4.3134765625, 4.790771484375, 5.26806640625, 5.745361328125, 6.22265625, 6.699951171875, 7.17724609375, 7.654541015625, 8.1318359375, 8.609130859375, 9.08642578125, 9.563720703125, 10.041015625, 10.518310546875, 10.99560546875, 11.472900390625, 11.9501953125, 12.427490234375, 12.90478515625, 13.382080078125, 13.859375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 37.0, 138.0, 324.0, 339.0, 140.0, 26.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.88785934448242, -42.930809020996094, -41.97376251220703, -41.0167121887207, -40.059661865234375, -39.10261154174805, -38.14556121826172, -37.188514709472656, -36.23146438598633, -35.2744140625, -34.31736755371094, -33.36031723022461, -32.40326690673828, -31.446216583251953, -30.489168167114258, -29.532119750976562, -28.575069427490234, -27.618019104003906, -26.66097068786621, -25.703922271728516, -24.746871948242188, -23.78982162475586, -22.832773208618164, -21.87572479248047, -20.91867446899414, -19.961624145507812, -19.004575729370117, -18.047527313232422, -17.090476989746094, -16.133426666259766, -15.17637825012207, -14.219328880310059, -13.262277603149414, -12.305228233337402, -11.34817886352539, -10.391129493713379, -9.434080123901367, -8.477030754089355, -7.519981384277344, -6.562932014465332, -5.60588264465332, -4.648833274841309, -3.691783905029297, -2.734734535217285, -1.7776851654052734, -0.8206357955932617, 0.13641357421875, 1.0934629440307617, 2.0505123138427734, 3.007561683654785, 3.964611053466797, 4.921660423278809, 5.87870979309082, 6.835759162902832, 7.792808532714844, 8.749857902526855, 9.706907272338867, 10.663956642150879, 11.62100601196289, 12.578055381774902, 13.535104751586914, 14.492154121398926, 15.449203491210938, 16.406253814697266, 17.36330223083496]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 13.0, 8.0, 16.0, 15.0, 12.0, 17.0, 13.0, 20.0, 22.0, 32.0, 28.0, 31.0, 36.0, 35.0, 35.0, 41.0, 43.0, 45.0, 39.0, 35.0, 30.0, 45.0, 32.0, 45.0, 26.0, 33.0, 32.0, 23.0, 34.0, 22.0, 17.0, 17.0, 13.0, 16.0, 12.0, 14.0, 3.0, 9.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-27.39957618713379, -26.6306209564209, -25.86166763305664, -25.09271240234375, -24.32375717163086, -23.5548038482666, -22.78584861755371, -22.016895294189453, -21.247940063476562, -20.478984832763672, -19.710031509399414, -18.941076278686523, -18.172122955322266, -17.403167724609375, -16.634212493896484, -15.86525821685791, -15.096303939819336, -14.327349662780762, -13.558395385742188, -12.789440155029297, -12.020485877990723, -11.251531600952148, -10.482576370239258, -9.713622093200684, -8.94466781616211, -8.175713539123535, -7.406758785247803, -6.63780403137207, -5.868849754333496, -5.099895477294922, -4.3309407234191895, -3.561985969543457, -2.7930335998535156, -2.0240790843963623, -1.255124568939209, -0.48617005348205566, 0.28278446197509766, 1.051738977432251, 1.8206934928894043, 2.5896482467651367, 3.358602523803711, 4.127556800842285, 4.896511554718018, 5.66546630859375, 6.434420585632324, 7.203374862670898, 7.972329616546631, 8.741284370422363, 9.510238647460938, 10.279192924499512, 11.048147201538086, 11.817102432250977, 12.58605670928955, 13.355010986328125, 14.123966217041016, 14.89292049407959, 15.661874771118164, 16.430830001831055, 17.199783325195312, 17.968738555908203, 18.737693786621094, 19.50664710998535, 20.275602340698242, 21.0445556640625, 21.81351089477539]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 3.0, 2.0, 5.0, 2.0, 7.0, 8.0, 12.0, 16.0, 15.0, 15.0, 22.0, 21.0, 18.0, 22.0, 23.0, 31.0, 25.0, 29.0, 25.0, 41.0, 32.0, 33.0, 44.0, 31.0, 51.0, 42.0, 34.0, 37.0, 39.0, 34.0, 35.0, 19.0, 19.0, 34.0, 15.0, 19.0, 19.0, 26.0, 11.0, 18.0, 15.0, 12.0, 10.0, 3.0, 7.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1640625, -2.096588134765625, -2.02911376953125, -1.961639404296875, -1.8941650390625, -1.826690673828125, -1.75921630859375, -1.691741943359375, -1.624267578125, -1.556793212890625, -1.48931884765625, -1.421844482421875, -1.3543701171875, -1.286895751953125, -1.21942138671875, -1.151947021484375, -1.08447265625, -1.016998291015625, -0.94952392578125, -0.882049560546875, -0.8145751953125, -0.747100830078125, -0.67962646484375, -0.612152099609375, -0.544677734375, -0.477203369140625, -0.40972900390625, -0.342254638671875, -0.2747802734375, -0.207305908203125, -0.13983154296875, -0.072357177734375, -0.0048828125, 0.062591552734375, 0.13006591796875, 0.197540283203125, 0.2650146484375, 0.332489013671875, 0.39996337890625, 0.467437744140625, 0.534912109375, 0.602386474609375, 0.66986083984375, 0.737335205078125, 0.8048095703125, 0.872283935546875, 0.93975830078125, 1.007232666015625, 1.07470703125, 1.142181396484375, 1.20965576171875, 1.277130126953125, 1.3446044921875, 1.412078857421875, 1.47955322265625, 1.547027587890625, 1.614501953125, 1.681976318359375, 1.74945068359375, 1.816925048828125, 1.8843994140625, 1.951873779296875, 2.01934814453125, 2.086822509765625, 2.154296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 8.0, 10.0, 10.0, 12.0, 12.0, 13.0, 12.0, 15.0, 23.0, 28.0, 19.0, 16.0, 26.0, 31.0, 37.0, 60.0, 148.0, 468.0, 2428.0, 42806.0, 2771058.0, 1356148.0, 18638.0, 1502.0, 310.0, 113.0, 56.0, 44.0, 26.0, 27.0, 17.0, 15.0, 12.0, 20.0, 20.0, 20.0, 17.0, 11.0, 12.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.430419921875, -12.04052734375, -11.650634765625, -11.2607421875, -10.870849609375, -10.48095703125, -10.091064453125, -9.701171875, -9.311279296875, -8.92138671875, -8.531494140625, -8.1416015625, -7.751708984375, -7.36181640625, -6.971923828125, -6.58203125, -6.192138671875, -5.80224609375, -5.412353515625, -5.0224609375, -4.632568359375, -4.24267578125, -3.852783203125, -3.462890625, -3.072998046875, -2.68310546875, -2.293212890625, -1.9033203125, -1.513427734375, -1.12353515625, -0.733642578125, -0.34375, 0.046142578125, 0.43603515625, 0.825927734375, 1.2158203125, 1.605712890625, 1.99560546875, 2.385498046875, 2.775390625, 3.165283203125, 3.55517578125, 3.945068359375, 4.3349609375, 4.724853515625, 5.11474609375, 5.504638671875, 5.89453125, 6.284423828125, 6.67431640625, 7.064208984375, 7.4541015625, 7.843994140625, 8.23388671875, 8.623779296875, 9.013671875, 9.403564453125, 9.79345703125, 10.183349609375, 10.5732421875, 10.963134765625, 11.35302734375, 11.742919921875, 12.1328125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 8.0, 6.0, 6.0, 6.0, 15.0, 21.0, 22.0, 30.0, 48.0, 60.0, 70.0, 102.0, 128.0, 201.0, 250.0, 271.0, 419.0, 415.0, 403.0, 348.0, 334.0, 266.0, 157.0, 127.0, 107.0, 65.0, 27.0, 27.0, 39.0, 25.0, 19.0, 18.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.08026123046875, -6.8714599609375, -6.66265869140625, -6.453857421875, -6.24505615234375, -6.0362548828125, -5.82745361328125, -5.61865234375, -5.40985107421875, -5.2010498046875, -4.99224853515625, -4.783447265625, -4.57464599609375, -4.3658447265625, -4.15704345703125, -3.9482421875, -3.73944091796875, -3.5306396484375, -3.32183837890625, -3.113037109375, -2.90423583984375, -2.6954345703125, -2.48663330078125, -2.27783203125, -2.06903076171875, -1.8602294921875, -1.65142822265625, -1.442626953125, -1.23382568359375, -1.0250244140625, -0.81622314453125, -0.607421875, -0.39862060546875, -0.1898193359375, 0.01898193359375, 0.227783203125, 0.43658447265625, 0.6453857421875, 0.85418701171875, 1.06298828125, 1.27178955078125, 1.4805908203125, 1.68939208984375, 1.898193359375, 2.10699462890625, 2.3157958984375, 2.52459716796875, 2.7333984375, 2.94219970703125, 3.1510009765625, 3.35980224609375, 3.568603515625, 3.77740478515625, 3.9862060546875, 4.19500732421875, 4.40380859375, 4.61260986328125, 4.8214111328125, 5.03021240234375, 5.239013671875, 5.44781494140625, 5.6566162109375, 5.86541748046875, 6.07421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 21.0, 20.0, 34.0, 37.0, 58.0, 122.0, 139.0, 240.0, 508.0, 2925.0, 361250.0, 3812626.0, 14491.0, 883.0, 362.0, 184.0, 110.0, 107.0, 56.0, 31.0, 22.0, 15.0, 11.0, 8.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.171875, -26.135986328125, -25.10009765625, -24.064208984375, -23.0283203125, -21.992431640625, -20.95654296875, -19.920654296875, -18.884765625, -17.848876953125, -16.81298828125, -15.777099609375, -14.7412109375, -13.705322265625, -12.66943359375, -11.633544921875, -10.59765625, -9.561767578125, -8.52587890625, -7.489990234375, -6.4541015625, -5.418212890625, -4.38232421875, -3.346435546875, -2.310546875, -1.274658203125, -0.23876953125, 0.797119140625, 1.8330078125, 2.868896484375, 3.90478515625, 4.940673828125, 5.9765625, 7.012451171875, 8.04833984375, 9.084228515625, 10.1201171875, 11.156005859375, 12.19189453125, 13.227783203125, 14.263671875, 15.299560546875, 16.33544921875, 17.371337890625, 18.4072265625, 19.443115234375, 20.47900390625, 21.514892578125, 22.55078125, 23.586669921875, 24.62255859375, 25.658447265625, 26.6943359375, 27.730224609375, 28.76611328125, 29.802001953125, 30.837890625, 31.873779296875, 32.90966796875, 33.945556640625, 34.9814453125, 36.017333984375, 37.05322265625, 38.089111328125, 39.125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 30.0, 165.0, 378.0, 330.0, 100.0, 10.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-170.1788787841797, -167.13201904296875, -164.0851593017578, -161.03829956054688, -157.99143981933594, -154.944580078125, -151.89773559570312, -148.8508758544922, -145.80401611328125, -142.7571563720703, -139.71029663085938, -136.66343688964844, -133.6165771484375, -130.56973266601562, -127.52286529541016, -124.47600555419922, -121.42914581298828, -118.38228607177734, -115.3354263305664, -112.28857421875, -109.24171447753906, -106.19485473632812, -103.14799499511719, -100.10113525390625, -97.05427551269531, -94.00741577148438, -90.96055603027344, -87.9136962890625, -84.8668441772461, -81.81998443603516, -78.77312469482422, -75.72626495361328, -72.6794204711914, -69.63256072998047, -66.58570098876953, -63.53884506225586, -60.49198913574219, -57.44512939453125, -54.39826965332031, -51.351409912109375, -48.3045539855957, -45.257694244384766, -42.210838317871094, -39.163978576660156, -36.11711883544922, -33.07026290893555, -30.02340316772461, -26.976545333862305, -23.9296875, -20.882829666137695, -17.83597183227539, -14.789112091064453, -11.742254257202148, -8.695396423339844, -5.648536682128906, -2.6016788482666016, 0.4451789855957031, 3.492037296295166, 6.538895606994629, 9.58575439453125, 12.632612228393555, 15.67947006225586, 18.726329803466797, 21.7731876373291, 24.820045471191406]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 9.0, 8.0, 10.0, 9.0, 9.0, 10.0, 17.0, 19.0, 17.0, 20.0, 23.0, 27.0, 32.0, 23.0, 25.0, 41.0, 27.0, 50.0, 34.0, 34.0, 49.0, 39.0, 44.0, 40.0, 40.0, 39.0, 37.0, 23.0, 24.0, 25.0, 30.0, 19.0, 19.0, 17.0, 13.0, 15.0, 11.0, 15.0, 8.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.906139373779297, -19.24754524230957, -18.58894920349121, -17.930355072021484, -17.271759033203125, -16.6131649017334, -15.954569816589355, -15.295974731445312, -14.63737964630127, -13.978784561157227, -13.320189476013184, -12.66159439086914, -12.003000259399414, -11.344404220581055, -10.685810089111328, -10.027215003967285, -9.368619918823242, -8.7100248336792, -8.051429748535156, -7.3928351402282715, -6.7342400550842285, -6.0756449699401855, -5.417050361633301, -4.758455276489258, -4.099860191345215, -3.441265106201172, -2.782670259475708, -2.124075412750244, -1.4654803276062012, -0.8068852424621582, -0.14829039573669434, 0.5103044509887695, 1.1689014434814453, 1.8274964094161987, 2.486091375350952, 3.144686222076416, 3.803281307220459, 4.461876392364502, 5.120471000671387, 5.77906608581543, 6.437661170959473, 7.096256256103516, 7.754851341247559, 8.413446426391602, 9.072040557861328, 9.730636596679688, 10.389230728149414, 11.047825813293457, 11.7064208984375, 12.365015983581543, 13.023611068725586, 13.682206153869629, 14.340801239013672, 14.999395370483398, 15.657990455627441, 16.316585540771484, 16.975181579589844, 17.63377571105957, 18.29237174987793, 18.950965881347656, 19.609561920166016, 20.268156051635742, 20.9267520904541, 21.585346221923828, 22.243940353393555]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 10.0, 5.0, 7.0, 10.0, 7.0, 12.0, 14.0, 14.0, 22.0, 20.0, 21.0, 14.0, 23.0, 29.0, 40.0, 32.0, 37.0, 32.0, 46.0, 22.0, 37.0, 28.0, 50.0, 41.0, 48.0, 36.0, 40.0, 29.0, 33.0, 24.0, 18.0, 23.0, 20.0, 17.0, 26.0, 21.0, 21.0, 17.0, 12.0, 7.0, 12.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.177734375, -2.107421875, -2.037109375, -1.966796875, -1.896484375, -1.826171875, -1.755859375, -1.685546875, -1.615234375, -1.544921875, -1.474609375, -1.404296875, -1.333984375, -1.263671875, -1.193359375, -1.123046875, -1.052734375, -0.982421875, -0.912109375, -0.841796875, -0.771484375, -0.701171875, -0.630859375, -0.560546875, -0.490234375, -0.419921875, -0.349609375, -0.279296875, -0.208984375, -0.138671875, -0.068359375, 0.001953125, 0.072265625, 0.142578125, 0.212890625, 0.283203125, 0.353515625, 0.423828125, 0.494140625, 0.564453125, 0.634765625, 0.705078125, 0.775390625, 0.845703125, 0.916015625, 0.986328125, 1.056640625, 1.126953125, 1.197265625, 1.267578125, 1.337890625, 1.408203125, 1.478515625, 1.548828125, 1.619140625, 1.689453125, 1.759765625, 1.830078125, 1.900390625, 1.970703125, 2.041015625, 2.111328125, 2.181640625, 2.251953125, 2.322265625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 8.0, 8.0, 11.0, 13.0, 24.0, 38.0, 58.0, 66.0, 111.0, 162.0, 226.0, 338.0, 482.0, 700.0, 983.0, 1449.0, 2053.0, 2925.0, 4291.0, 6130.0, 8811.0, 12756.0, 18585.0, 27513.0, 41772.0, 67127.0, 116498.0, 297536.0, 182195.0, 91381.0, 54424.0, 34814.0, 23245.0, 15891.0, 10958.0, 7680.0, 5327.0, 3673.0, 2565.0, 1770.0, 1204.0, 864.0, 583.0, 396.0, 272.0, 189.0, 151.0, 98.0, 60.0, 53.0, 32.0, 20.0, 14.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.4853515625, -0.4695892333984375, -0.453826904296875, -0.4380645751953125, -0.42230224609375, -0.4065399169921875, -0.390777587890625, -0.3750152587890625, -0.3592529296875, -0.3434906005859375, -0.327728271484375, -0.3119659423828125, -0.29620361328125, -0.2804412841796875, -0.264678955078125, -0.2489166259765625, -0.233154296875, -0.2173919677734375, -0.201629638671875, -0.1858673095703125, -0.17010498046875, -0.1543426513671875, -0.138580322265625, -0.1228179931640625, -0.1070556640625, -0.0912933349609375, -0.075531005859375, -0.0597686767578125, -0.04400634765625, -0.0282440185546875, -0.012481689453125, 0.0032806396484375, 0.01904296875, 0.0348052978515625, 0.050567626953125, 0.0663299560546875, 0.08209228515625, 0.0978546142578125, 0.113616943359375, 0.1293792724609375, 0.1451416015625, 0.1609039306640625, 0.176666259765625, 0.1924285888671875, 0.20819091796875, 0.2239532470703125, 0.239715576171875, 0.2554779052734375, 0.271240234375, 0.2870025634765625, 0.302764892578125, 0.3185272216796875, 0.33428955078125, 0.3500518798828125, 0.365814208984375, 0.3815765380859375, 0.3973388671875, 0.4131011962890625, 0.428863525390625, 0.4446258544921875, 0.46038818359375, 0.4761505126953125, 0.491912841796875, 0.5076751708984375, 0.5234375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0, 9.0, 12.0, 8.0, 9.0, 20.0, 20.0, 13.0, 27.0, 20.0, 30.0, 35.0, 42.0, 46.0, 43.0, 32.0, 42.0, 40.0, 47.0, 1063.0, 37.0, 32.0, 39.0, 27.0, 34.0, 50.0, 21.0, 30.0, 33.0, 32.0, 24.0, 13.0, 17.0, 9.0, 16.0, 7.0, 12.0, 6.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.3717498779296875, -1.323577880859375, -1.2754058837890625, -1.22723388671875, -1.1790618896484375, -1.130889892578125, -1.0827178955078125, -1.0345458984375, -0.9863739013671875, -0.938201904296875, -0.8900299072265625, -0.84185791015625, -0.7936859130859375, -0.745513916015625, -0.6973419189453125, -0.649169921875, -0.6009979248046875, -0.552825927734375, -0.5046539306640625, -0.45648193359375, -0.4083099365234375, -0.360137939453125, -0.3119659423828125, -0.2637939453125, -0.2156219482421875, -0.167449951171875, -0.1192779541015625, -0.07110595703125, -0.0229339599609375, 0.025238037109375, 0.0734100341796875, 0.12158203125, 0.1697540283203125, 0.217926025390625, 0.2660980224609375, 0.31427001953125, 0.3624420166015625, 0.410614013671875, 0.4587860107421875, 0.5069580078125, 0.5551300048828125, 0.603302001953125, 0.6514739990234375, 0.69964599609375, 0.7478179931640625, 0.795989990234375, 0.8441619873046875, 0.892333984375, 0.9405059814453125, 0.988677978515625, 1.0368499755859375, 1.08502197265625, 1.1331939697265625, 1.181365966796875, 1.2295379638671875, 1.2777099609375, 1.3258819580078125, 1.374053955078125, 1.4222259521484375, 1.47039794921875, 1.5185699462890625, 1.566741943359375, 1.6149139404296875, 1.6630859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 4.0, 5.0, 8.0, 9.0, 20.0, 27.0, 27.0, 44.0, 82.0, 79.0, 133.0, 223.0, 304.0, 459.0, 620.0, 1146.0, 1572.0, 2649.0, 4330.0, 7165.0, 11838.0, 20521.0, 36493.0, 66515.0, 125244.0, 1387818.0, 209345.0, 97256.0, 52282.0, 28964.0, 16537.0, 9608.0, 5846.0, 3539.0, 2363.0, 1440.0, 872.0, 607.0, 393.0, 267.0, 145.0, 119.0, 78.0, 41.0, 28.0, 27.0, 15.0, 8.0, 10.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.6494140625, -0.6302032470703125, -0.610992431640625, -0.5917816162109375, -0.57257080078125, -0.5533599853515625, -0.534149169921875, -0.5149383544921875, -0.4957275390625, -0.4765167236328125, -0.457305908203125, -0.4380950927734375, -0.41888427734375, -0.3996734619140625, -0.380462646484375, -0.3612518310546875, -0.342041015625, -0.3228302001953125, -0.303619384765625, -0.2844085693359375, -0.26519775390625, -0.2459869384765625, -0.226776123046875, -0.2075653076171875, -0.1883544921875, -0.1691436767578125, -0.149932861328125, -0.1307220458984375, -0.11151123046875, -0.0923004150390625, -0.073089599609375, -0.0538787841796875, -0.03466796875, -0.0154571533203125, 0.003753662109375, 0.0229644775390625, 0.04217529296875, 0.0613861083984375, 0.080596923828125, 0.0998077392578125, 0.1190185546875, 0.1382293701171875, 0.157440185546875, 0.1766510009765625, 0.19586181640625, 0.2150726318359375, 0.234283447265625, 0.2534942626953125, 0.272705078125, 0.2919158935546875, 0.311126708984375, 0.3303375244140625, 0.34954833984375, 0.3687591552734375, 0.387969970703125, 0.4071807861328125, 0.4263916015625, 0.4456024169921875, 0.464813232421875, 0.4840240478515625, 0.50323486328125, 0.5224456787109375, 0.541656494140625, 0.5608673095703125, 0.580078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 10.0, 18.0, 17.0, 21.0, 18.0, 25.0, 41.0, 67.0, 73.0, 78.0, 116.0, 88.0, 84.0, 66.0, 51.0, 38.0, 30.0, 26.0, 12.0, 21.0, 12.0, 21.0, 8.0, 9.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0005950927734375, -0.000578068196773529, -0.0005610436201095581, -0.0005440190434455872, -0.0005269944667816162, -0.0005099698901176453, -0.0004929453134536743, -0.00047592073678970337, -0.0004588961601257324, -0.0004418715834617615, -0.00042484700679779053, -0.0004078224301338196, -0.00039079785346984863, -0.0003737732768058777, -0.00035674870014190674, -0.0003397241234779358, -0.00032269954681396484, -0.0003056749701499939, -0.00028865039348602295, -0.000271625816822052, -0.00025460124015808105, -0.0002375766634941101, -0.00022055208683013916, -0.0002035275101661682, -0.00018650293350219727, -0.00016947835683822632, -0.00015245378017425537, -0.00013542920351028442, -0.00011840462684631348, -0.00010138005018234253, -8.435547351837158e-05, -6.733089685440063e-05, -5.030632019042969e-05, -3.328174352645874e-05, -1.6257166862487793e-05, 7.674098014831543e-07, 1.77919864654541e-05, 3.481656312942505e-05, 5.1841139793395996e-05, 6.886571645736694e-05, 8.589029312133789e-05, 0.00010291486978530884, 0.00011993944644927979, 0.00013696402311325073, 0.00015398859977722168, 0.00017101317644119263, 0.00018803775310516357, 0.00020506232976913452, 0.00022208690643310547, 0.00023911148309707642, 0.00025613605976104736, 0.0002731606364250183, 0.00029018521308898926, 0.0003072097897529602, 0.00032423436641693115, 0.0003412589430809021, 0.00035828351974487305, 0.000375308096408844, 0.00039233267307281494, 0.0004093572497367859, 0.00042638182640075684, 0.0004434064030647278, 0.00046043097972869873, 0.0004774555563926697, 0.0004944801330566406]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 2.0, 6.0, 1.0, 3.0, 9.0, 9.0, 13.0, 12.0, 19.0, 24.0, 40.0, 30.0, 44.0, 63.0, 109.0, 112.0, 221.0, 457.0, 2615.0, 1028139.0, 15160.0, 595.0, 262.0, 187.0, 118.0, 67.0, 54.0, 40.0, 28.0, 20.0, 21.0, 9.0, 16.0, 18.0, 9.0, 6.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00975799560546875, -0.009428858757019043, -0.009099721908569336, -0.008770585060119629, -0.008441448211669922, -0.008112311363220215, -0.007783174514770508, -0.007454037666320801, -0.007124900817871094, -0.006795763969421387, -0.00646662712097168, -0.006137490272521973, -0.005808353424072266, -0.005479216575622559, -0.0051500797271728516, -0.0048209428787231445, -0.0044918060302734375, -0.0041626691818237305, -0.0038335323333740234, -0.0035043954849243164, -0.0031752586364746094, -0.0028461217880249023, -0.0025169849395751953, -0.0021878480911254883, -0.0018587112426757812, -0.0015295743942260742, -0.0012004375457763672, -0.0008713006973266602, -0.0005421638488769531, -0.0002130270004272461, 0.00011610984802246094, 0.00044524669647216797, 0.000774383544921875, 0.001103520393371582, 0.001432657241821289, 0.001761794090270996, 0.002090930938720703, 0.00242006778717041, 0.002749204635620117, 0.0030783414840698242, 0.0034074783325195312, 0.0037366151809692383, 0.004065752029418945, 0.004394888877868652, 0.004724025726318359, 0.005053162574768066, 0.0053822994232177734, 0.0057114362716674805, 0.0060405731201171875, 0.0063697099685668945, 0.0066988468170166016, 0.007027983665466309, 0.007357120513916016, 0.007686257362365723, 0.00801539421081543, 0.008344531059265137, 0.008673667907714844, 0.00900280475616455, 0.009331941604614258, 0.009661078453063965, 0.009990215301513672, 0.010319352149963379, 0.010648488998413086, 0.010977625846862793, 0.0113067626953125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 63.0, 688.0, 259.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002278360305353999, -0.002217974280938506, -0.0021575884893536568, -0.0020972024649381638, -0.0020368166733533144, -0.0019764306489378214, -0.0019160447409376502, -0.001855658832937479, -0.0017952729249373078, -0.0017348870169371367, -0.0016745011089369655, -0.0016141152009367943, -0.0015537291765213013, -0.001493343384936452, -0.001432957360520959, -0.0013725714525207877, -0.0013121855445206165, -0.0012517996365204453, -0.0011914137285202742, -0.001131027820520103, -0.0010706419125199318, -0.0010102558881044388, -0.0009498699801042676, -0.0008894840721040964, -0.0008290981641039252, -0.000768712256103754, -0.0007083263481035829, -0.0006479403818957508, -0.0005875544738955796, -0.0005271685658954084, -0.00046678262879140675, -0.0004063966916874051, -0.0003460106672719121, -0.0002856247592717409, -0.00022523882216773927, -0.00016485289961565286, -0.00010446697706356645, -4.408106906339526e-05, 1.630486804060638e-05, 7.669080514460802e-05, 0.0001370767131447792, 0.00019746263569686562, 0.00025784855824895203, 0.00031823449535295367, 0.00037862040335312486, 0.00043900631135329604, 0.0004993922775611281, 0.0005597781855612993, 0.0006201640935614705, 0.0006805500015616417, 0.0007409359095618129, 0.000801321875769645, 0.0008617077837698162, 0.0009220936917699873, 0.0009824796579778194, 0.0010428655659779906, 0.0011032514739781618, 0.001163637381978333, 0.0012240232899785042, 0.0012844091979786754, 0.0013447951059788465, 0.0014051811303943396, 0.0014655670383945107, 0.001525952946394682, 0.0015863388543948531]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 13.0, 10.0, 15.0, 15.0, 23.0, 16.0, 38.0, 23.0, 28.0, 35.0, 30.0, 38.0, 37.0, 48.0, 55.0, 54.0, 38.0, 51.0, 44.0, 42.0, 38.0, 33.0, 40.0, 38.0, 29.0, 30.0, 18.0, 25.0, 6.0, 15.0, 12.0, 11.0, 13.0, 8.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000260770320892334, -0.0002523651346564293, -0.0002439599484205246, -0.0002355547621846199, -0.0002271495759487152, -0.00021874438971281052, -0.00021033920347690582, -0.00020193401724100113, -0.00019352883100509644, -0.00018512364476919174, -0.00017671845853328705, -0.00016831327229738235, -0.00015990808606147766, -0.00015150289982557297, -0.00014309771358966827, -0.00013469252735376358, -0.0001262873411178589, -0.00011788215488195419, -0.0001094769686460495, -0.0001010717824101448, -9.266659617424011e-05, -8.426140993833542e-05, -7.585622370243073e-05, -6.745103746652603e-05, -5.904585123062134e-05, -5.0640664994716644e-05, -4.223547875881195e-05, -3.383029252290726e-05, -2.5425106287002563e-05, -1.701992005109787e-05, -8.614733815193176e-06, -2.0954757928848267e-07, 8.195638656616211e-06, 1.6600824892520905e-05, 2.5006011128425598e-05, 3.341119736433029e-05, 4.1816383600234985e-05, 5.022156983613968e-05, 5.862675607204437e-05, 6.703194230794907e-05, 7.543712854385376e-05, 8.384231477975845e-05, 9.224750101566315e-05, 0.00010065268725156784, 0.00010905787348747253, 0.00011746305972337723, 0.00012586824595928192, 0.00013427343219518661, 0.0001426786184310913, 0.000151083804666996, 0.0001594889909029007, 0.0001678941771388054, 0.00017629936337471008, 0.00018470454961061478, 0.00019310973584651947, 0.00020151492208242416, 0.00020992010831832886, 0.00021832529455423355, 0.00022673048079013824, 0.00023513566702604294, 0.00024354085326194763, 0.0002519460394978523, 0.000260351225733757, 0.0002687564119696617, 0.0002771615982055664]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 10.0, 5.0, 7.0, 10.0, 7.0, 12.0, 14.0, 14.0, 22.0, 20.0, 21.0, 14.0, 23.0, 29.0, 40.0, 32.0, 37.0, 32.0, 46.0, 22.0, 37.0, 27.0, 51.0, 41.0, 48.0, 36.0, 40.0, 29.0, 33.0, 24.0, 18.0, 23.0, 20.0, 17.0, 26.0, 21.0, 21.0, 17.0, 12.0, 7.0, 12.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.177734375, -2.107421875, -2.037109375, -1.966796875, -1.896484375, -1.826171875, -1.755859375, -1.685546875, -1.615234375, -1.544921875, -1.474609375, -1.404296875, -1.333984375, -1.263671875, -1.193359375, -1.123046875, -1.052734375, -0.982421875, -0.912109375, -0.841796875, -0.771484375, -0.701171875, -0.630859375, -0.560546875, -0.490234375, -0.419921875, -0.349609375, -0.279296875, -0.208984375, -0.138671875, -0.068359375, 0.001953125, 0.072265625, 0.142578125, 0.212890625, 0.283203125, 0.353515625, 0.423828125, 0.494140625, 0.564453125, 0.634765625, 0.705078125, 0.775390625, 0.845703125, 0.916015625, 0.986328125, 1.056640625, 1.126953125, 1.197265625, 1.267578125, 1.337890625, 1.408203125, 1.478515625, 1.548828125, 1.619140625, 1.689453125, 1.759765625, 1.830078125, 1.900390625, 1.970703125, 2.041015625, 2.111328125, 2.181640625, 2.251953125, 2.322265625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 6.0, 10.0, 13.0, 25.0, 22.0, 28.0, 24.0, 52.0, 62.0, 69.0, 106.0, 141.0, 229.0, 323.0, 570.0, 963.0, 1591.0, 2944.0, 6830.0, 17918.0, 54860.0, 198112.0, 453141.0, 216716.0, 59894.0, 19076.0, 7280.0, 3293.0, 1563.0, 948.0, 538.0, 334.0, 253.0, 156.0, 109.0, 88.0, 63.0, 58.0, 32.0, 31.0, 16.0, 13.0, 16.0, 12.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.407806396484375, -2.32342529296875, -2.239044189453125, -2.1546630859375, -2.070281982421875, -1.98590087890625, -1.901519775390625, -1.817138671875, -1.732757568359375, -1.64837646484375, -1.563995361328125, -1.4796142578125, -1.395233154296875, -1.31085205078125, -1.226470947265625, -1.14208984375, -1.057708740234375, -0.97332763671875, -0.888946533203125, -0.8045654296875, -0.720184326171875, -0.63580322265625, -0.551422119140625, -0.467041015625, -0.382659912109375, -0.29827880859375, -0.213897705078125, -0.1295166015625, -0.045135498046875, 0.03924560546875, 0.123626708984375, 0.2080078125, 0.292388916015625, 0.37677001953125, 0.461151123046875, 0.5455322265625, 0.629913330078125, 0.71429443359375, 0.798675537109375, 0.883056640625, 0.967437744140625, 1.05181884765625, 1.136199951171875, 1.2205810546875, 1.304962158203125, 1.38934326171875, 1.473724365234375, 1.55810546875, 1.642486572265625, 1.72686767578125, 1.811248779296875, 1.8956298828125, 1.980010986328125, 2.06439208984375, 2.148773193359375, 2.233154296875, 2.317535400390625, 2.40191650390625, 2.486297607421875, 2.5706787109375, 2.655059814453125, 2.73944091796875, 2.823822021484375, 2.908203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 7.0, 9.0, 12.0, 13.0, 10.0, 16.0, 29.0, 27.0, 41.0, 38.0, 27.0, 42.0, 58.0, 63.0, 117.0, 425.0, 1526.0, 119.0, 71.0, 35.0, 49.0, 45.0, 33.0, 41.0, 41.0, 28.0, 24.0, 16.0, 10.0, 17.0, 12.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.09375, -9.7974853515625, -9.501220703125, -9.2049560546875, -8.90869140625, -8.6124267578125, -8.316162109375, -8.0198974609375, -7.7236328125, -7.4273681640625, -7.131103515625, -6.8348388671875, -6.53857421875, -6.2423095703125, -5.946044921875, -5.6497802734375, -5.353515625, -5.0572509765625, -4.760986328125, -4.4647216796875, -4.16845703125, -3.8721923828125, -3.575927734375, -3.2796630859375, -2.9833984375, -2.6871337890625, -2.390869140625, -2.0946044921875, -1.79833984375, -1.5020751953125, -1.205810546875, -0.9095458984375, -0.61328125, -0.3170166015625, -0.020751953125, 0.2755126953125, 0.57177734375, 0.8680419921875, 1.164306640625, 1.4605712890625, 1.7568359375, 2.0531005859375, 2.349365234375, 2.6456298828125, 2.94189453125, 3.2381591796875, 3.534423828125, 3.8306884765625, 4.126953125, 4.4232177734375, 4.719482421875, 5.0157470703125, 5.31201171875, 5.6082763671875, 5.904541015625, 6.2008056640625, 6.4970703125, 6.7933349609375, 7.089599609375, 7.3858642578125, 7.68212890625, 7.9783935546875, 8.274658203125, 8.5709228515625, 8.8671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 7.0, 15.0, 14.0, 20.0, 18.0, 26.0, 39.0, 51.0, 51.0, 80.0, 109.0, 193.0, 386.0, 968.0, 7059.0, 782772.0, 2341593.0, 9991.0, 1243.0, 441.0, 178.0, 100.0, 78.0, 57.0, 54.0, 42.0, 16.0, 17.0, 15.0, 13.0, 12.0, 10.0, 6.0, 7.0, 4.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.921875, -15.42529296875, -14.9287109375, -14.43212890625, -13.935546875, -13.43896484375, -12.9423828125, -12.44580078125, -11.94921875, -11.45263671875, -10.9560546875, -10.45947265625, -9.962890625, -9.46630859375, -8.9697265625, -8.47314453125, -7.9765625, -7.47998046875, -6.9833984375, -6.48681640625, -5.990234375, -5.49365234375, -4.9970703125, -4.50048828125, -4.00390625, -3.50732421875, -3.0107421875, -2.51416015625, -2.017578125, -1.52099609375, -1.0244140625, -0.52783203125, -0.03125, 0.46533203125, 0.9619140625, 1.45849609375, 1.955078125, 2.45166015625, 2.9482421875, 3.44482421875, 3.94140625, 4.43798828125, 4.9345703125, 5.43115234375, 5.927734375, 6.42431640625, 6.9208984375, 7.41748046875, 7.9140625, 8.41064453125, 8.9072265625, 9.40380859375, 9.900390625, 10.39697265625, 10.8935546875, 11.39013671875, 11.88671875, 12.38330078125, 12.8798828125, 13.37646484375, 13.873046875, 14.36962890625, 14.8662109375, 15.36279296875, 15.859375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [24.0, 989.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.454665184020996, -2.6199545860290527, 3.2147560119628906, 9.049466133117676, 14.884177207946777, 20.718887329101562, 26.55359649658203, 32.388309478759766, 38.223018646240234, 44.0577278137207, 49.89244079589844, 55.727149963378906, 61.561859130859375, 67.39657592773438, 73.23127746582031, 79.06599426269531, 84.90070343017578, 90.73541259765625, 96.57012176513672, 102.40483093261719, 108.23954772949219, 114.07425689697266, 119.90896606445312, 125.74368286132812, 131.57838439941406, 137.41310119628906, 143.247802734375, 149.08251953125, 154.91722106933594, 160.75193786621094, 166.58663940429688, 172.42135620117188, 178.25608825683594, 184.09080505371094, 189.92550659179688, 195.76022338867188, 201.5949249267578, 207.4296417236328, 213.26434326171875, 219.09906005859375, 224.93377685546875, 230.76849365234375, 236.6031951904297, 242.4379119873047, 248.27261352539062, 254.10733032226562, 259.9420471191406, 265.7767639160156, 271.6114501953125, 277.4461669921875, 283.2808837890625, 289.1155700683594, 294.9502868652344, 300.7850036621094, 306.6197204589844, 312.4544372558594, 318.2891540527344, 324.1238708496094, 329.9585876464844, 335.79327392578125, 341.62799072265625, 347.46270751953125, 353.29742431640625, 359.13214111328125, 364.9668273925781]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 6.0, 13.0, 9.0, 15.0, 15.0, 21.0, 18.0, 23.0, 30.0, 30.0, 27.0, 38.0, 40.0, 39.0, 44.0, 39.0, 38.0, 33.0, 47.0, 33.0, 49.0, 41.0, 41.0, 38.0, 38.0, 30.0, 31.0, 28.0, 19.0, 19.0, 19.0, 14.0, 12.0, 11.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.91810417175293, -28.028846740722656, -27.139589309692383, -26.250329971313477, -25.361072540283203, -24.47181510925293, -23.582557678222656, -22.69329833984375, -21.804040908813477, -20.914783477783203, -20.02552604675293, -19.136266708374023, -18.24700927734375, -17.357751846313477, -16.468494415283203, -15.579236030578613, -14.68997859954834, -13.800721168518066, -12.911462783813477, -12.022205352783203, -11.132946968078613, -10.24368953704834, -9.35443115234375, -8.465173721313477, -7.575915813446045, -6.686657905578613, -5.797399997711182, -4.90814208984375, -4.018884658813477, -3.129626750946045, -2.2403688430786133, -1.3511109352111816, -0.46185302734375, 0.42740482091903687, 1.3166626691818237, 2.205920457839966, 3.0951783657073975, 3.98443603515625, 4.873693943023682, 5.762951850891113, 6.652209758758545, 7.541467666625977, 8.43072509765625, 9.31998348236084, 10.209240913391113, 11.098499298095703, 11.987756729125977, 12.87701416015625, 13.76627254486084, 14.655529975891113, 15.544788360595703, 16.434045791625977, 17.32330322265625, 18.212562561035156, 19.10181999206543, 19.991077423095703, 20.880334854125977, 21.76959228515625, 22.658849716186523, 23.54810905456543, 24.437366485595703, 25.326623916625977, 26.21588134765625, 27.105140686035156, 27.99439811706543]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 4.0, 5.0, 7.0, 7.0, 12.0, 8.0, 13.0, 16.0, 21.0, 18.0, 19.0, 21.0, 22.0, 19.0, 30.0, 35.0, 44.0, 44.0, 39.0, 33.0, 38.0, 46.0, 32.0, 37.0, 37.0, 51.0, 43.0, 37.0, 23.0, 18.0, 24.0, 18.0, 23.0, 21.0, 17.0, 23.0, 23.0, 21.0, 15.0, 6.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.244140625, -2.169219970703125, -2.09429931640625, -2.019378662109375, -1.9444580078125, -1.869537353515625, -1.79461669921875, -1.719696044921875, -1.644775390625, -1.569854736328125, -1.49493408203125, -1.420013427734375, -1.3450927734375, -1.270172119140625, -1.19525146484375, -1.120330810546875, -1.04541015625, -0.970489501953125, -0.89556884765625, -0.820648193359375, -0.7457275390625, -0.670806884765625, -0.59588623046875, -0.520965576171875, -0.446044921875, -0.371124267578125, -0.29620361328125, -0.221282958984375, -0.1463623046875, -0.071441650390625, 0.00347900390625, 0.078399658203125, 0.1533203125, 0.228240966796875, 0.30316162109375, 0.378082275390625, 0.4530029296875, 0.527923583984375, 0.60284423828125, 0.677764892578125, 0.752685546875, 0.827606201171875, 0.90252685546875, 0.977447509765625, 1.0523681640625, 1.127288818359375, 1.20220947265625, 1.277130126953125, 1.35205078125, 1.426971435546875, 1.50189208984375, 1.576812744140625, 1.6517333984375, 1.726654052734375, 1.80157470703125, 1.876495361328125, 1.951416015625, 2.026336669921875, 2.10125732421875, 2.176177978515625, 2.2510986328125, 2.326019287109375, 2.40093994140625, 2.475860595703125, 2.55078125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 4.0, 8.0, 17.0, 20.0, 22.0, 20.0, 35.0, 60.0, 66.0, 111.0, 168.0, 360.0, 643.0, 1495.0, 4384.0, 15122.0, 68867.0, 431227.0, 1808287.0, 1498927.0, 296845.0, 49883.0, 11635.0, 3447.0, 1253.0, 511.0, 284.0, 184.0, 105.0, 68.0, 48.0, 30.0, 24.0, 24.0, 15.0, 12.0, 10.0, 18.0, 8.0, 3.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.44921875, -4.3004150390625, -4.151611328125, -4.0028076171875, -3.85400390625, -3.7052001953125, -3.556396484375, -3.4075927734375, -3.2587890625, -3.1099853515625, -2.961181640625, -2.8123779296875, -2.66357421875, -2.5147705078125, -2.365966796875, -2.2171630859375, -2.068359375, -1.9195556640625, -1.770751953125, -1.6219482421875, -1.47314453125, -1.3243408203125, -1.175537109375, -1.0267333984375, -0.8779296875, -0.7291259765625, -0.580322265625, -0.4315185546875, -0.28271484375, -0.1339111328125, 0.014892578125, 0.1636962890625, 0.3125, 0.4613037109375, 0.610107421875, 0.7589111328125, 0.90771484375, 1.0565185546875, 1.205322265625, 1.3541259765625, 1.5029296875, 1.6517333984375, 1.800537109375, 1.9493408203125, 2.09814453125, 2.2469482421875, 2.395751953125, 2.5445556640625, 2.693359375, 2.8421630859375, 2.990966796875, 3.1397705078125, 3.28857421875, 3.4373779296875, 3.586181640625, 3.7349853515625, 3.8837890625, 4.0325927734375, 4.181396484375, 4.3302001953125, 4.47900390625, 4.6278076171875, 4.776611328125, 4.9254150390625, 5.07421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 9.0, 12.0, 15.0, 20.0, 32.0, 44.0, 62.0, 98.0, 125.0, 176.0, 240.0, 317.0, 403.0, 474.0, 452.0, 411.0, 319.0, 223.0, 151.0, 131.0, 74.0, 73.0, 43.0, 41.0, 36.0, 21.0, 10.0, 14.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.8203125, -8.5938720703125, -8.367431640625, -8.1409912109375, -7.91455078125, -7.6881103515625, -7.461669921875, -7.2352294921875, -7.0087890625, -6.7823486328125, -6.555908203125, -6.3294677734375, -6.10302734375, -5.8765869140625, -5.650146484375, -5.4237060546875, -5.197265625, -4.9708251953125, -4.744384765625, -4.5179443359375, -4.29150390625, -4.0650634765625, -3.838623046875, -3.6121826171875, -3.3857421875, -3.1593017578125, -2.932861328125, -2.7064208984375, -2.47998046875, -2.2535400390625, -2.027099609375, -1.8006591796875, -1.57421875, -1.3477783203125, -1.121337890625, -0.8948974609375, -0.66845703125, -0.4420166015625, -0.215576171875, 0.0108642578125, 0.2373046875, 0.4637451171875, 0.690185546875, 0.9166259765625, 1.14306640625, 1.3695068359375, 1.595947265625, 1.8223876953125, 2.048828125, 2.2752685546875, 2.501708984375, 2.7281494140625, 2.95458984375, 3.1810302734375, 3.407470703125, 3.6339111328125, 3.8603515625, 4.0867919921875, 4.313232421875, 4.5396728515625, 4.76611328125, 4.9925537109375, 5.218994140625, 5.4454345703125, 5.671875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 5.0, 10.0, 10.0, 18.0, 17.0, 25.0, 44.0, 53.0, 82.0, 136.0, 215.0, 515.0, 2429.0, 99322.0, 4010479.0, 77596.0, 2136.0, 538.0, 232.0, 141.0, 64.0, 60.0, 46.0, 38.0, 17.0, 16.0, 4.0, 10.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.125, -23.2138671875, -22.302734375, -21.3916015625, -20.48046875, -19.5693359375, -18.658203125, -17.7470703125, -16.8359375, -15.9248046875, -15.013671875, -14.1025390625, -13.19140625, -12.2802734375, -11.369140625, -10.4580078125, -9.546875, -8.6357421875, -7.724609375, -6.8134765625, -5.90234375, -4.9912109375, -4.080078125, -3.1689453125, -2.2578125, -1.3466796875, -0.435546875, 0.4755859375, 1.38671875, 2.2978515625, 3.208984375, 4.1201171875, 5.03125, 5.9423828125, 6.853515625, 7.7646484375, 8.67578125, 9.5869140625, 10.498046875, 11.4091796875, 12.3203125, 13.2314453125, 14.142578125, 15.0537109375, 15.96484375, 16.8759765625, 17.787109375, 18.6982421875, 19.609375, 20.5205078125, 21.431640625, 22.3427734375, 23.25390625, 24.1650390625, 25.076171875, 25.9873046875, 26.8984375, 27.8095703125, 28.720703125, 29.6318359375, 30.54296875, 31.4541015625, 32.365234375, 33.2763671875, 34.1875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 10.0, 38.0, 158.0, 330.0, 303.0, 137.0, 29.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.01701354980469, -117.21588897705078, -114.41476440429688, -111.61363983154297, -108.81251525878906, -106.01139068603516, -103.21026611328125, -100.40913391113281, -97.60801696777344, -94.80689239501953, -92.00576782226562, -89.20464324951172, -86.40351867675781, -83.6023941040039, -80.80126953125, -78.00013732910156, -75.19901275634766, -72.39788818359375, -69.59676361083984, -66.79563903808594, -63.99451446533203, -61.193389892578125, -58.39226150512695, -55.59113693237305, -52.79001235961914, -49.988887786865234, -47.18776321411133, -44.386634826660156, -41.58551025390625, -38.784385681152344, -35.98326110839844, -33.18213653564453, -30.38100814819336, -27.579883575439453, -24.778759002685547, -21.977632522583008, -19.1765079498291, -16.375383377075195, -13.574256896972656, -10.77313232421875, -7.972007751464844, -5.170882701873779, -2.369757652282715, 0.4313678741455078, 3.232492446899414, 6.03361701965332, 8.83474349975586, 11.635868072509766, 14.436992645263672, 17.238117218017578, 20.039241790771484, 22.840368270874023, 25.64149284362793, 28.442617416381836, 31.243743896484375, 34.04486846923828, 36.84599304199219, 39.647117614746094, 42.4482421875, 45.249366760253906, 48.05049133300781, 50.85161590576172, 53.65274429321289, 56.4538688659668, 59.2549934387207]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 8.0, 5.0, 9.0, 16.0, 19.0, 19.0, 22.0, 23.0, 24.0, 22.0, 41.0, 31.0, 26.0, 43.0, 29.0, 35.0, 47.0, 39.0, 43.0, 46.0, 48.0, 44.0, 37.0, 34.0, 27.0, 40.0, 25.0, 32.0, 31.0, 25.0, 15.0, 18.0, 12.0, 10.0, 13.0, 6.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-27.347843170166016, -26.58557891845703, -25.823314666748047, -25.061052322387695, -24.29878807067871, -23.536523818969727, -22.774261474609375, -22.01199722290039, -21.249732971191406, -20.487468719482422, -19.725204467773438, -18.962942123413086, -18.2006778717041, -17.438413619995117, -16.676151275634766, -15.913887023925781, -15.151622772216797, -14.389358520507812, -13.627095222473145, -12.864831924438477, -12.102567672729492, -11.340303421020508, -10.57804012298584, -9.815776824951172, -9.053512573242188, -8.291248321533203, -7.528985023498535, -6.766721248626709, -6.004457473754883, -5.242193698883057, -4.4799299240112305, -3.7176661491394043, -2.955402374267578, -2.193138599395752, -1.4308748245239258, -0.6686110496520996, 0.09365272521972656, 0.8559165000915527, 1.618180274963379, 2.380444049835205, 3.1427078247070312, 3.9049715995788574, 4.667235374450684, 5.42949914932251, 6.191762924194336, 6.954026699066162, 7.716290473937988, 8.478553771972656, 9.24081802368164, 10.003082275390625, 10.765345573425293, 11.527608871459961, 12.289873123168945, 13.05213737487793, 13.814400672912598, 14.576663970947266, 15.33892822265625, 16.101192474365234, 16.86345672607422, 17.62571907043457, 18.387983322143555, 19.15024757385254, 19.91250991821289, 20.674774169921875, 21.43703842163086]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 8.0, 13.0, 15.0, 13.0, 22.0, 16.0, 15.0, 22.0, 19.0, 24.0, 28.0, 39.0, 44.0, 24.0, 39.0, 52.0, 37.0, 62.0, 39.0, 37.0, 40.0, 37.0, 30.0, 32.0, 32.0, 22.0, 32.0, 30.0, 23.0, 27.0, 17.0, 21.0, 16.0, 19.0, 11.0, 6.0, 7.0, 9.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.57421875, -2.492279052734375, -2.41033935546875, -2.328399658203125, -2.2464599609375, -2.164520263671875, -2.08258056640625, -2.000640869140625, -1.918701171875, -1.836761474609375, -1.75482177734375, -1.672882080078125, -1.5909423828125, -1.509002685546875, -1.42706298828125, -1.345123291015625, -1.26318359375, -1.181243896484375, -1.09930419921875, -1.017364501953125, -0.9354248046875, -0.853485107421875, -0.77154541015625, -0.689605712890625, -0.607666015625, -0.525726318359375, -0.44378662109375, -0.361846923828125, -0.2799072265625, -0.197967529296875, -0.11602783203125, -0.034088134765625, 0.0478515625, 0.129791259765625, 0.21173095703125, 0.293670654296875, 0.3756103515625, 0.457550048828125, 0.53948974609375, 0.621429443359375, 0.703369140625, 0.785308837890625, 0.86724853515625, 0.949188232421875, 1.0311279296875, 1.113067626953125, 1.19500732421875, 1.276947021484375, 1.35888671875, 1.440826416015625, 1.52276611328125, 1.604705810546875, 1.6866455078125, 1.768585205078125, 1.85052490234375, 1.932464599609375, 2.014404296875, 2.096343994140625, 2.17828369140625, 2.260223388671875, 2.3421630859375, 2.424102783203125, 2.50604248046875, 2.587982177734375, 2.669921875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 8.0, 6.0, 9.0, 11.0, 10.0, 22.0, 36.0, 44.0, 76.0, 118.0, 181.0, 263.0, 413.0, 658.0, 1027.0, 1787.0, 2888.0, 4695.0, 7815.0, 12633.0, 21279.0, 35889.0, 64296.0, 123412.0, 342531.0, 211705.0, 92916.0, 50724.0, 28870.0, 17336.0, 10398.0, 6428.0, 3917.0, 2336.0, 1399.0, 825.0, 559.0, 370.0, 228.0, 140.0, 101.0, 67.0, 48.0, 27.0, 18.0, 14.0, 9.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7216796875, -0.699676513671875, -0.67767333984375, -0.655670166015625, -0.6336669921875, -0.611663818359375, -0.58966064453125, -0.567657470703125, -0.545654296875, -0.523651123046875, -0.50164794921875, -0.479644775390625, -0.4576416015625, -0.435638427734375, -0.41363525390625, -0.391632080078125, -0.36962890625, -0.347625732421875, -0.32562255859375, -0.303619384765625, -0.2816162109375, -0.259613037109375, -0.23760986328125, -0.215606689453125, -0.193603515625, -0.171600341796875, -0.14959716796875, -0.127593994140625, -0.1055908203125, -0.083587646484375, -0.06158447265625, -0.039581298828125, -0.017578125, 0.004425048828125, 0.02642822265625, 0.048431396484375, 0.0704345703125, 0.092437744140625, 0.11444091796875, 0.136444091796875, 0.158447265625, 0.180450439453125, 0.20245361328125, 0.224456787109375, 0.2464599609375, 0.268463134765625, 0.29046630859375, 0.312469482421875, 0.33447265625, 0.356475830078125, 0.37847900390625, 0.400482177734375, 0.4224853515625, 0.444488525390625, 0.46649169921875, 0.488494873046875, 0.510498046875, 0.532501220703125, 0.55450439453125, 0.576507568359375, 0.5985107421875, 0.620513916015625, 0.64251708984375, 0.664520263671875, 0.6865234375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 5.0, 2.0, 9.0, 7.0, 10.0, 7.0, 19.0, 19.0, 20.0, 20.0, 28.0, 28.0, 37.0, 43.0, 45.0, 49.0, 39.0, 47.0, 39.0, 1072.0, 41.0, 50.0, 53.0, 40.0, 39.0, 35.0, 34.0, 24.0, 31.0, 19.0, 23.0, 13.0, 12.0, 16.0, 11.0, 8.0, 7.0, 4.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.8671875, -1.810211181640625, -1.75323486328125, -1.696258544921875, -1.6392822265625, -1.582305908203125, -1.52532958984375, -1.468353271484375, -1.411376953125, -1.354400634765625, -1.29742431640625, -1.240447998046875, -1.1834716796875, -1.126495361328125, -1.06951904296875, -1.012542724609375, -0.95556640625, -0.898590087890625, -0.84161376953125, -0.784637451171875, -0.7276611328125, -0.670684814453125, -0.61370849609375, -0.556732177734375, -0.499755859375, -0.442779541015625, -0.38580322265625, -0.328826904296875, -0.2718505859375, -0.214874267578125, -0.15789794921875, -0.100921630859375, -0.0439453125, 0.013031005859375, 0.07000732421875, 0.126983642578125, 0.1839599609375, 0.240936279296875, 0.29791259765625, 0.354888916015625, 0.411865234375, 0.468841552734375, 0.52581787109375, 0.582794189453125, 0.6397705078125, 0.696746826171875, 0.75372314453125, 0.810699462890625, 0.86767578125, 0.924652099609375, 0.98162841796875, 1.038604736328125, 1.0955810546875, 1.152557373046875, 1.20953369140625, 1.266510009765625, 1.323486328125, 1.380462646484375, 1.43743896484375, 1.494415283203125, 1.5513916015625, 1.608367919921875, 1.66534423828125, 1.722320556640625, 1.779296875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 10.0, 18.0, 15.0, 49.0, 43.0, 76.0, 87.0, 156.0, 242.0, 314.0, 612.0, 891.0, 1368.0, 2287.0, 3767.0, 6253.0, 10932.0, 19404.0, 35962.0, 70084.0, 149346.0, 1455715.0, 172565.0, 77228.0, 39165.0, 21001.0, 11738.0, 6950.0, 4102.0, 2496.0, 1559.0, 943.0, 640.0, 390.0, 241.0, 173.0, 107.0, 67.0, 42.0, 29.0, 20.0, 9.0, 9.0, 10.0, 7.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7134780883789062, -0.6901397705078125, -0.6668014526367188, -0.643463134765625, -0.6201248168945312, -0.5967864990234375, -0.5734481811523438, -0.55010986328125, -0.5267715454101562, -0.5034332275390625, -0.48009490966796875, -0.456756591796875, -0.43341827392578125, -0.4100799560546875, -0.38674163818359375, -0.3634033203125, -0.34006500244140625, -0.3167266845703125, -0.29338836669921875, -0.270050048828125, -0.24671173095703125, -0.2233734130859375, -0.20003509521484375, -0.17669677734375, -0.15335845947265625, -0.1300201416015625, -0.10668182373046875, -0.083343505859375, -0.06000518798828125, -0.0366668701171875, -0.01332855224609375, 0.010009765625, 0.03334808349609375, 0.0566864013671875, 0.08002471923828125, 0.103363037109375, 0.12670135498046875, 0.1500396728515625, 0.17337799072265625, 0.19671630859375, 0.22005462646484375, 0.2433929443359375, 0.26673126220703125, 0.290069580078125, 0.31340789794921875, 0.3367462158203125, 0.36008453369140625, 0.3834228515625, 0.40676116943359375, 0.4300994873046875, 0.45343780517578125, 0.476776123046875, 0.5001144409179688, 0.5234527587890625, 0.5467910766601562, 0.57012939453125, 0.5934677124023438, 0.6168060302734375, 0.6401443481445312, 0.663482666015625, 0.6868209838867188, 0.7101593017578125, 0.7334976196289062, 0.7568359375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 2.0, 5.0, 7.0, 8.0, 15.0, 23.0, 23.0, 17.0, 35.0, 34.0, 49.0, 79.0, 105.0, 119.0, 109.0, 87.0, 54.0, 47.0, 28.0, 27.0, 22.0, 17.0, 8.0, 11.0, 5.0, 6.0, 6.0, 8.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005049705505371094, -0.0004903040826320648, -0.00047563761472702026, -0.0004609711468219757, -0.00044630467891693115, -0.0004316382110118866, -0.00041697174310684204, -0.0004023052752017975, -0.00038763880729675293, -0.0003729723393917084, -0.0003583058714866638, -0.00034363940358161926, -0.0003289729356765747, -0.00031430646777153015, -0.0002996399998664856, -0.00028497353196144104, -0.0002703070640563965, -0.00025564059615135193, -0.00024097412824630737, -0.00022630766034126282, -0.00021164119243621826, -0.0001969747245311737, -0.00018230825662612915, -0.0001676417887210846, -0.00015297532081604004, -0.00013830885291099548, -0.00012364238500595093, -0.00010897591710090637, -9.430944919586182e-05, -7.964298129081726e-05, -6.49765133857727e-05, -5.031004548072815e-05, -3.5643577575683594e-05, -2.0977109670639038e-05, -6.310641765594482e-06, 8.355826139450073e-06, 2.302229404449463e-05, 3.7688761949539185e-05, 5.235522985458374e-05, 6.70216977596283e-05, 8.168816566467285e-05, 9.635463356971741e-05, 0.00011102110147476196, 0.00012568756937980652, 0.00014035403728485107, 0.00015502050518989563, 0.00016968697309494019, 0.00018435344099998474, 0.0001990199089050293, 0.00021368637681007385, 0.0002283528447151184, 0.00024301931262016296, 0.0002576857805252075, 0.0002723522484302521, 0.00028701871633529663, 0.0003016851842403412, 0.00031635165214538574, 0.0003310181200504303, 0.00034568458795547485, 0.0003603510558605194, 0.00037501752376556396, 0.0003896839916706085, 0.0004043504595756531, 0.00041901692748069763, 0.0004336833953857422]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 10.0, 13.0, 18.0, 29.0, 40.0, 53.0, 63.0, 78.0, 140.0, 262.0, 517.0, 5001.0, 1024641.0, 16185.0, 663.0, 288.0, 160.0, 96.0, 58.0, 40.0, 27.0, 32.0, 27.0, 10.0, 6.0, 12.0, 7.0, 12.0, 7.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01016998291015625, -0.009867310523986816, -0.009564638137817383, -0.00926196575164795, -0.008959293365478516, -0.008656620979309082, -0.008353948593139648, -0.008051276206970215, -0.007748603820800781, -0.007445931434631348, -0.007143259048461914, -0.0068405866622924805, -0.006537914276123047, -0.006235241889953613, -0.00593256950378418, -0.005629897117614746, -0.0053272247314453125, -0.005024552345275879, -0.004721879959106445, -0.004419207572937012, -0.004116535186767578, -0.0038138628005981445, -0.003511190414428711, -0.0032085180282592773, -0.0029058456420898438, -0.00260317325592041, -0.0023005008697509766, -0.001997828483581543, -0.0016951560974121094, -0.0013924837112426758, -0.0010898113250732422, -0.0007871389389038086, -0.000484466552734375, -0.0001817941665649414, 0.00012087821960449219, 0.0004235506057739258, 0.0007262229919433594, 0.001028895378112793, 0.0013315677642822266, 0.0016342401504516602, 0.0019369125366210938, 0.0022395849227905273, 0.002542257308959961, 0.0028449296951293945, 0.003147602081298828, 0.0034502744674682617, 0.0037529468536376953, 0.004055619239807129, 0.0043582916259765625, 0.004660964012145996, 0.00496363639831543, 0.005266308784484863, 0.005568981170654297, 0.0058716535568237305, 0.006174325942993164, 0.006476998329162598, 0.006779670715332031, 0.007082343101501465, 0.0073850154876708984, 0.007687687873840332, 0.007990360260009766, 0.0082930326461792, 0.008595705032348633, 0.008898377418518066, 0.0092010498046875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 26.0, 64.0, 167.0, 242.0, 266.0, 124.0, 71.0, 31.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007197977975010872, -0.0007022435311228037, -0.0006846892647445202, -0.0006671349983662367, -0.0006495807319879532, -0.0006320265238173306, -0.0006144722574390471, -0.0005969179910607636, -0.0005793637246824801, -0.0005618094583041966, -0.0005442551919259131, -0.0005267009255476296, -0.000509146717377007, -0.0004915924509987235, -0.00047403818462044, -0.0004564839182421565, -0.000438929651863873, -0.0004213753854855895, -0.000403821119107306, -0.00038626688183285296, -0.00036871261545456946, -0.00035115834907628596, -0.0003336041118018329, -0.0003160498454235494, -0.0002984955790452659, -0.0002809413126669824, -0.0002633870462886989, -0.00024583280901424587, -0.00022827854263596237, -0.00021072427625767887, -0.0001931700244313106, -0.00017561577260494232, -0.0001580614480189979, -0.0001405071816407144, -0.00012295292981434613, -0.00010539867071202025, -8.784441160969436e-05, -7.029015250736848e-05, -5.273589340504259e-05, -3.5181641578674316e-05, -1.7627375200390816e-05, -7.311609806492925e-08, 1.7481143004260957e-05, 3.5035402106586844e-05, 5.258966120891273e-05, 7.014392031123862e-05, 8.76981794135645e-05, 0.00010525243123993278, 0.00012280669761821628, 0.00014036096399649978, 0.00015791521582286805, 0.00017546946764923632, 0.00019302373402751982, 0.00021057800040580332, 0.0002281322522321716, 0.00024568650405853987, 0.00026324077043682337, 0.00028079503681510687, 0.00029834930319339037, 0.0003159035404678434, 0.0003334578068461269, 0.0003510120732244104, 0.00036856631049886346, 0.00038612057687714696, 0.00040367484325543046]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 3.0, 11.0, 4.0, 12.0, 11.0, 9.0, 18.0, 16.0, 23.0, 24.0, 22.0, 23.0, 25.0, 32.0, 40.0, 33.0, 29.0, 30.0, 35.0, 39.0, 42.0, 48.0, 42.0, 29.0, 38.0, 26.0, 38.0, 36.0, 39.0, 20.0, 19.0, 22.0, 22.0, 15.0, 20.0, 15.0, 10.0, 10.0, 13.0, 6.0, 3.0, 10.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0], "bins": [-0.00020509958267211914, -0.0001990078017115593, -0.00019291602075099945, -0.0001868242397904396, -0.00018073245882987976, -0.00017464067786931992, -0.00016854889690876007, -0.00016245711594820023, -0.00015636533498764038, -0.00015027355402708054, -0.0001441817730665207, -0.00013808999210596085, -0.000131998211145401, -0.00012590643018484116, -0.00011981464922428131, -0.00011372286826372147, -0.00010763108730316162, -0.00010153930634260178, -9.544752538204193e-05, -8.935574442148209e-05, -8.326396346092224e-05, -7.71721825003624e-05, -7.108040153980255e-05, -6.49886205792427e-05, -5.889683961868286e-05, -5.2805058658123016e-05, -4.671327769756317e-05, -4.0621496737003326e-05, -3.452971577644348e-05, -2.8437934815883636e-05, -2.234615385532379e-05, -1.6254372894763947e-05, -1.0162591934204102e-05, -4.070810973644257e-06, 2.0209699869155884e-06, 8.112750947475433e-06, 1.4204531908035278e-05, 2.0296312868595123e-05, 2.6388093829154968e-05, 3.247987478971481e-05, 3.857165575027466e-05, 4.46634367108345e-05, 5.075521767139435e-05, 5.684699863195419e-05, 6.293877959251404e-05, 6.903056055307388e-05, 7.512234151363373e-05, 8.121412247419357e-05, 8.730590343475342e-05, 9.339768439531326e-05, 9.948946535587311e-05, 0.00010558124631643295, 0.0001116730272769928, 0.00011776480823755264, 0.0001238565891981125, 0.00012994837015867233, 0.00013604015111923218, 0.00014213193207979202, 0.00014822371304035187, 0.0001543154940009117, 0.00016040727496147156, 0.0001664990559220314, 0.00017259083688259125, 0.0001786826178431511, 0.00018477439880371094]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 8.0, 13.0, 15.0, 13.0, 22.0, 16.0, 15.0, 22.0, 19.0, 24.0, 28.0, 39.0, 44.0, 24.0, 39.0, 52.0, 37.0, 62.0, 39.0, 37.0, 40.0, 37.0, 30.0, 32.0, 32.0, 22.0, 32.0, 30.0, 23.0, 27.0, 17.0, 21.0, 16.0, 19.0, 11.0, 6.0, 7.0, 9.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.57421875, -2.492279052734375, -2.41033935546875, -2.328399658203125, -2.2464599609375, -2.164520263671875, -2.08258056640625, -2.000640869140625, -1.918701171875, -1.836761474609375, -1.75482177734375, -1.672882080078125, -1.5909423828125, -1.509002685546875, -1.42706298828125, -1.345123291015625, -1.26318359375, -1.181243896484375, -1.09930419921875, -1.017364501953125, -0.9354248046875, -0.853485107421875, -0.77154541015625, -0.689605712890625, -0.607666015625, -0.525726318359375, -0.44378662109375, -0.361846923828125, -0.2799072265625, -0.197967529296875, -0.11602783203125, -0.034088134765625, 0.0478515625, 0.129791259765625, 0.21173095703125, 0.293670654296875, 0.3756103515625, 0.457550048828125, 0.53948974609375, 0.621429443359375, 0.703369140625, 0.785308837890625, 0.86724853515625, 0.949188232421875, 1.0311279296875, 1.113067626953125, 1.19500732421875, 1.276947021484375, 1.35888671875, 1.440826416015625, 1.52276611328125, 1.604705810546875, 1.6866455078125, 1.768585205078125, 1.85052490234375, 1.932464599609375, 2.014404296875, 2.096343994140625, 2.17828369140625, 2.260223388671875, 2.3421630859375, 2.424102783203125, 2.50604248046875, 2.587982177734375, 2.669921875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 12.0, 8.0, 14.0, 25.0, 44.0, 40.0, 78.0, 90.0, 158.0, 264.0, 407.0, 648.0, 1192.0, 2021.0, 3733.0, 6698.0, 13118.0, 26176.0, 55939.0, 119129.0, 228575.0, 271230.0, 165755.0, 78258.0, 36960.0, 17842.0, 8890.0, 4875.0, 2695.0, 1492.0, 881.0, 466.0, 300.0, 178.0, 137.0, 66.0, 39.0, 43.0, 25.0, 17.0, 11.0, 9.0, 3.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7216796875, -1.6647186279296875, -1.607757568359375, -1.5507965087890625, -1.49383544921875, -1.4368743896484375, -1.379913330078125, -1.3229522705078125, -1.2659912109375, -1.2090301513671875, -1.152069091796875, -1.0951080322265625, -1.03814697265625, -0.9811859130859375, -0.924224853515625, -0.8672637939453125, -0.810302734375, -0.7533416748046875, -0.696380615234375, -0.6394195556640625, -0.58245849609375, -0.5254974365234375, -0.468536376953125, -0.4115753173828125, -0.3546142578125, -0.2976531982421875, -0.240692138671875, -0.1837310791015625, -0.12677001953125, -0.0698089599609375, -0.012847900390625, 0.0441131591796875, 0.10107421875, 0.1580352783203125, 0.214996337890625, 0.2719573974609375, 0.32891845703125, 0.3858795166015625, 0.442840576171875, 0.4998016357421875, 0.5567626953125, 0.6137237548828125, 0.670684814453125, 0.7276458740234375, 0.78460693359375, 0.8415679931640625, 0.898529052734375, 0.9554901123046875, 1.012451171875, 1.0694122314453125, 1.126373291015625, 1.1833343505859375, 1.24029541015625, 1.2972564697265625, 1.354217529296875, 1.4111785888671875, 1.4681396484375, 1.5251007080078125, 1.582061767578125, 1.6390228271484375, 1.69598388671875, 1.7529449462890625, 1.809906005859375, 1.8668670654296875, 1.923828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 2.0, 5.0, 2.0, 6.0, 4.0, 14.0, 17.0, 18.0, 21.0, 28.0, 28.0, 30.0, 33.0, 47.0, 46.0, 42.0, 68.0, 82.0, 216.0, 1511.0, 260.0, 122.0, 70.0, 49.0, 43.0, 31.0, 26.0, 30.0, 38.0, 27.0, 19.0, 15.0, 13.0, 8.0, 13.0, 9.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.0, -8.715576171875, -8.43115234375, -8.146728515625, -7.8623046875, -7.577880859375, -7.29345703125, -7.009033203125, -6.724609375, -6.440185546875, -6.15576171875, -5.871337890625, -5.5869140625, -5.302490234375, -5.01806640625, -4.733642578125, -4.44921875, -4.164794921875, -3.88037109375, -3.595947265625, -3.3115234375, -3.027099609375, -2.74267578125, -2.458251953125, -2.173828125, -1.889404296875, -1.60498046875, -1.320556640625, -1.0361328125, -0.751708984375, -0.46728515625, -0.182861328125, 0.1015625, 0.385986328125, 0.67041015625, 0.954833984375, 1.2392578125, 1.523681640625, 1.80810546875, 2.092529296875, 2.376953125, 2.661376953125, 2.94580078125, 3.230224609375, 3.5146484375, 3.799072265625, 4.08349609375, 4.367919921875, 4.65234375, 4.936767578125, 5.22119140625, 5.505615234375, 5.7900390625, 6.074462890625, 6.35888671875, 6.643310546875, 6.927734375, 7.212158203125, 7.49658203125, 7.781005859375, 8.0654296875, 8.349853515625, 8.63427734375, 8.918701171875, 9.203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 11.0, 6.0, 11.0, 21.0, 13.0, 18.0, 21.0, 21.0, 28.0, 44.0, 78.0, 89.0, 133.0, 207.0, 379.0, 988.0, 7812.0, 1425322.0, 1700015.0, 8370.0, 1045.0, 373.0, 202.0, 144.0, 81.0, 78.0, 45.0, 35.0, 35.0, 17.0, 10.0, 8.0, 9.0, 4.0, 6.0, 9.0, 7.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-20.078125, -19.53564453125, -18.9931640625, -18.45068359375, -17.908203125, -17.36572265625, -16.8232421875, -16.28076171875, -15.73828125, -15.19580078125, -14.6533203125, -14.11083984375, -13.568359375, -13.02587890625, -12.4833984375, -11.94091796875, -11.3984375, -10.85595703125, -10.3134765625, -9.77099609375, -9.228515625, -8.68603515625, -8.1435546875, -7.60107421875, -7.05859375, -6.51611328125, -5.9736328125, -5.43115234375, -4.888671875, -4.34619140625, -3.8037109375, -3.26123046875, -2.71875, -2.17626953125, -1.6337890625, -1.09130859375, -0.548828125, -0.00634765625, 0.5361328125, 1.07861328125, 1.62109375, 2.16357421875, 2.7060546875, 3.24853515625, 3.791015625, 4.33349609375, 4.8759765625, 5.41845703125, 5.9609375, 6.50341796875, 7.0458984375, 7.58837890625, 8.130859375, 8.67333984375, 9.2158203125, 9.75830078125, 10.30078125, 10.84326171875, 11.3857421875, 11.92822265625, 12.470703125, 13.01318359375, 13.5556640625, 14.09814453125, 14.640625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 61.0, 572.0, 366.0, 15.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.350950241088867, -14.81060791015625, -12.270264625549316, -9.729921340942383, -7.189579010009766, -4.649236679077148, -2.108893394470215, 0.43144989013671875, 2.971792221069336, 5.512135028839111, 8.052477836608887, 10.59282112121582, 13.133163452148438, 15.673505783081055, 18.213848114013672, 20.754192352294922, 23.29453468322754, 25.834877014160156, 28.375221252441406, 30.915563583374023, 33.45590591430664, 35.996246337890625, 38.536590576171875, 41.076934814453125, 43.617279052734375, 46.157623291015625, 48.69796371459961, 51.23830795288086, 53.778648376464844, 56.318992614746094, 58.859336853027344, 61.399681091308594, 63.94001770019531, 66.48036193847656, 69.02070617675781, 71.56104278564453, 74.10138702392578, 76.64173126220703, 79.18207550048828, 81.72241973876953, 84.26275634765625, 86.8031005859375, 89.34344482421875, 91.88378143310547, 94.42412567138672, 96.96446990966797, 99.50481414794922, 102.04515838623047, 104.58550262451172, 107.12584686279297, 109.66619110107422, 112.20652770996094, 114.74687194824219, 117.28721618652344, 119.82756042480469, 122.36790466308594, 124.90824890136719, 127.44859313964844, 129.9889373779297, 132.52928161621094, 135.0696258544922, 137.60995483398438, 140.15029907226562, 142.69064331054688, 145.23098754882812]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 12.0, 6.0, 12.0, 12.0, 16.0, 15.0, 13.0, 19.0, 35.0, 27.0, 23.0, 44.0, 33.0, 35.0, 44.0, 40.0, 48.0, 41.0, 38.0, 38.0, 38.0, 47.0, 39.0, 28.0, 34.0, 42.0, 21.0, 31.0, 35.0, 19.0, 20.0, 10.0, 13.0, 10.0, 10.0, 9.0, 6.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-32.31574249267578, -31.393869400024414, -30.471996307373047, -29.55012321472168, -28.628250122070312, -27.706377029418945, -26.784503936767578, -25.86263084411621, -24.940757751464844, -24.018884658813477, -23.09701156616211, -22.175138473510742, -21.253265380859375, -20.331392288208008, -19.40951919555664, -18.487646102905273, -17.565773010253906, -16.64389991760254, -15.722026824951172, -14.800153732299805, -13.878280639648438, -12.95640754699707, -12.034534454345703, -11.112661361694336, -10.190786361694336, -9.268913269042969, -8.347040176391602, -7.425167083740234, -6.503293991088867, -5.581420421600342, -4.659547328948975, -3.7376742362976074, -2.8158016204833984, -1.8939285278320312, -0.9720553159713745, -0.05018210411071777, 0.8716909885406494, 1.7935643196105957, 2.715437412261963, 3.63731050491333, 4.559183597564697, 5.4810566902160645, 6.402929782867432, 7.324803352355957, 8.246676445007324, 9.168549537658691, 10.090422630310059, 11.012295722961426, 11.934168815612793, 12.85604190826416, 13.777915000915527, 14.699788093566895, 15.621661186218262, 16.543535232543945, 17.465408325195312, 18.38728141784668, 19.309154510498047, 20.231027603149414, 21.15290069580078, 22.07477378845215, 22.996646881103516, 23.918519973754883, 24.84039306640625, 25.762266159057617, 26.684139251708984]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 7.0, 4.0, 9.0, 10.0, 16.0, 16.0, 16.0, 15.0, 20.0, 18.0, 32.0, 32.0, 27.0, 41.0, 39.0, 30.0, 46.0, 51.0, 49.0, 45.0, 47.0, 39.0, 29.0, 33.0, 35.0, 38.0, 32.0, 33.0, 30.0, 27.0, 20.0, 24.0, 20.0, 16.0, 16.0, 11.0, 11.0, 6.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.71368408203125, -2.6226806640625, -2.53167724609375, -2.440673828125, -2.34967041015625, -2.2586669921875, -2.16766357421875, -2.07666015625, -1.98565673828125, -1.8946533203125, -1.80364990234375, -1.712646484375, -1.62164306640625, -1.5306396484375, -1.43963623046875, -1.3486328125, -1.25762939453125, -1.1666259765625, -1.07562255859375, -0.984619140625, -0.89361572265625, -0.8026123046875, -0.71160888671875, -0.62060546875, -0.52960205078125, -0.4385986328125, -0.34759521484375, -0.256591796875, -0.16558837890625, -0.0745849609375, 0.01641845703125, 0.107421875, 0.19842529296875, 0.2894287109375, 0.38043212890625, 0.471435546875, 0.56243896484375, 0.6534423828125, 0.74444580078125, 0.83544921875, 0.92645263671875, 1.0174560546875, 1.10845947265625, 1.199462890625, 1.29046630859375, 1.3814697265625, 1.47247314453125, 1.5634765625, 1.65447998046875, 1.7454833984375, 1.83648681640625, 1.927490234375, 2.01849365234375, 2.1094970703125, 2.20050048828125, 2.29150390625, 2.38250732421875, 2.4735107421875, 2.56451416015625, 2.655517578125, 2.74652099609375, 2.8375244140625, 2.92852783203125, 3.01953125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 7.0, 7.0, 8.0, 10.0, 19.0, 15.0, 22.0, 27.0, 32.0, 53.0, 69.0, 96.0, 153.0, 265.0, 636.0, 1964.0, 10765.0, 96903.0, 1266255.0, 2469257.0, 314634.0, 26891.0, 4078.0, 1030.0, 393.0, 190.0, 130.0, 89.0, 64.0, 44.0, 29.0, 30.0, 24.0, 16.0, 14.0, 13.0, 9.0, 7.0, 7.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.31640625, -7.08935546875, -6.8623046875, -6.63525390625, -6.408203125, -6.18115234375, -5.9541015625, -5.72705078125, -5.5, -5.27294921875, -5.0458984375, -4.81884765625, -4.591796875, -4.36474609375, -4.1376953125, -3.91064453125, -3.68359375, -3.45654296875, -3.2294921875, -3.00244140625, -2.775390625, -2.54833984375, -2.3212890625, -2.09423828125, -1.8671875, -1.64013671875, -1.4130859375, -1.18603515625, -0.958984375, -0.73193359375, -0.5048828125, -0.27783203125, -0.05078125, 0.17626953125, 0.4033203125, 0.63037109375, 0.857421875, 1.08447265625, 1.3115234375, 1.53857421875, 1.765625, 1.99267578125, 2.2197265625, 2.44677734375, 2.673828125, 2.90087890625, 3.1279296875, 3.35498046875, 3.58203125, 3.80908203125, 4.0361328125, 4.26318359375, 4.490234375, 4.71728515625, 4.9443359375, 5.17138671875, 5.3984375, 5.62548828125, 5.8525390625, 6.07958984375, 6.306640625, 6.53369140625, 6.7607421875, 6.98779296875, 7.21484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 14.0, 22.0, 37.0, 47.0, 51.0, 98.0, 116.0, 198.0, 233.0, 309.0, 392.0, 513.0, 475.0, 398.0, 327.0, 238.0, 162.0, 136.0, 80.0, 61.0, 50.0, 27.0, 24.0, 10.0, 7.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.1875, -8.93231201171875, -8.6771240234375, -8.42193603515625, -8.166748046875, -7.91156005859375, -7.6563720703125, -7.40118408203125, -7.14599609375, -6.89080810546875, -6.6356201171875, -6.38043212890625, -6.125244140625, -5.87005615234375, -5.6148681640625, -5.35968017578125, -5.1044921875, -4.84930419921875, -4.5941162109375, -4.33892822265625, -4.083740234375, -3.82855224609375, -3.5733642578125, -3.31817626953125, -3.06298828125, -2.80780029296875, -2.5526123046875, -2.29742431640625, -2.042236328125, -1.78704833984375, -1.5318603515625, -1.27667236328125, -1.021484375, -0.76629638671875, -0.5111083984375, -0.25592041015625, -0.000732421875, 0.25445556640625, 0.5096435546875, 0.76483154296875, 1.02001953125, 1.27520751953125, 1.5303955078125, 1.78558349609375, 2.040771484375, 2.29595947265625, 2.5511474609375, 2.80633544921875, 3.0615234375, 3.31671142578125, 3.5718994140625, 3.82708740234375, 4.082275390625, 4.33746337890625, 4.5926513671875, 4.84783935546875, 5.10302734375, 5.35821533203125, 5.6134033203125, 5.86859130859375, 6.123779296875, 6.37896728515625, 6.6341552734375, 6.88934326171875, 7.14453125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 9.0, 7.0, 12.0, 17.0, 31.0, 38.0, 47.0, 89.0, 110.0, 190.0, 358.0, 865.0, 4771.0, 289000.0, 3850190.0, 44976.0, 2104.0, 641.0, 282.0, 178.0, 124.0, 71.0, 38.0, 38.0, 38.0, 26.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.640625, -23.770751953125, -22.90087890625, -22.031005859375, -21.1611328125, -20.291259765625, -19.42138671875, -18.551513671875, -17.681640625, -16.811767578125, -15.94189453125, -15.072021484375, -14.2021484375, -13.332275390625, -12.46240234375, -11.592529296875, -10.72265625, -9.852783203125, -8.98291015625, -8.113037109375, -7.2431640625, -6.373291015625, -5.50341796875, -4.633544921875, -3.763671875, -2.893798828125, -2.02392578125, -1.154052734375, -0.2841796875, 0.585693359375, 1.45556640625, 2.325439453125, 3.1953125, 4.065185546875, 4.93505859375, 5.804931640625, 6.6748046875, 7.544677734375, 8.41455078125, 9.284423828125, 10.154296875, 11.024169921875, 11.89404296875, 12.763916015625, 13.6337890625, 14.503662109375, 15.37353515625, 16.243408203125, 17.11328125, 17.983154296875, 18.85302734375, 19.722900390625, 20.5927734375, 21.462646484375, 22.33251953125, 23.202392578125, 24.072265625, 24.942138671875, 25.81201171875, 26.681884765625, 27.5517578125, 28.421630859375, 29.29150390625, 30.161376953125, 31.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 18.0, 49.0, 214.0, 318.0, 274.0, 116.0, 21.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.165061950683594, -49.234886169433594, -46.304710388183594, -43.374534606933594, -40.444358825683594, -37.514183044433594, -34.58400344848633, -31.653827667236328, -28.723651885986328, -25.793476104736328, -22.863300323486328, -19.933122634887695, -17.002946853637695, -14.072771072387695, -11.142593383789062, -8.212417602539062, -5.2822418212890625, -2.3520655632019043, 0.5781106948852539, 3.5082874298095703, 6.43846321105957, 9.36863899230957, 12.298816680908203, 15.228992462158203, 18.159168243408203, 21.089344024658203, 24.019519805908203, 26.949697494506836, 29.879873275756836, 32.81005096435547, 35.74022674560547, 38.67040252685547, 41.60057067871094, 44.53074645996094, 47.46092224121094, 50.39109802246094, 53.32127380371094, 56.25144958496094, 59.1816291809082, 62.1118049621582, 65.04197692871094, 67.97215270996094, 70.90232849121094, 73.83250427246094, 76.76268005371094, 79.69285583496094, 82.62303161621094, 85.55320739746094, 88.48339080810547, 91.41356658935547, 94.34374237060547, 97.27391815185547, 100.20409393310547, 103.13426971435547, 106.064453125, 108.99462890625, 111.9248046875, 114.85498046875, 117.78515625, 120.71533203125, 123.6455078125, 126.57568359375, 129.505859375, 132.43603515625, 135.3662109375]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 12.0, 5.0, 12.0, 11.0, 11.0, 13.0, 14.0, 21.0, 24.0, 23.0, 30.0, 37.0, 35.0, 42.0, 27.0, 24.0, 45.0, 43.0, 40.0, 38.0, 35.0, 43.0, 38.0, 36.0, 42.0, 37.0, 34.0, 36.0, 26.0, 25.0, 16.0, 20.0, 15.0, 14.0, 16.0, 12.0, 7.0, 10.0, 6.0, 0.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.087722778320312, -24.257740020751953, -23.427757263183594, -22.597774505615234, -21.767791748046875, -20.937808990478516, -20.107826232910156, -19.277843475341797, -18.447860717773438, -17.617877960205078, -16.78789520263672, -15.95791244506836, -15.1279296875, -14.29794692993164, -13.467963218688965, -12.637980461120605, -11.80799674987793, -10.97801399230957, -10.148031234741211, -9.318048477172852, -8.488065719604492, -7.658082485198975, -6.828099250793457, -5.998116493225098, -5.168133735656738, -4.338150978088379, -3.5081679821014404, -2.678184986114502, -1.8482022285461426, -1.0182194709777832, -0.18823623657226562, 0.6417465209960938, 1.4717273712158203, 2.3017101287841797, 3.131693124771118, 3.9616761207580566, 4.791658878326416, 5.621641635894775, 6.451624870300293, 7.281607627868652, 8.111590385437012, 8.941573143005371, 9.77155590057373, 10.601539611816406, 11.431522369384766, 12.261505126953125, 13.091487884521484, 13.921470642089844, 14.751453399658203, 15.581436157226562, 16.411418914794922, 17.24140167236328, 18.07138442993164, 18.9013671875, 19.73134994506836, 20.56133270263672, 21.391315460205078, 22.221298217773438, 23.051280975341797, 23.881263732910156, 24.711246490478516, 25.541229248046875, 26.371212005615234, 27.201194763183594, 28.031179428100586]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 12.0, 9.0, 16.0, 15.0, 19.0, 17.0, 22.0, 17.0, 27.0, 31.0, 33.0, 38.0, 37.0, 39.0, 37.0, 46.0, 38.0, 40.0, 31.0, 34.0, 35.0, 44.0, 35.0, 25.0, 42.0, 29.0, 24.0, 22.0, 28.0, 32.0, 15.0, 14.0, 13.0, 16.0, 10.0, 11.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.830078125, -2.743896484375, -2.65771484375, -2.571533203125, -2.4853515625, -2.399169921875, -2.31298828125, -2.226806640625, -2.140625, -2.054443359375, -1.96826171875, -1.882080078125, -1.7958984375, -1.709716796875, -1.62353515625, -1.537353515625, -1.451171875, -1.364990234375, -1.27880859375, -1.192626953125, -1.1064453125, -1.020263671875, -0.93408203125, -0.847900390625, -0.76171875, -0.675537109375, -0.58935546875, -0.503173828125, -0.4169921875, -0.330810546875, -0.24462890625, -0.158447265625, -0.072265625, 0.013916015625, 0.10009765625, 0.186279296875, 0.2724609375, 0.358642578125, 0.44482421875, 0.531005859375, 0.6171875, 0.703369140625, 0.78955078125, 0.875732421875, 0.9619140625, 1.048095703125, 1.13427734375, 1.220458984375, 1.306640625, 1.392822265625, 1.47900390625, 1.565185546875, 1.6513671875, 1.737548828125, 1.82373046875, 1.909912109375, 1.99609375, 2.082275390625, 2.16845703125, 2.254638671875, 2.3408203125, 2.427001953125, 2.51318359375, 2.599365234375, 2.685546875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 8.0, 7.0, 3.0, 17.0, 28.0, 34.0, 44.0, 66.0, 97.0, 133.0, 195.0, 303.0, 396.0, 545.0, 846.0, 1213.0, 1811.0, 2469.0, 3681.0, 5271.0, 7839.0, 11418.0, 16695.0, 25121.0, 37884.0, 58619.0, 96140.0, 196925.0, 270959.0, 113106.0, 66394.0, 42791.0, 28187.0, 18756.0, 12756.0, 8608.0, 5998.0, 4116.0, 2735.0, 1961.0, 1371.0, 902.0, 621.0, 443.0, 344.0, 213.0, 157.0, 103.0, 71.0, 56.0, 33.0, 28.0, 28.0, 4.0, 3.0, 10.0, 5.0, 0.0, 1.0, 3.0], "bins": [-0.5595703125, -0.5421600341796875, -0.524749755859375, -0.5073394775390625, -0.48992919921875, -0.4725189208984375, -0.455108642578125, -0.4376983642578125, -0.4202880859375, -0.4028778076171875, -0.385467529296875, -0.3680572509765625, -0.35064697265625, -0.3332366943359375, -0.315826416015625, -0.2984161376953125, -0.281005859375, -0.2635955810546875, -0.246185302734375, -0.2287750244140625, -0.21136474609375, -0.1939544677734375, -0.176544189453125, -0.1591339111328125, -0.1417236328125, -0.1243133544921875, -0.106903076171875, -0.0894927978515625, -0.07208251953125, -0.0546722412109375, -0.037261962890625, -0.0198516845703125, -0.00244140625, 0.0149688720703125, 0.032379150390625, 0.0497894287109375, 0.06719970703125, 0.0846099853515625, 0.102020263671875, 0.1194305419921875, 0.1368408203125, 0.1542510986328125, 0.171661376953125, 0.1890716552734375, 0.20648193359375, 0.2238922119140625, 0.241302490234375, 0.2587127685546875, 0.276123046875, 0.2935333251953125, 0.310943603515625, 0.3283538818359375, 0.34576416015625, 0.3631744384765625, 0.380584716796875, 0.3979949951171875, 0.4154052734375, 0.4328155517578125, 0.450225830078125, 0.4676361083984375, 0.48504638671875, 0.5024566650390625, 0.519866943359375, 0.5372772216796875, 0.5546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 6.0, 4.0, 3.0, 3.0, 8.0, 11.0, 8.0, 11.0, 11.0, 16.0, 19.0, 22.0, 30.0, 27.0, 34.0, 20.0, 39.0, 39.0, 42.0, 36.0, 32.0, 41.0, 1060.0, 44.0, 47.0, 43.0, 32.0, 46.0, 36.0, 34.0, 36.0, 21.0, 28.0, 20.0, 12.0, 22.0, 13.0, 17.0, 12.0, 13.0, 4.0, 3.0, 5.0, 9.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7734375, -1.7177734375, -1.662109375, -1.6064453125, -1.55078125, -1.4951171875, -1.439453125, -1.3837890625, -1.328125, -1.2724609375, -1.216796875, -1.1611328125, -1.10546875, -1.0498046875, -0.994140625, -0.9384765625, -0.8828125, -0.8271484375, -0.771484375, -0.7158203125, -0.66015625, -0.6044921875, -0.548828125, -0.4931640625, -0.4375, -0.3818359375, -0.326171875, -0.2705078125, -0.21484375, -0.1591796875, -0.103515625, -0.0478515625, 0.0078125, 0.0634765625, 0.119140625, 0.1748046875, 0.23046875, 0.2861328125, 0.341796875, 0.3974609375, 0.453125, 0.5087890625, 0.564453125, 0.6201171875, 0.67578125, 0.7314453125, 0.787109375, 0.8427734375, 0.8984375, 0.9541015625, 1.009765625, 1.0654296875, 1.12109375, 1.1767578125, 1.232421875, 1.2880859375, 1.34375, 1.3994140625, 1.455078125, 1.5107421875, 1.56640625, 1.6220703125, 1.677734375, 1.7333984375, 1.7890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 12.0, 13.0, 21.0, 34.0, 37.0, 52.0, 105.0, 142.0, 202.0, 325.0, 496.0, 807.0, 1201.0, 1941.0, 3006.0, 4931.0, 8063.0, 13758.0, 23804.0, 41822.0, 78372.0, 161328.0, 1427507.0, 155259.0, 75846.0, 40866.0, 22806.0, 13284.0, 7933.0, 4967.0, 2932.0, 1861.0, 1210.0, 736.0, 507.0, 319.0, 212.0, 119.0, 105.0, 73.0, 31.0, 29.0, 21.0, 13.0, 9.0, 3.0, 4.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7273788452148438, -0.7042694091796875, -0.6811599731445312, -0.658050537109375, -0.6349411010742188, -0.6118316650390625, -0.5887222290039062, -0.56561279296875, -0.5425033569335938, -0.5193939208984375, -0.49628448486328125, -0.473175048828125, -0.45006561279296875, -0.4269561767578125, -0.40384674072265625, -0.3807373046875, -0.35762786865234375, -0.3345184326171875, -0.31140899658203125, -0.288299560546875, -0.26519012451171875, -0.2420806884765625, -0.21897125244140625, -0.19586181640625, -0.17275238037109375, -0.1496429443359375, -0.12653350830078125, -0.103424072265625, -0.08031463623046875, -0.0572052001953125, -0.03409576416015625, -0.010986328125, 0.01212310791015625, 0.0352325439453125, 0.05834197998046875, 0.081451416015625, 0.10456085205078125, 0.1276702880859375, 0.15077972412109375, 0.17388916015625, 0.19699859619140625, 0.2201080322265625, 0.24321746826171875, 0.266326904296875, 0.28943634033203125, 0.3125457763671875, 0.33565521240234375, 0.3587646484375, 0.38187408447265625, 0.4049835205078125, 0.42809295654296875, 0.451202392578125, 0.47431182861328125, 0.4974212646484375, 0.5205307006835938, 0.54364013671875, 0.5667495727539062, 0.5898590087890625, 0.6129684448242188, 0.636077880859375, 0.6591873168945312, 0.6822967529296875, 0.7054061889648438, 0.728515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 6.0, 16.0, 12.0, 15.0, 20.0, 26.0, 29.0, 43.0, 48.0, 75.0, 73.0, 101.0, 111.0, 96.0, 75.0, 60.0, 27.0, 30.0, 18.0, 15.0, 12.0, 13.0, 9.0, 7.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006213188171386719, -0.0006041377782821655, -0.0005869567394256592, -0.0005697757005691528, -0.0005525946617126465, -0.0005354136228561401, -0.0005182325839996338, -0.0005010515451431274, -0.0004838705062866211, -0.00046668946743011475, -0.0004495084285736084, -0.00043232738971710205, -0.0004151463508605957, -0.00039796531200408936, -0.000380784273147583, -0.00036360323429107666, -0.0003464221954345703, -0.00032924115657806396, -0.0003120601177215576, -0.00029487907886505127, -0.0002776980400085449, -0.0002605170011520386, -0.00024333596229553223, -0.00022615492343902588, -0.00020897388458251953, -0.00019179284572601318, -0.00017461180686950684, -0.0001574307680130005, -0.00014024972915649414, -0.0001230686902999878, -0.00010588765144348145, -8.87066125869751e-05, -7.152557373046875e-05, -5.43445348739624e-05, -3.7163496017456055e-05, -1.9982457160949707e-05, -2.8014183044433594e-06, 1.4379620552062988e-05, 3.1560659408569336e-05, 4.8741698265075684e-05, 6.592273712158203e-05, 8.310377597808838e-05, 0.00010028481483459473, 0.00011746585369110107, 0.00013464689254760742, 0.00015182793140411377, 0.00016900897026062012, 0.00018619000911712646, 0.0002033710479736328, 0.00022055208683013916, 0.0002377331256866455, 0.00025491416454315186, 0.0002720952033996582, 0.00028927624225616455, 0.0003064572811126709, 0.00032363831996917725, 0.0003408193588256836, 0.00035800039768218994, 0.0003751814365386963, 0.00039236247539520264, 0.000409543514251709, 0.00042672455310821533, 0.0004439055919647217, 0.00046108663082122803, 0.0004782676696777344]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 9.0, 8.0, 9.0, 11.0, 19.0, 24.0, 30.0, 53.0, 60.0, 97.0, 136.0, 260.0, 463.0, 1822.0, 938278.0, 105300.0, 962.0, 377.0, 167.0, 141.0, 88.0, 64.0, 35.0, 25.0, 19.0, 20.0, 17.0, 8.0, 7.0, 6.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0084686279296875, -0.008113622665405273, -0.007758617401123047, -0.00740361213684082, -0.007048606872558594, -0.006693601608276367, -0.006338596343994141, -0.005983591079711914, -0.0056285858154296875, -0.005273580551147461, -0.004918575286865234, -0.004563570022583008, -0.004208564758300781, -0.0038535594940185547, -0.003498554229736328, -0.0031435489654541016, -0.002788543701171875, -0.0024335384368896484, -0.002078533172607422, -0.0017235279083251953, -0.0013685226440429688, -0.0010135173797607422, -0.0006585121154785156, -0.00030350685119628906, 5.14984130859375e-05, 0.00040650367736816406, 0.0007615089416503906, 0.0011165142059326172, 0.0014715194702148438, 0.0018265247344970703, 0.002181529998779297, 0.0025365352630615234, 0.00289154052734375, 0.0032465457916259766, 0.003601551055908203, 0.00395655632019043, 0.004311561584472656, 0.004666566848754883, 0.005021572113037109, 0.005376577377319336, 0.0057315826416015625, 0.006086587905883789, 0.006441593170166016, 0.006796598434448242, 0.007151603698730469, 0.007506608963012695, 0.007861614227294922, 0.008216619491577148, 0.008571624755859375, 0.008926630020141602, 0.009281635284423828, 0.009636640548706055, 0.009991645812988281, 0.010346651077270508, 0.010701656341552734, 0.011056661605834961, 0.011411666870117188, 0.011766672134399414, 0.01212167739868164, 0.012476682662963867, 0.012831687927246094, 0.01318669319152832, 0.013541698455810547, 0.013896703720092773, 0.014251708984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [7.0, 28.0, 124.0, 330.0, 326.0, 151.0, 35.0, 11.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001202230341732502, -9.109482925850898e-05, -6.196661706781015e-05, -3.2838404877111316e-05, -3.7101999623700976e-06, 2.541800495237112e-05, 5.454622441902757e-05, 8.367442933376878e-05, 0.00011280263424851, 0.00014193083916325122, 0.00017105904407799244, 0.00020018726354464889, 0.0002293154684593901, 0.0002584436733741313, 0.00028757189284078777, 0.00031670008320361376, 0.0003458283026702702, 0.00037495652213692665, 0.00040408471249975264, 0.0004332129319664091, 0.0004623411223292351, 0.0004914693417958915, 0.000520597561262548, 0.0005497257807292044, 0.0005788540001958609, 0.0006079822196625173, 0.0006371104391291738, 0.0006662386003881693, 0.0006953668198548257, 0.0007244950393214822, 0.0007536232587881386, 0.0007827514782547951, 0.0008118796395137906, 0.000841007858980447, 0.0008701360784471035, 0.000899264239706099, 0.0009283924591727555, 0.0009575206786394119, 0.0009866489563137293, 0.0010157771175727248, 0.0010449052788317204, 0.0010740334400907159, 0.0011031617177650332, 0.0011322898790240288, 0.0011614181566983461, 0.0011905463179573417, 0.0012196744792163372, 0.0012488027568906546, 0.001277931034564972, 0.0013070591958239675, 0.0013361874734982848, 0.0013653156347572803, 0.0013944439124315977, 0.0014235720736905932, 0.0014527002349495888, 0.0014818285126239061, 0.0015109566738829017, 0.0015400848351418972, 0.0015692131128162146, 0.00159834127407521, 0.0016274695517495275, 0.001656597713008523, 0.0016857259906828403, 0.0017148541519418359, 0.0017439823132008314]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 4.0, 9.0, 17.0, 17.0, 24.0, 27.0, 25.0, 24.0, 31.0, 31.0, 33.0, 41.0, 37.0, 40.0, 38.0, 42.0, 42.0, 35.0, 39.0, 40.0, 33.0, 40.0, 46.0, 21.0, 36.0, 28.0, 23.0, 26.0, 24.0, 20.0, 21.0, 13.0, 9.0, 12.0, 12.0, 5.0, 3.0, 9.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022232532501220703, -0.000214453786611557, -0.00020658224821090698, -0.00019871070981025696, -0.00019083917140960693, -0.0001829676330089569, -0.00017509609460830688, -0.00016722455620765686, -0.00015935301780700684, -0.0001514814794063568, -0.0001436099410057068, -0.00013573840260505676, -0.00012786686420440674, -0.00011999532580375671, -0.00011212378740310669, -0.00010425224900245667, -9.638071060180664e-05, -8.850917220115662e-05, -8.063763380050659e-05, -7.276609539985657e-05, -6.489455699920654e-05, -5.702301859855652e-05, -4.9151480197906494e-05, -4.127994179725647e-05, -3.3408403396606445e-05, -2.553686499595642e-05, -1.7665326595306396e-05, -9.793788194656372e-06, -1.9222497940063477e-06, 5.949288606643677e-06, 1.3820827007293701e-05, 2.1692365407943726e-05, 2.956390380859375e-05, 3.7435442209243774e-05, 4.53069806098938e-05, 5.317851901054382e-05, 6.105005741119385e-05, 6.892159581184387e-05, 7.67931342124939e-05, 8.466467261314392e-05, 9.253621101379395e-05, 0.00010040774941444397, 0.000108279287815094, 0.00011615082621574402, 0.00012402236461639404, 0.00013189390301704407, 0.0001397654414176941, 0.00014763697981834412, 0.00015550851821899414, 0.00016338005661964417, 0.0001712515950202942, 0.00017912313342094421, 0.00018699467182159424, 0.00019486621022224426, 0.0002027377486228943, 0.0002106092870235443, 0.00021848082542419434, 0.00022635236382484436, 0.00023422390222549438, 0.0002420954406261444, 0.00024996697902679443, 0.00025783851742744446, 0.0002657100558280945, 0.0002735815942287445, 0.00028145313262939453]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 12.0, 9.0, 16.0, 15.0, 19.0, 17.0, 22.0, 17.0, 27.0, 31.0, 33.0, 38.0, 37.0, 39.0, 37.0, 46.0, 38.0, 40.0, 31.0, 34.0, 35.0, 44.0, 35.0, 25.0, 42.0, 29.0, 24.0, 22.0, 28.0, 32.0, 15.0, 14.0, 13.0, 16.0, 10.0, 11.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.830078125, -2.743896484375, -2.65771484375, -2.571533203125, -2.4853515625, -2.399169921875, -2.31298828125, -2.226806640625, -2.140625, -2.054443359375, -1.96826171875, -1.882080078125, -1.7958984375, -1.709716796875, -1.62353515625, -1.537353515625, -1.451171875, -1.364990234375, -1.27880859375, -1.192626953125, -1.1064453125, -1.020263671875, -0.93408203125, -0.847900390625, -0.76171875, -0.675537109375, -0.58935546875, -0.503173828125, -0.4169921875, -0.330810546875, -0.24462890625, -0.158447265625, -0.072265625, 0.013916015625, 0.10009765625, 0.186279296875, 0.2724609375, 0.358642578125, 0.44482421875, 0.531005859375, 0.6171875, 0.703369140625, 0.78955078125, 0.875732421875, 0.9619140625, 1.048095703125, 1.13427734375, 1.220458984375, 1.306640625, 1.392822265625, 1.47900390625, 1.565185546875, 1.6513671875, 1.737548828125, 1.82373046875, 1.909912109375, 1.99609375, 2.082275390625, 2.16845703125, 2.254638671875, 2.3408203125, 2.427001953125, 2.51318359375, 2.599365234375, 2.685546875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 16.0, 20.0, 28.0, 20.0, 32.0, 33.0, 56.0, 93.0, 92.0, 162.0, 223.0, 297.0, 415.0, 656.0, 939.0, 1463.0, 2226.0, 3626.0, 5719.0, 9814.0, 18245.0, 37966.0, 94326.0, 277997.0, 364290.0, 128822.0, 48371.0, 22379.0, 11662.0, 6767.0, 4065.0, 2595.0, 1617.0, 1125.0, 710.0, 488.0, 353.0, 223.0, 169.0, 122.0, 83.0, 70.0, 54.0, 40.0, 30.0, 19.0, 15.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.994140625, -2.90380859375, -2.8134765625, -2.72314453125, -2.6328125, -2.54248046875, -2.4521484375, -2.36181640625, -2.271484375, -2.18115234375, -2.0908203125, -2.00048828125, -1.91015625, -1.81982421875, -1.7294921875, -1.63916015625, -1.548828125, -1.45849609375, -1.3681640625, -1.27783203125, -1.1875, -1.09716796875, -1.0068359375, -0.91650390625, -0.826171875, -0.73583984375, -0.6455078125, -0.55517578125, -0.46484375, -0.37451171875, -0.2841796875, -0.19384765625, -0.103515625, -0.01318359375, 0.0771484375, 0.16748046875, 0.2578125, 0.34814453125, 0.4384765625, 0.52880859375, 0.619140625, 0.70947265625, 0.7998046875, 0.89013671875, 0.98046875, 1.07080078125, 1.1611328125, 1.25146484375, 1.341796875, 1.43212890625, 1.5224609375, 1.61279296875, 1.703125, 1.79345703125, 1.8837890625, 1.97412109375, 2.064453125, 2.15478515625, 2.2451171875, 2.33544921875, 2.42578125, 2.51611328125, 2.6064453125, 2.69677734375, 2.787109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 8.0, 5.0, 6.0, 10.0, 16.0, 21.0, 19.0, 23.0, 32.0, 32.0, 23.0, 45.0, 42.0, 50.0, 52.0, 68.0, 146.0, 1469.0, 409.0, 129.0, 75.0, 60.0, 30.0, 44.0, 32.0, 30.0, 25.0, 29.0, 17.0, 27.0, 13.0, 12.0, 10.0, 9.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.046875, -10.701416015625, -10.35595703125, -10.010498046875, -9.6650390625, -9.319580078125, -8.97412109375, -8.628662109375, -8.283203125, -7.937744140625, -7.59228515625, -7.246826171875, -6.9013671875, -6.555908203125, -6.21044921875, -5.864990234375, -5.51953125, -5.174072265625, -4.82861328125, -4.483154296875, -4.1376953125, -3.792236328125, -3.44677734375, -3.101318359375, -2.755859375, -2.410400390625, -2.06494140625, -1.719482421875, -1.3740234375, -1.028564453125, -0.68310546875, -0.337646484375, 0.0078125, 0.353271484375, 0.69873046875, 1.044189453125, 1.3896484375, 1.735107421875, 2.08056640625, 2.426025390625, 2.771484375, 3.116943359375, 3.46240234375, 3.807861328125, 4.1533203125, 4.498779296875, 4.84423828125, 5.189697265625, 5.53515625, 5.880615234375, 6.22607421875, 6.571533203125, 6.9169921875, 7.262451171875, 7.60791015625, 7.953369140625, 8.298828125, 8.644287109375, 8.98974609375, 9.335205078125, 9.6806640625, 10.026123046875, 10.37158203125, 10.717041015625, 11.0625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 8.0, 14.0, 6.0, 20.0, 21.0, 29.0, 32.0, 43.0, 52.0, 68.0, 116.0, 158.0, 288.0, 525.0, 2394.0, 49436.0, 3032185.0, 56192.0, 2631.0, 528.0, 306.0, 192.0, 103.0, 74.0, 48.0, 47.0, 36.0, 18.0, 26.0, 15.0, 22.0, 10.0, 12.0, 6.0, 3.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.84375, -22.118896484375, -21.39404296875, -20.669189453125, -19.9443359375, -19.219482421875, -18.49462890625, -17.769775390625, -17.044921875, -16.320068359375, -15.59521484375, -14.870361328125, -14.1455078125, -13.420654296875, -12.69580078125, -11.970947265625, -11.24609375, -10.521240234375, -9.79638671875, -9.071533203125, -8.3466796875, -7.621826171875, -6.89697265625, -6.172119140625, -5.447265625, -4.722412109375, -3.99755859375, -3.272705078125, -2.5478515625, -1.822998046875, -1.09814453125, -0.373291015625, 0.3515625, 1.076416015625, 1.80126953125, 2.526123046875, 3.2509765625, 3.975830078125, 4.70068359375, 5.425537109375, 6.150390625, 6.875244140625, 7.60009765625, 8.324951171875, 9.0498046875, 9.774658203125, 10.49951171875, 11.224365234375, 11.94921875, 12.674072265625, 13.39892578125, 14.123779296875, 14.8486328125, 15.573486328125, 16.29833984375, 17.023193359375, 17.748046875, 18.472900390625, 19.19775390625, 19.922607421875, 20.6474609375, 21.372314453125, 22.09716796875, 22.822021484375, 23.546875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 463.0, 536.0, 7.0, 1.0, 1.0], "bins": [-290.40313720703125, -285.5629577636719, -280.7227478027344, -275.882568359375, -271.0423889160156, -266.2021789550781, -261.36199951171875, -256.5218200683594, -251.68161010742188, -246.84141540527344, -242.00123596191406, -237.16104125976562, -232.3208465576172, -227.48065185546875, -222.64047241210938, -217.80027770996094, -212.96009826660156, -208.11990356445312, -203.27972412109375, -198.4395294189453, -193.59933471679688, -188.7591552734375, -183.91896057128906, -179.07876586914062, -174.23858642578125, -169.3983917236328, -164.55821228027344, -159.718017578125, -154.87782287597656, -150.03762817382812, -145.19744873046875, -140.3572540283203, -135.51705932617188, -130.67686462402344, -125.83667755126953, -120.99649047851562, -116.15629577636719, -111.31610870361328, -106.47592163085938, -101.63572692871094, -96.79553985595703, -91.95535278320312, -87.11515808105469, -82.27497100830078, -77.43478393554688, -72.59458923339844, -67.75440216064453, -62.91421127319336, -58.07402038574219, -53.233829498291016, -48.393638610839844, -43.55345153808594, -38.713260650634766, -33.873069763183594, -29.032880783081055, -24.192691802978516, -19.35249900817871, -14.512309074401855, -9.672119140625, -4.8319292068481445, 0.008260726928710938, 4.848451614379883, 9.688640594482422, 14.528829574584961, 19.369020462036133]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 6.0, 8.0, 9.0, 13.0, 8.0, 20.0, 20.0, 26.0, 27.0, 45.0, 39.0, 29.0, 50.0, 39.0, 45.0, 51.0, 43.0, 60.0, 49.0, 40.0, 44.0, 41.0, 38.0, 22.0, 38.0, 31.0, 36.0, 23.0, 15.0, 20.0, 7.0, 9.0, 8.0, 5.0, 3.0, 11.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.334327697753906, -37.260040283203125, -36.18574905395508, -35.1114616394043, -34.03717041015625, -32.96288299560547, -31.888593673706055, -30.81430435180664, -29.740015029907227, -28.665725708007812, -27.5914363861084, -26.517147064208984, -25.442859649658203, -24.368568420410156, -23.294281005859375, -22.21999168395996, -21.145702362060547, -20.071413040161133, -18.99712371826172, -17.922834396362305, -16.84854507446289, -15.774256706237793, -14.699968338012695, -13.625679016113281, -12.551389694213867, -11.477100372314453, -10.402811050415039, -9.328522682189941, -8.254233360290527, -7.179944038391113, -6.105655193328857, -5.031366348266602, -3.957080841064453, -2.882791757583618, -1.8085026741027832, -0.7342135906219482, 0.3400754928588867, 1.4143648147583008, 2.4886536598205566, 3.5629425048828125, 4.637231826782227, 5.711521148681641, 6.7858099937438965, 7.860098838806152, 8.934388160705566, 10.00867748260498, 11.082965850830078, 12.157255172729492, 13.231544494628906, 14.30583381652832, 15.380123138427734, 16.45441246032715, 17.528701782226562, 18.602989196777344, 19.677278518676758, 20.751567840576172, 21.825857162475586, 22.900146484375, 23.974435806274414, 25.048725128173828, 26.12301254272461, 27.197303771972656, 28.271591186523438, 29.34588050842285, 30.420169830322266]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 10.0, 7.0, 5.0, 7.0, 10.0, 19.0, 17.0, 14.0, 20.0, 24.0, 20.0, 35.0, 25.0, 34.0, 39.0, 31.0, 30.0, 42.0, 31.0, 34.0, 44.0, 43.0, 34.0, 39.0, 37.0, 31.0, 25.0, 32.0, 24.0, 28.0, 27.0, 26.0, 25.0, 19.0, 19.0, 16.0, 11.0, 12.0, 7.0, 19.0, 5.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.703125, -2.6162109375, -2.529296875, -2.4423828125, -2.35546875, -2.2685546875, -2.181640625, -2.0947265625, -2.0078125, -1.9208984375, -1.833984375, -1.7470703125, -1.66015625, -1.5732421875, -1.486328125, -1.3994140625, -1.3125, -1.2255859375, -1.138671875, -1.0517578125, -0.96484375, -0.8779296875, -0.791015625, -0.7041015625, -0.6171875, -0.5302734375, -0.443359375, -0.3564453125, -0.26953125, -0.1826171875, -0.095703125, -0.0087890625, 0.078125, 0.1650390625, 0.251953125, 0.3388671875, 0.42578125, 0.5126953125, 0.599609375, 0.6865234375, 0.7734375, 0.8603515625, 0.947265625, 1.0341796875, 1.12109375, 1.2080078125, 1.294921875, 1.3818359375, 1.46875, 1.5556640625, 1.642578125, 1.7294921875, 1.81640625, 1.9033203125, 1.990234375, 2.0771484375, 2.1640625, 2.2509765625, 2.337890625, 2.4248046875, 2.51171875, 2.5986328125, 2.685546875, 2.7724609375, 2.859375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 7.0, 12.0, 13.0, 16.0, 31.0, 40.0, 50.0, 76.0, 78.0, 114.0, 231.0, 368.0, 663.0, 1323.0, 2771.0, 6800.0, 19035.0, 61547.0, 222037.0, 726538.0, 1419166.0, 1142020.0, 421663.0, 115642.0, 33772.0, 11477.0, 4496.0, 1947.0, 903.0, 520.0, 285.0, 188.0, 127.0, 90.0, 59.0, 47.0, 26.0, 22.0, 19.0, 14.0, 12.0, 11.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.58203125, -3.46923828125, -3.3564453125, -3.24365234375, -3.130859375, -3.01806640625, -2.9052734375, -2.79248046875, -2.6796875, -2.56689453125, -2.4541015625, -2.34130859375, -2.228515625, -2.11572265625, -2.0029296875, -1.89013671875, -1.77734375, -1.66455078125, -1.5517578125, -1.43896484375, -1.326171875, -1.21337890625, -1.1005859375, -0.98779296875, -0.875, -0.76220703125, -0.6494140625, -0.53662109375, -0.423828125, -0.31103515625, -0.1982421875, -0.08544921875, 0.02734375, 0.14013671875, 0.2529296875, 0.36572265625, 0.478515625, 0.59130859375, 0.7041015625, 0.81689453125, 0.9296875, 1.04248046875, 1.1552734375, 1.26806640625, 1.380859375, 1.49365234375, 1.6064453125, 1.71923828125, 1.83203125, 1.94482421875, 2.0576171875, 2.17041015625, 2.283203125, 2.39599609375, 2.5087890625, 2.62158203125, 2.734375, 2.84716796875, 2.9599609375, 3.07275390625, 3.185546875, 3.29833984375, 3.4111328125, 3.52392578125, 3.63671875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 16.0, 27.0, 46.0, 69.0, 108.0, 125.0, 183.0, 283.0, 388.0, 532.0, 582.0, 504.0, 403.0, 259.0, 168.0, 137.0, 68.0, 61.0, 33.0, 19.0, 16.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-13.625, -13.310302734375, -12.99560546875, -12.680908203125, -12.3662109375, -12.051513671875, -11.73681640625, -11.422119140625, -11.107421875, -10.792724609375, -10.47802734375, -10.163330078125, -9.8486328125, -9.533935546875, -9.21923828125, -8.904541015625, -8.58984375, -8.275146484375, -7.96044921875, -7.645751953125, -7.3310546875, -7.016357421875, -6.70166015625, -6.386962890625, -6.072265625, -5.757568359375, -5.44287109375, -5.128173828125, -4.8134765625, -4.498779296875, -4.18408203125, -3.869384765625, -3.5546875, -3.239990234375, -2.92529296875, -2.610595703125, -2.2958984375, -1.981201171875, -1.66650390625, -1.351806640625, -1.037109375, -0.722412109375, -0.40771484375, -0.093017578125, 0.2216796875, 0.536376953125, 0.85107421875, 1.165771484375, 1.48046875, 1.795166015625, 2.10986328125, 2.424560546875, 2.7392578125, 3.053955078125, 3.36865234375, 3.683349609375, 3.998046875, 4.312744140625, 4.62744140625, 4.942138671875, 5.2568359375, 5.571533203125, 5.88623046875, 6.200927734375, 6.515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 11.0, 10.0, 26.0, 19.0, 42.0, 52.0, 76.0, 120.0, 202.0, 434.0, 1636.0, 39143.0, 3930409.0, 217936.0, 2880.0, 600.0, 255.0, 149.0, 83.0, 49.0, 37.0, 24.0, 21.0, 22.0, 15.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -24.979248046875, -24.00537109375, -23.031494140625, -22.0576171875, -21.083740234375, -20.10986328125, -19.135986328125, -18.162109375, -17.188232421875, -16.21435546875, -15.240478515625, -14.2666015625, -13.292724609375, -12.31884765625, -11.344970703125, -10.37109375, -9.397216796875, -8.42333984375, -7.449462890625, -6.4755859375, -5.501708984375, -4.52783203125, -3.553955078125, -2.580078125, -1.606201171875, -0.63232421875, 0.341552734375, 1.3154296875, 2.289306640625, 3.26318359375, 4.237060546875, 5.2109375, 6.184814453125, 7.15869140625, 8.132568359375, 9.1064453125, 10.080322265625, 11.05419921875, 12.028076171875, 13.001953125, 13.975830078125, 14.94970703125, 15.923583984375, 16.8974609375, 17.871337890625, 18.84521484375, 19.819091796875, 20.79296875, 21.766845703125, 22.74072265625, 23.714599609375, 24.6884765625, 25.662353515625, 26.63623046875, 27.610107421875, 28.583984375, 29.557861328125, 30.53173828125, 31.505615234375, 32.4794921875, 33.453369140625, 34.42724609375, 35.401123046875, 36.375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 11.0, 17.0, 21.0, 42.0, 60.0, 96.0, 117.0, 124.0, 150.0, 103.0, 91.0, 64.0, 50.0, 28.0, 16.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.13124084472656, -41.021175384521484, -39.911109924316406, -38.80104446411133, -37.69097900390625, -36.580909729003906, -35.47084426879883, -34.36077880859375, -33.25071334838867, -32.140647888183594, -31.030582427978516, -29.920515060424805, -28.810449600219727, -27.70038414001465, -26.590316772460938, -25.48025131225586, -24.37018585205078, -23.260120391845703, -22.150054931640625, -21.039987564086914, -19.929922103881836, -18.819856643676758, -17.709789276123047, -16.59972381591797, -15.48965835571289, -14.379592895507812, -13.269526481628418, -12.159460067749023, -11.049394607543945, -9.939329147338867, -8.829262733459473, -7.719196796417236, -6.609128952026367, -5.499063014984131, -4.3889970779418945, -3.278931140899658, -2.168865203857422, -1.0587992668151855, 0.05126667022705078, 1.161332607269287, 2.2713985443115234, 3.3814644813537598, 4.491530418395996, 5.601596355438232, 6.711662292480469, 7.821728229522705, 8.931794166564941, 10.041860580444336, 11.151926040649414, 12.261991500854492, 13.372057914733887, 14.482124328613281, 15.59218978881836, 16.702255249023438, 17.812320709228516, 18.922388076782227, 20.032453536987305, 21.142518997192383, 22.252586364746094, 23.362651824951172, 24.47271728515625, 25.582782745361328, 26.692848205566406, 27.802915573120117, 28.912981033325195]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 11.0, 9.0, 9.0, 12.0, 17.0, 8.0, 17.0, 20.0, 31.0, 25.0, 26.0, 36.0, 32.0, 38.0, 44.0, 35.0, 39.0, 40.0, 47.0, 31.0, 40.0, 33.0, 36.0, 36.0, 41.0, 28.0, 34.0, 27.0, 26.0, 27.0, 15.0, 21.0, 6.0, 17.0, 13.0, 13.0, 7.0, 7.0, 4.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.80202865600586, -21.04667854309082, -20.29132843017578, -19.535980224609375, -18.780630111694336, -18.025279998779297, -17.269929885864258, -16.51457977294922, -15.759230613708496, -15.003880500793457, -14.248531341552734, -13.493181228637695, -12.737831115722656, -11.982481956481934, -11.227131843566895, -10.471782684326172, -9.716432571411133, -8.961082458496094, -8.205733299255371, -7.450383186340332, -6.695033550262451, -5.93968391418457, -5.184333801269531, -4.42898416519165, -3.6736345291137695, -2.9182848930358887, -2.1629350185394287, -1.4075851440429688, -0.6522355079650879, 0.10311412811279297, 0.858464241027832, 1.613813877105713, 2.3691654205322266, 3.1245150566101074, 3.8798649311065674, 4.635214805603027, 5.390564441680908, 6.145914077758789, 6.901264190673828, 7.656613826751709, 8.41196346282959, 9.167313575744629, 9.922662734985352, 10.67801284790039, 11.43336296081543, 12.188712120056152, 12.944062232971191, 13.699411392211914, 14.454761505126953, 15.210111618041992, 15.965460777282715, 16.720809936523438, 17.476160049438477, 18.231510162353516, 18.986860275268555, 19.742210388183594, 20.49755859375, 21.25290870666504, 22.008258819580078, 22.763607025146484, 23.518957138061523, 24.274307250976562, 25.0296573638916, 25.78500747680664, 26.54035758972168]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 8.0, 5.0, 10.0, 11.0, 15.0, 21.0, 22.0, 16.0, 21.0, 32.0, 34.0, 26.0, 36.0, 34.0, 29.0, 33.0, 37.0, 36.0, 40.0, 45.0, 44.0, 37.0, 37.0, 32.0, 38.0, 33.0, 30.0, 25.0, 28.0, 21.0, 21.0, 15.0, 14.0, 23.0, 23.0, 9.0, 11.0, 11.0, 5.0, 8.0, 5.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.869140625, -2.7779541015625, -2.686767578125, -2.5955810546875, -2.50439453125, -2.4132080078125, -2.322021484375, -2.2308349609375, -2.1396484375, -2.0484619140625, -1.957275390625, -1.8660888671875, -1.77490234375, -1.6837158203125, -1.592529296875, -1.5013427734375, -1.41015625, -1.3189697265625, -1.227783203125, -1.1365966796875, -1.04541015625, -0.9542236328125, -0.863037109375, -0.7718505859375, -0.6806640625, -0.5894775390625, -0.498291015625, -0.4071044921875, -0.31591796875, -0.2247314453125, -0.133544921875, -0.0423583984375, 0.048828125, 0.1400146484375, 0.231201171875, 0.3223876953125, 0.41357421875, 0.5047607421875, 0.595947265625, 0.6871337890625, 0.7783203125, 0.8695068359375, 0.960693359375, 1.0518798828125, 1.14306640625, 1.2342529296875, 1.325439453125, 1.4166259765625, 1.5078125, 1.5989990234375, 1.690185546875, 1.7813720703125, 1.87255859375, 1.9637451171875, 2.054931640625, 2.1461181640625, 2.2373046875, 2.3284912109375, 2.419677734375, 2.5108642578125, 2.60205078125, 2.6932373046875, 2.784423828125, 2.8756103515625, 2.966796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 20.0, 18.0, 32.0, 39.0, 58.0, 75.0, 135.0, 191.0, 275.0, 390.0, 577.0, 840.0, 1245.0, 1899.0, 2925.0, 4513.0, 6987.0, 10807.0, 17901.0, 28582.0, 47063.0, 81298.0, 163661.0, 344067.0, 144285.0, 74495.0, 43949.0, 26533.0, 16532.0, 10378.0, 6425.0, 4112.0, 2719.0, 1825.0, 1219.0, 794.0, 520.0, 345.0, 235.0, 203.0, 114.0, 70.0, 63.0, 43.0, 31.0, 17.0, 14.0, 12.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.76318359375, -0.7396469116210938, -0.7161102294921875, -0.6925735473632812, -0.669036865234375, -0.6455001831054688, -0.6219635009765625, -0.5984268188476562, -0.57489013671875, -0.5513534545898438, -0.5278167724609375, -0.5042800903320312, -0.480743408203125, -0.45720672607421875, -0.4336700439453125, -0.41013336181640625, -0.3865966796875, -0.36305999755859375, -0.3395233154296875, -0.31598663330078125, -0.292449951171875, -0.26891326904296875, -0.2453765869140625, -0.22183990478515625, -0.19830322265625, -0.17476654052734375, -0.1512298583984375, -0.12769317626953125, -0.104156494140625, -0.08061981201171875, -0.0570831298828125, -0.03354644775390625, -0.010009765625, 0.01352691650390625, 0.0370635986328125, 0.06060028076171875, 0.084136962890625, 0.10767364501953125, 0.1312103271484375, 0.15474700927734375, 0.17828369140625, 0.20182037353515625, 0.2253570556640625, 0.24889373779296875, 0.272430419921875, 0.29596710205078125, 0.3195037841796875, 0.34304046630859375, 0.3665771484375, 0.39011383056640625, 0.4136505126953125, 0.43718719482421875, 0.460723876953125, 0.48426055908203125, 0.5077972412109375, 0.5313339233398438, 0.55487060546875, 0.5784072875976562, 0.6019439697265625, 0.6254806518554688, 0.649017333984375, 0.6725540161132812, 0.6960906982421875, 0.7196273803710938, 0.7431640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 3.0, 5.0, 7.0, 6.0, 14.0, 2.0, 14.0, 20.0, 16.0, 21.0, 29.0, 39.0, 29.0, 40.0, 42.0, 37.0, 34.0, 39.0, 34.0, 39.0, 1077.0, 56.0, 38.0, 45.0, 51.0, 31.0, 41.0, 36.0, 25.0, 33.0, 23.0, 21.0, 23.0, 11.0, 7.0, 6.0, 6.0, 8.0, 5.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02734375, -1.960723876953125, -1.89410400390625, -1.827484130859375, -1.7608642578125, -1.694244384765625, -1.62762451171875, -1.561004638671875, -1.494384765625, -1.427764892578125, -1.36114501953125, -1.294525146484375, -1.2279052734375, -1.161285400390625, -1.09466552734375, -1.028045654296875, -0.96142578125, -0.894805908203125, -0.82818603515625, -0.761566162109375, -0.6949462890625, -0.628326416015625, -0.56170654296875, -0.495086669921875, -0.428466796875, -0.361846923828125, -0.29522705078125, -0.228607177734375, -0.1619873046875, -0.095367431640625, -0.02874755859375, 0.037872314453125, 0.1044921875, 0.171112060546875, 0.23773193359375, 0.304351806640625, 0.3709716796875, 0.437591552734375, 0.50421142578125, 0.570831298828125, 0.637451171875, 0.704071044921875, 0.77069091796875, 0.837310791015625, 0.9039306640625, 0.970550537109375, 1.03717041015625, 1.103790283203125, 1.17041015625, 1.237030029296875, 1.30364990234375, 1.370269775390625, 1.4368896484375, 1.503509521484375, 1.57012939453125, 1.636749267578125, 1.703369140625, 1.769989013671875, 1.83660888671875, 1.903228759765625, 1.9698486328125, 2.036468505859375, 2.10308837890625, 2.169708251953125, 2.236328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 10.0, 8.0, 4.0, 22.0, 25.0, 37.0, 54.0, 98.0, 117.0, 218.0, 291.0, 464.0, 825.0, 1270.0, 2038.0, 3510.0, 5856.0, 10155.0, 18235.0, 33634.0, 63618.0, 126817.0, 1425827.0, 206385.0, 92010.0, 47253.0, 24876.0, 13732.0, 7836.0, 4604.0, 2702.0, 1700.0, 1046.0, 659.0, 420.0, 248.0, 175.0, 140.0, 58.0, 59.0, 33.0, 22.0, 10.0, 15.0, 9.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9091796875, -0.8822555541992188, -0.8553314208984375, -0.8284072875976562, -0.801483154296875, -0.7745590209960938, -0.7476348876953125, -0.7207107543945312, -0.69378662109375, -0.6668624877929688, -0.6399383544921875, -0.6130142211914062, -0.586090087890625, -0.5591659545898438, -0.5322418212890625, -0.5053176879882812, -0.4783935546875, -0.45146942138671875, -0.4245452880859375, -0.39762115478515625, -0.370697021484375, -0.34377288818359375, -0.3168487548828125, -0.28992462158203125, -0.26300048828125, -0.23607635498046875, -0.2091522216796875, -0.18222808837890625, -0.155303955078125, -0.12837982177734375, -0.1014556884765625, -0.07453155517578125, -0.047607421875, -0.02068328857421875, 0.0062408447265625, 0.03316497802734375, 0.060089111328125, 0.08701324462890625, 0.1139373779296875, 0.14086151123046875, 0.16778564453125, 0.19470977783203125, 0.2216339111328125, 0.24855804443359375, 0.275482177734375, 0.30240631103515625, 0.3293304443359375, 0.35625457763671875, 0.3831787109375, 0.41010284423828125, 0.4370269775390625, 0.46395111083984375, 0.490875244140625, 0.5177993774414062, 0.5447235107421875, 0.5716476440429688, 0.59857177734375, 0.6254959106445312, 0.6524200439453125, 0.6793441772460938, 0.706268310546875, 0.7331924438476562, 0.7601165771484375, 0.7870407104492188, 0.81396484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 8.0, 7.0, 5.0, 3.0, 4.0, 11.0, 15.0, 19.0, 15.0, 33.0, 42.0, 56.0, 66.0, 114.0, 109.0, 110.0, 84.0, 70.0, 29.0, 34.0, 24.0, 26.0, 22.0, 21.0, 15.0, 15.0, 6.0, 9.0, 8.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007166862487792969, -0.0006976425647735596, -0.0006785988807678223, -0.000659555196762085, -0.0006405115127563477, -0.0006214678287506104, -0.000602424144744873, -0.0005833804607391357, -0.0005643367767333984, -0.0005452930927276611, -0.0005262494087219238, -0.0005072057247161865, -0.0004881620407104492, -0.0004691183567047119, -0.0004500746726989746, -0.0004310309886932373, -0.0004119873046875, -0.0003929436206817627, -0.0003738999366760254, -0.0003548562526702881, -0.0003358125686645508, -0.0003167688846588135, -0.00029772520065307617, -0.00027868151664733887, -0.00025963783264160156, -0.00024059414863586426, -0.00022155046463012695, -0.00020250678062438965, -0.00018346309661865234, -0.00016441941261291504, -0.00014537572860717773, -0.00012633204460144043, -0.00010728836059570312, -8.824467658996582e-05, -6.920099258422852e-05, -5.015730857849121e-05, -3.1113624572753906e-05, -1.2069940567016602e-05, 6.973743438720703e-06, 2.6017427444458008e-05, 4.506111145019531e-05, 6.410479545593262e-05, 8.314847946166992e-05, 0.00010219216346740723, 0.00012123584747314453, 0.00014027953147888184, 0.00015932321548461914, 0.00017836689949035645, 0.00019741058349609375, 0.00021645426750183105, 0.00023549795150756836, 0.00025454163551330566, 0.00027358531951904297, 0.0002926290035247803, 0.0003116726875305176, 0.0003307163715362549, 0.0003497600555419922, 0.0003688037395477295, 0.0003878474235534668, 0.0004068911075592041, 0.0004259347915649414, 0.0004449784755706787, 0.000464022159576416, 0.0004830658435821533, 0.0005021095275878906]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 8.0, 8.0, 8.0, 22.0, 18.0, 24.0, 27.0, 40.0, 52.0, 67.0, 97.0, 240.0, 577.0, 6759.0, 1035299.0, 4139.0, 529.0, 272.0, 132.0, 72.0, 45.0, 28.0, 20.0, 12.0, 7.0, 6.0, 9.0, 4.0, 3.0, 8.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0120849609375, -0.011660337448120117, -0.011235713958740234, -0.010811090469360352, -0.010386466979980469, -0.009961843490600586, -0.009537220001220703, -0.00911259651184082, -0.008687973022460938, -0.008263349533081055, -0.007838726043701172, -0.007414102554321289, -0.006989479064941406, -0.0065648555755615234, -0.006140232086181641, -0.005715608596801758, -0.005290985107421875, -0.004866361618041992, -0.004441738128662109, -0.0040171146392822266, -0.0035924911499023438, -0.003167867660522461, -0.002743244171142578, -0.0023186206817626953, -0.0018939971923828125, -0.0014693737030029297, -0.0010447502136230469, -0.0006201267242431641, -0.00019550323486328125, 0.00022912025451660156, 0.0006537437438964844, 0.0010783672332763672, 0.00150299072265625, 0.0019276142120361328, 0.0023522377014160156, 0.0027768611907958984, 0.0032014846801757812, 0.003626108169555664, 0.004050731658935547, 0.00447535514831543, 0.0048999786376953125, 0.005324602127075195, 0.005749225616455078, 0.006173849105834961, 0.006598472595214844, 0.0070230960845947266, 0.007447719573974609, 0.007872343063354492, 0.008296966552734375, 0.008721590042114258, 0.00914621353149414, 0.009570837020874023, 0.009995460510253906, 0.010420083999633789, 0.010844707489013672, 0.011269330978393555, 0.011693954467773438, 0.01211857795715332, 0.012543201446533203, 0.012967824935913086, 0.013392448425292969, 0.013817071914672852, 0.014241695404052734, 0.014666318893432617, 0.0150909423828125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 19.0, 111.0, 353.0, 390.0, 112.0, 27.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006598635809496045, -0.0006233363528735936, -0.0005868090665899217, -0.0005502818385139108, -0.0005137546104378998, -0.00047722735325805843, -0.00044070009607821703, -0.0004041728680022061, -0.0003676456108223647, -0.0003311183536425233, -0.00029459112556651235, -0.00025806386838667095, -0.00022153662575874478, -0.0001850093831308186, -0.0001484821259509772, -0.00011195489787496626, -7.542764069512486e-05, -3.890039442921989e-05, -2.3731481633149087e-06, 3.4154101740568876e-05, 7.068134436849505e-05, 0.00010720858699642122, 0.00014373584417626262, 0.00018026307225227356, 0.00021679032943211496, 0.00025331758661195636, 0.0002898448146879673, 0.0003263720718678087, 0.0003628993290476501, 0.00039942655712366104, 0.00043595381430350244, 0.0004724810423795134, 0.0005090082995593548, 0.0005455355276353657, 0.0005820628139190376, 0.0006185900419950485, 0.0006551172700710595, 0.0006916444981470704, 0.0007281717844307423, 0.0007646990125067532, 0.0008012262405827641, 0.0008377534686587751, 0.000874280754942447, 0.0009108079830184579, 0.0009473352110944688, 0.0009838624391704798, 0.0010203897254541516, 0.0010569170117378235, 0.0010934441816061735, 0.0011299714678898454, 0.0011664986377581954, 0.0012030259240418673, 0.0012395532103255391, 0.0012760803801938891, 0.001312607666477561, 0.001349134836345911, 0.0013856622390449047, 0.0014221895253285766, 0.0014587166951969266, 0.0014952439814805984, 0.0015317712677642703, 0.0015682984376326203, 0.0016048257239162922, 0.0016413528937846422, 0.001677880180068314]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 2.0, 8.0, 7.0, 10.0, 17.0, 11.0, 9.0, 13.0, 15.0, 22.0, 24.0, 31.0, 34.0, 24.0, 35.0, 30.0, 33.0, 28.0, 32.0, 31.0, 34.0, 26.0, 44.0, 33.0, 38.0, 41.0, 39.0, 27.0, 29.0, 23.0, 36.0, 24.0, 23.0, 27.0, 18.0, 12.0, 19.0, 14.0, 6.0, 8.0, 8.0, 11.0, 10.0, 4.0, 10.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002008676528930664, -0.00019372627139091492, -0.00018658488988876343, -0.00017944350838661194, -0.00017230212688446045, -0.00016516074538230896, -0.00015801936388015747, -0.00015087798237800598, -0.0001437366008758545, -0.000136595219373703, -0.00012945383787155151, -0.00012231245636940002, -0.00011517107486724854, -0.00010802969336509705, -0.00010088831186294556, -9.374693036079407e-05, -8.660554885864258e-05, -7.946416735649109e-05, -7.23227858543396e-05, -6.518140435218811e-05, -5.804002285003662e-05, -5.089864134788513e-05, -4.375725984573364e-05, -3.661587834358215e-05, -2.9474496841430664e-05, -2.2333115339279175e-05, -1.5191733837127686e-05, -8.050352334976196e-06, -9.08970832824707e-07, 6.232410669326782e-06, 1.3373792171478271e-05, 2.051517367362976e-05, 2.765655517578125e-05, 3.479793667793274e-05, 4.193931818008423e-05, 4.908069968223572e-05, 5.622208118438721e-05, 6.33634626865387e-05, 7.050484418869019e-05, 7.764622569084167e-05, 8.478760719299316e-05, 9.192898869514465e-05, 9.907037019729614e-05, 0.00010621175169944763, 0.00011335313320159912, 0.00012049451470375061, 0.0001276358962059021, 0.0001347772777080536, 0.00014191865921020508, 0.00014906004071235657, 0.00015620142221450806, 0.00016334280371665955, 0.00017048418521881104, 0.00017762556672096252, 0.00018476694822311401, 0.0001919083297252655, 0.000199049711227417, 0.00020619109272956848, 0.00021333247423171997, 0.00022047385573387146, 0.00022761523723602295, 0.00023475661873817444, 0.00024189800024032593, 0.0002490393817424774, 0.0002561807632446289]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 8.0, 5.0, 10.0, 11.0, 15.0, 21.0, 22.0, 16.0, 21.0, 32.0, 34.0, 26.0, 36.0, 34.0, 29.0, 33.0, 37.0, 36.0, 40.0, 45.0, 44.0, 37.0, 37.0, 32.0, 38.0, 33.0, 30.0, 25.0, 28.0, 21.0, 21.0, 15.0, 14.0, 23.0, 23.0, 9.0, 11.0, 11.0, 5.0, 8.0, 5.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.869140625, -2.7779541015625, -2.686767578125, -2.5955810546875, -2.50439453125, -2.4132080078125, -2.322021484375, -2.2308349609375, -2.1396484375, -2.0484619140625, -1.957275390625, -1.8660888671875, -1.77490234375, -1.6837158203125, -1.592529296875, -1.5013427734375, -1.41015625, -1.3189697265625, -1.227783203125, -1.1365966796875, -1.04541015625, -0.9542236328125, -0.863037109375, -0.7718505859375, -0.6806640625, -0.5894775390625, -0.498291015625, -0.4071044921875, -0.31591796875, -0.2247314453125, -0.133544921875, -0.0423583984375, 0.048828125, 0.1400146484375, 0.231201171875, 0.3223876953125, 0.41357421875, 0.5047607421875, 0.595947265625, 0.6871337890625, 0.7783203125, 0.8695068359375, 0.960693359375, 1.0518798828125, 1.14306640625, 1.2342529296875, 1.325439453125, 1.4166259765625, 1.5078125, 1.5989990234375, 1.690185546875, 1.7813720703125, 1.87255859375, 1.9637451171875, 2.054931640625, 2.1461181640625, 2.2373046875, 2.3284912109375, 2.419677734375, 2.5108642578125, 2.60205078125, 2.6932373046875, 2.784423828125, 2.8756103515625, 2.966796875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 6.0, 10.0, 28.0, 27.0, 45.0, 73.0, 122.0, 187.0, 305.0, 553.0, 989.0, 1892.0, 3595.0, 7094.0, 14642.0, 32520.0, 83745.0, 239450.0, 383511.0, 171083.0, 60620.0, 24667.0, 11464.0, 5538.0, 2790.0, 1511.0, 846.0, 462.0, 258.0, 182.0, 98.0, 64.0, 36.0, 32.0, 15.0, 16.0, 8.0, 12.0, 7.0, 11.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.224609375, -3.1217041015625, -3.018798828125, -2.9158935546875, -2.81298828125, -2.7100830078125, -2.607177734375, -2.5042724609375, -2.4013671875, -2.2984619140625, -2.195556640625, -2.0926513671875, -1.98974609375, -1.8868408203125, -1.783935546875, -1.6810302734375, -1.578125, -1.4752197265625, -1.372314453125, -1.2694091796875, -1.16650390625, -1.0635986328125, -0.960693359375, -0.8577880859375, -0.7548828125, -0.6519775390625, -0.549072265625, -0.4461669921875, -0.34326171875, -0.2403564453125, -0.137451171875, -0.0345458984375, 0.068359375, 0.1712646484375, 0.274169921875, 0.3770751953125, 0.47998046875, 0.5828857421875, 0.685791015625, 0.7886962890625, 0.8916015625, 0.9945068359375, 1.097412109375, 1.2003173828125, 1.30322265625, 1.4061279296875, 1.509033203125, 1.6119384765625, 1.71484375, 1.8177490234375, 1.920654296875, 2.0235595703125, 2.12646484375, 2.2293701171875, 2.332275390625, 2.4351806640625, 2.5380859375, 2.6409912109375, 2.743896484375, 2.8468017578125, 2.94970703125, 3.0526123046875, 3.155517578125, 3.2584228515625, 3.361328125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 7.0, 8.0, 16.0, 12.0, 23.0, 20.0, 29.0, 20.0, 36.0, 33.0, 35.0, 43.0, 58.0, 72.0, 111.0, 259.0, 1506.0, 206.0, 110.0, 61.0, 58.0, 39.0, 42.0, 38.0, 34.0, 40.0, 16.0, 24.0, 12.0, 19.0, 7.0, 13.0, 11.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.3828125, -12.0106201171875, -11.638427734375, -11.2662353515625, -10.89404296875, -10.5218505859375, -10.149658203125, -9.7774658203125, -9.4052734375, -9.0330810546875, -8.660888671875, -8.2886962890625, -7.91650390625, -7.5443115234375, -7.172119140625, -6.7999267578125, -6.427734375, -6.0555419921875, -5.683349609375, -5.3111572265625, -4.93896484375, -4.5667724609375, -4.194580078125, -3.8223876953125, -3.4501953125, -3.0780029296875, -2.705810546875, -2.3336181640625, -1.96142578125, -1.5892333984375, -1.217041015625, -0.8448486328125, -0.47265625, -0.1004638671875, 0.271728515625, 0.6439208984375, 1.01611328125, 1.3883056640625, 1.760498046875, 2.1326904296875, 2.5048828125, 2.8770751953125, 3.249267578125, 3.6214599609375, 3.99365234375, 4.3658447265625, 4.738037109375, 5.1102294921875, 5.482421875, 5.8546142578125, 6.226806640625, 6.5989990234375, 6.97119140625, 7.3433837890625, 7.715576171875, 8.0877685546875, 8.4599609375, 8.8321533203125, 9.204345703125, 9.5765380859375, 9.94873046875, 10.3209228515625, 10.693115234375, 11.0653076171875, 11.4375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 5.0, 15.0, 20.0, 26.0, 29.0, 53.0, 71.0, 124.0, 181.0, 291.0, 677.0, 4312.0, 2992285.0, 144846.0, 1681.0, 412.0, 236.0, 147.0, 75.0, 69.0, 37.0, 39.0, 17.0, 13.0, 8.0, 4.0, 5.0, 10.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.28125, -40.060546875, -38.83984375, -37.619140625, -36.3984375, -35.177734375, -33.95703125, -32.736328125, -31.515625, -30.294921875, -29.07421875, -27.853515625, -26.6328125, -25.412109375, -24.19140625, -22.970703125, -21.75, -20.529296875, -19.30859375, -18.087890625, -16.8671875, -15.646484375, -14.42578125, -13.205078125, -11.984375, -10.763671875, -9.54296875, -8.322265625, -7.1015625, -5.880859375, -4.66015625, -3.439453125, -2.21875, -0.998046875, 0.22265625, 1.443359375, 2.6640625, 3.884765625, 5.10546875, 6.326171875, 7.546875, 8.767578125, 9.98828125, 11.208984375, 12.4296875, 13.650390625, 14.87109375, 16.091796875, 17.3125, 18.533203125, 19.75390625, 20.974609375, 22.1953125, 23.416015625, 24.63671875, 25.857421875, 27.078125, 28.298828125, 29.51953125, 30.740234375, 31.9609375, 33.181640625, 34.40234375, 35.623046875, 36.84375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 1004.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.31707763671875, -92.31100463867188, -84.304931640625, -76.29886627197266, -68.29279327392578, -60.286720275878906, -52.2806510925293, -44.27458190917969, -36.26850891113281, -28.26243782043457, -20.256366729736328, -12.250295639038086, -4.244224548339844, 3.7618484497070312, 11.76791763305664, 19.77398681640625, 27.780059814453125, 35.7861328125, 43.79220199584961, 51.79827117919922, 59.804344177246094, 67.81041717529297, 75.81648254394531, 83.82255554199219, 91.82862854003906, 99.83470153808594, 107.84077453613281, 115.84683990478516, 123.85291290283203, 131.85897827148438, 139.86505126953125, 147.87112426757812, 155.87716674804688, 163.88323974609375, 171.88931274414062, 179.8953857421875, 187.90145874023438, 195.90753173828125, 203.91358947753906, 211.91966247558594, 219.9257354736328, 227.9318084716797, 235.93788146972656, 243.94395446777344, 251.95001220703125, 259.9560852050781, 267.962158203125, 275.9682312011719, 283.97430419921875, 291.9803771972656, 299.9864501953125, 307.9925231933594, 315.99859619140625, 324.0046691894531, 332.0107421875, 340.01678466796875, 348.02288818359375, 356.0289611816406, 364.0350341796875, 372.0411071777344, 380.04718017578125, 388.0532531738281, 396.059326171875, 404.06536865234375, 412.0714416503906]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 9.0, 8.0, 8.0, 10.0, 18.0, 15.0, 28.0, 20.0, 28.0, 23.0, 33.0, 15.0, 34.0, 34.0, 32.0, 43.0, 37.0, 52.0, 37.0, 48.0, 45.0, 40.0, 42.0, 40.0, 45.0, 31.0, 42.0, 32.0, 30.0, 16.0, 16.0, 15.0, 11.0, 11.0, 10.0, 8.0, 11.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.759153366088867, -22.88620376586914, -22.01325225830078, -21.140300750732422, -20.267351150512695, -19.39440155029297, -18.52145004272461, -17.64849853515625, -16.775548934936523, -15.90259838104248, -15.029647827148438, -14.156697273254395, -13.283746719360352, -12.410796165466309, -11.537845611572266, -10.664895057678223, -9.79194450378418, -8.918993949890137, -8.046043395996094, -7.173092842102051, -6.300142288208008, -5.427191734313965, -4.554241180419922, -3.681290626525879, -2.808340072631836, -1.935389518737793, -1.06243896484375, -0.18948841094970703, 0.6834621429443359, 1.556412696838379, 2.429363250732422, 3.302313804626465, 4.175266265869141, 5.048216819763184, 5.921167373657227, 6.7941179275512695, 7.6670684814453125, 8.540019035339355, 9.412969589233398, 10.285920143127441, 11.158870697021484, 12.031821250915527, 12.90477180480957, 13.777722358703613, 14.650672912597656, 15.5236234664917, 16.396574020385742, 17.26952362060547, 18.142475128173828, 19.015426635742188, 19.888376235961914, 20.76132583618164, 21.63427734375, 22.50722885131836, 23.380178451538086, 24.253128051757812, 25.126079559326172, 25.99903106689453, 26.871980667114258, 27.744930267333984, 28.617881774902344, 29.490833282470703, 30.36378288269043, 31.236732482910156, 32.109683990478516]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 7.0, 12.0, 14.0, 6.0, 20.0, 14.0, 26.0, 18.0, 29.0, 37.0, 23.0, 33.0, 41.0, 32.0, 27.0, 38.0, 38.0, 35.0, 44.0, 49.0, 36.0, 33.0, 38.0, 41.0, 30.0, 30.0, 30.0, 28.0, 20.0, 16.0, 16.0, 22.0, 19.0, 21.0, 13.0, 13.0, 3.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.09375, -2.9964599609375, -2.899169921875, -2.8018798828125, -2.70458984375, -2.6072998046875, -2.510009765625, -2.4127197265625, -2.3154296875, -2.2181396484375, -2.120849609375, -2.0235595703125, -1.92626953125, -1.8289794921875, -1.731689453125, -1.6343994140625, -1.537109375, -1.4398193359375, -1.342529296875, -1.2452392578125, -1.14794921875, -1.0506591796875, -0.953369140625, -0.8560791015625, -0.7587890625, -0.6614990234375, -0.564208984375, -0.4669189453125, -0.36962890625, -0.2723388671875, -0.175048828125, -0.0777587890625, 0.01953125, 0.1168212890625, 0.214111328125, 0.3114013671875, 0.40869140625, 0.5059814453125, 0.603271484375, 0.7005615234375, 0.7978515625, 0.8951416015625, 0.992431640625, 1.0897216796875, 1.18701171875, 1.2843017578125, 1.381591796875, 1.4788818359375, 1.576171875, 1.6734619140625, 1.770751953125, 1.8680419921875, 1.96533203125, 2.0626220703125, 2.159912109375, 2.2572021484375, 2.3544921875, 2.4517822265625, 2.549072265625, 2.6463623046875, 2.74365234375, 2.8409423828125, 2.938232421875, 3.0355224609375, 3.1328125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 9.0, 3.0, 17.0, 18.0, 17.0, 22.0, 23.0, 22.0, 37.0, 50.0, 59.0, 72.0, 81.0, 140.0, 154.0, 312.0, 1161.0, 19430.0, 1916710.0, 2229700.0, 23822.0, 1325.0, 355.0, 174.0, 110.0, 91.0, 68.0, 50.0, 41.0, 32.0, 37.0, 18.0, 21.0, 20.0, 15.0, 14.0, 11.0, 2.0, 7.0, 8.0, 5.0, 2.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.6171875, -15.1295166015625, -14.641845703125, -14.1541748046875, -13.66650390625, -13.1788330078125, -12.691162109375, -12.2034912109375, -11.7158203125, -11.2281494140625, -10.740478515625, -10.2528076171875, -9.76513671875, -9.2774658203125, -8.789794921875, -8.3021240234375, -7.814453125, -7.3267822265625, -6.839111328125, -6.3514404296875, -5.86376953125, -5.3760986328125, -4.888427734375, -4.4007568359375, -3.9130859375, -3.4254150390625, -2.937744140625, -2.4500732421875, -1.96240234375, -1.4747314453125, -0.987060546875, -0.4993896484375, -0.01171875, 0.4759521484375, 0.963623046875, 1.4512939453125, 1.93896484375, 2.4266357421875, 2.914306640625, 3.4019775390625, 3.8896484375, 4.3773193359375, 4.864990234375, 5.3526611328125, 5.84033203125, 6.3280029296875, 6.815673828125, 7.3033447265625, 7.791015625, 8.2786865234375, 8.766357421875, 9.2540283203125, 9.74169921875, 10.2293701171875, 10.717041015625, 11.2047119140625, 11.6923828125, 12.1800537109375, 12.667724609375, 13.1553955078125, 13.64306640625, 14.1307373046875, 14.618408203125, 15.1060791015625, 15.59375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 11.0, 13.0, 7.0, 21.0, 59.0, 66.0, 105.0, 181.0, 255.0, 386.0, 555.0, 616.0, 591.0, 422.0, 282.0, 176.0, 116.0, 80.0, 43.0, 36.0, 16.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.67010498046875, -14.3167724609375, -13.96343994140625, -13.610107421875, -13.25677490234375, -12.9034423828125, -12.55010986328125, -12.19677734375, -11.84344482421875, -11.4901123046875, -11.13677978515625, -10.783447265625, -10.43011474609375, -10.0767822265625, -9.72344970703125, -9.3701171875, -9.01678466796875, -8.6634521484375, -8.31011962890625, -7.956787109375, -7.60345458984375, -7.2501220703125, -6.89678955078125, -6.54345703125, -6.19012451171875, -5.8367919921875, -5.48345947265625, -5.130126953125, -4.77679443359375, -4.4234619140625, -4.07012939453125, -3.716796875, -3.36346435546875, -3.0101318359375, -2.65679931640625, -2.303466796875, -1.95013427734375, -1.5968017578125, -1.24346923828125, -0.89013671875, -0.53680419921875, -0.1834716796875, 0.16986083984375, 0.523193359375, 0.87652587890625, 1.2298583984375, 1.58319091796875, 1.9365234375, 2.28985595703125, 2.6431884765625, 2.99652099609375, 3.349853515625, 3.70318603515625, 4.0565185546875, 4.40985107421875, 4.76318359375, 5.11651611328125, 5.4698486328125, 5.82318115234375, 6.176513671875, 6.52984619140625, 6.8831787109375, 7.23651123046875, 7.58984375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 16.0, 29.0, 32.0, 42.0, 72.0, 105.0, 169.0, 256.0, 403.0, 872.0, 4598.0, 976240.0, 3199167.0, 10087.0, 1000.0, 419.0, 267.0, 162.0, 110.0, 80.0, 45.0, 35.0, 23.0, 16.0, 12.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.578125, -22.511962890625, -21.44580078125, -20.379638671875, -19.3134765625, -18.247314453125, -17.18115234375, -16.114990234375, -15.048828125, -13.982666015625, -12.91650390625, -11.850341796875, -10.7841796875, -9.718017578125, -8.65185546875, -7.585693359375, -6.51953125, -5.453369140625, -4.38720703125, -3.321044921875, -2.2548828125, -1.188720703125, -0.12255859375, 0.943603515625, 2.009765625, 3.075927734375, 4.14208984375, 5.208251953125, 6.2744140625, 7.340576171875, 8.40673828125, 9.472900390625, 10.5390625, 11.605224609375, 12.67138671875, 13.737548828125, 14.8037109375, 15.869873046875, 16.93603515625, 18.002197265625, 19.068359375, 20.134521484375, 21.20068359375, 22.266845703125, 23.3330078125, 24.399169921875, 25.46533203125, 26.531494140625, 27.59765625, 28.663818359375, 29.72998046875, 30.796142578125, 31.8623046875, 32.928466796875, 33.99462890625, 35.060791015625, 36.126953125, 37.193115234375, 38.25927734375, 39.325439453125, 40.3916015625, 41.457763671875, 42.52392578125, 43.590087890625, 44.65625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 21.0, 52.0, 102.0, 144.0, 161.0, 171.0, 147.0, 103.0, 54.0, 23.0, 12.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.486167907714844, -43.67652893066406, -41.86688995361328, -40.057247161865234, -38.24760818481445, -36.43796920776367, -34.628326416015625, -32.818687438964844, -31.009048461914062, -29.19940948486328, -27.389768600463867, -25.580127716064453, -23.770488739013672, -21.96084976196289, -20.151208877563477, -18.341567993164062, -16.53192901611328, -14.722289085388184, -12.912649154663086, -11.103009223937988, -9.29336929321289, -7.483729362487793, -5.674089431762695, -3.8644495010375977, -2.0548095703125, -0.24516963958740234, 1.5644702911376953, 3.374110221862793, 5.183750152587891, 6.993390083312988, 8.803030014038086, 10.612669944763184, 12.422309875488281, 14.231949806213379, 16.041589736938477, 17.85123062133789, 19.660869598388672, 21.470508575439453, 23.280149459838867, 25.08979034423828, 26.899429321289062, 28.709068298339844, 30.518709182739258, 32.32835006713867, 34.13798904418945, 35.947628021240234, 37.75727081298828, 39.56690979003906, 41.376548767089844, 43.186187744140625, 44.995826721191406, 46.80546951293945, 48.615108489990234, 50.424747467041016, 52.23439025878906, 54.044029235839844, 55.853668212890625, 57.663307189941406, 59.47294616699219, 61.282588958740234, 63.092227935791016, 64.90187072753906, 66.71150970458984, 68.52114868164062, 70.3307876586914]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 10.0, 16.0, 11.0, 20.0, 22.0, 16.0, 18.0, 20.0, 26.0, 33.0, 19.0, 28.0, 26.0, 43.0, 38.0, 45.0, 46.0, 35.0, 36.0, 47.0, 39.0, 31.0, 38.0, 38.0, 27.0, 38.0, 28.0, 25.0, 35.0, 25.0, 13.0, 18.0, 10.0, 14.0, 8.0, 15.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.277694702148438, -25.503896713256836, -24.730098724365234, -23.956302642822266, -23.182504653930664, -22.408706665039062, -21.634910583496094, -20.861112594604492, -20.08731460571289, -19.31351661682129, -18.539718627929688, -17.76592254638672, -16.992124557495117, -16.218326568603516, -15.44452953338623, -14.670732498168945, -13.896934509277344, -13.123136520385742, -12.349339485168457, -11.575542449951172, -10.80174446105957, -10.027946472167969, -9.254149436950684, -8.480352401733398, -7.706554412841797, -6.9327569007873535, -6.15895938873291, -5.385161876678467, -4.611364364624023, -3.83756685256958, -3.0637693405151367, -2.2899718284606934, -1.51617431640625, -0.7423768043518066, 0.03142070770263672, 0.8052182197570801, 1.5790157318115234, 2.352813243865967, 3.12661075592041, 3.9004082679748535, 4.674205780029297, 5.44800329208374, 6.221800804138184, 6.995598316192627, 7.76939582824707, 8.543193817138672, 9.316990852355957, 10.090787887573242, 10.864585876464844, 11.638383865356445, 12.41218090057373, 13.185977935791016, 13.959775924682617, 14.733573913574219, 15.507370948791504, 16.28116798400879, 17.05496597290039, 17.828763961791992, 18.602561950683594, 19.376358032226562, 20.150156021118164, 20.923954010009766, 21.697750091552734, 22.471548080444336, 23.245346069335938]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 10.0, 7.0, 20.0, 11.0, 24.0, 31.0, 29.0, 25.0, 33.0, 38.0, 25.0, 32.0, 31.0, 30.0, 40.0, 41.0, 49.0, 39.0, 45.0, 59.0, 31.0, 36.0, 33.0, 24.0, 31.0, 17.0, 24.0, 22.0, 21.0, 22.0, 17.0, 16.0, 10.0, 12.0, 6.0, 7.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.259765625, -3.160186767578125, -3.06060791015625, -2.961029052734375, -2.8614501953125, -2.761871337890625, -2.66229248046875, -2.562713623046875, -2.463134765625, -2.363555908203125, -2.26397705078125, -2.164398193359375, -2.0648193359375, -1.965240478515625, -1.86566162109375, -1.766082763671875, -1.66650390625, -1.566925048828125, -1.46734619140625, -1.367767333984375, -1.2681884765625, -1.168609619140625, -1.06903076171875, -0.969451904296875, -0.869873046875, -0.770294189453125, -0.67071533203125, -0.571136474609375, -0.4715576171875, -0.371978759765625, -0.27239990234375, -0.172821044921875, -0.0732421875, 0.026336669921875, 0.12591552734375, 0.225494384765625, 0.3250732421875, 0.424652099609375, 0.52423095703125, 0.623809814453125, 0.723388671875, 0.822967529296875, 0.92254638671875, 1.022125244140625, 1.1217041015625, 1.221282958984375, 1.32086181640625, 1.420440673828125, 1.52001953125, 1.619598388671875, 1.71917724609375, 1.818756103515625, 1.9183349609375, 2.017913818359375, 2.11749267578125, 2.217071533203125, 2.316650390625, 2.416229248046875, 2.51580810546875, 2.615386962890625, 2.7149658203125, 2.814544677734375, 2.91412353515625, 3.013702392578125, 3.11328125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 10.0, 19.0, 25.0, 38.0, 54.0, 83.0, 121.0, 155.0, 256.0, 383.0, 551.0, 865.0, 1244.0, 1921.0, 2891.0, 4335.0, 6737.0, 10548.0, 16153.0, 25280.0, 40024.0, 64173.0, 110888.0, 300590.0, 210070.0, 95574.0, 56599.0, 35001.0, 22477.0, 14367.0, 9194.0, 6018.0, 3994.0, 2618.0, 1746.0, 1150.0, 822.0, 515.0, 309.0, 231.0, 180.0, 121.0, 64.0, 56.0, 34.0, 22.0, 13.0, 13.0, 11.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.72216796875, -0.6995086669921875, -0.676849365234375, -0.6541900634765625, -0.63153076171875, -0.6088714599609375, -0.586212158203125, -0.5635528564453125, -0.5408935546875, -0.5182342529296875, -0.495574951171875, -0.4729156494140625, -0.45025634765625, -0.4275970458984375, -0.404937744140625, -0.3822784423828125, -0.359619140625, -0.3369598388671875, -0.314300537109375, -0.2916412353515625, -0.26898193359375, -0.2463226318359375, -0.223663330078125, -0.2010040283203125, -0.1783447265625, -0.1556854248046875, -0.133026123046875, -0.1103668212890625, -0.08770751953125, -0.0650482177734375, -0.042388916015625, -0.0197296142578125, 0.0029296875, 0.0255889892578125, 0.048248291015625, 0.0709075927734375, 0.09356689453125, 0.1162261962890625, 0.138885498046875, 0.1615447998046875, 0.1842041015625, 0.2068634033203125, 0.229522705078125, 0.2521820068359375, 0.27484130859375, 0.2975006103515625, 0.320159912109375, 0.3428192138671875, 0.365478515625, 0.3881378173828125, 0.410797119140625, 0.4334564208984375, 0.45611572265625, 0.4787750244140625, 0.501434326171875, 0.5240936279296875, 0.5467529296875, 0.5694122314453125, 0.592071533203125, 0.6147308349609375, 0.63739013671875, 0.6600494384765625, 0.682708740234375, 0.7053680419921875, 0.72802734375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 4.0, 6.0, 3.0, 13.0, 10.0, 19.0, 17.0, 13.0, 11.0, 20.0, 29.0, 27.0, 29.0, 34.0, 27.0, 46.0, 43.0, 36.0, 42.0, 36.0, 1069.0, 48.0, 33.0, 39.0, 42.0, 36.0, 35.0, 30.0, 37.0, 20.0, 21.0, 18.0, 19.0, 18.0, 19.0, 16.0, 11.0, 10.0, 7.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.125, -2.05877685546875, -1.9925537109375, -1.92633056640625, -1.860107421875, -1.79388427734375, -1.7276611328125, -1.66143798828125, -1.59521484375, -1.52899169921875, -1.4627685546875, -1.39654541015625, -1.330322265625, -1.26409912109375, -1.1978759765625, -1.13165283203125, -1.0654296875, -0.99920654296875, -0.9329833984375, -0.86676025390625, -0.800537109375, -0.73431396484375, -0.6680908203125, -0.60186767578125, -0.53564453125, -0.46942138671875, -0.4031982421875, -0.33697509765625, -0.270751953125, -0.20452880859375, -0.1383056640625, -0.07208251953125, -0.005859375, 0.06036376953125, 0.1265869140625, 0.19281005859375, 0.259033203125, 0.32525634765625, 0.3914794921875, 0.45770263671875, 0.52392578125, 0.59014892578125, 0.6563720703125, 0.72259521484375, 0.788818359375, 0.85504150390625, 0.9212646484375, 0.98748779296875, 1.0537109375, 1.11993408203125, 1.1861572265625, 1.25238037109375, 1.318603515625, 1.38482666015625, 1.4510498046875, 1.51727294921875, 1.58349609375, 1.64971923828125, 1.7159423828125, 1.78216552734375, 1.848388671875, 1.91461181640625, 1.9808349609375, 2.04705810546875, 2.11328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 12.0, 16.0, 23.0, 33.0, 40.0, 67.0, 115.0, 156.0, 259.0, 377.0, 600.0, 907.0, 1465.0, 2262.0, 3724.0, 6058.0, 9856.0, 16957.0, 28891.0, 51405.0, 96331.0, 230170.0, 1385948.0, 117494.0, 60559.0, 33564.0, 19676.0, 11589.0, 7218.0, 4342.0, 2606.0, 1655.0, 1010.0, 617.0, 388.0, 245.0, 161.0, 125.0, 70.0, 42.0, 39.0, 18.0, 11.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8798828125, -0.852508544921875, -0.82513427734375, -0.797760009765625, -0.7703857421875, -0.743011474609375, -0.71563720703125, -0.688262939453125, -0.660888671875, -0.633514404296875, -0.60614013671875, -0.578765869140625, -0.5513916015625, -0.524017333984375, -0.49664306640625, -0.469268798828125, -0.44189453125, -0.414520263671875, -0.38714599609375, -0.359771728515625, -0.3323974609375, -0.305023193359375, -0.27764892578125, -0.250274658203125, -0.222900390625, -0.195526123046875, -0.16815185546875, -0.140777587890625, -0.1134033203125, -0.086029052734375, -0.05865478515625, -0.031280517578125, -0.00390625, 0.023468017578125, 0.05084228515625, 0.078216552734375, 0.1055908203125, 0.132965087890625, 0.16033935546875, 0.187713623046875, 0.215087890625, 0.242462158203125, 0.26983642578125, 0.297210693359375, 0.3245849609375, 0.351959228515625, 0.37933349609375, 0.406707763671875, 0.43408203125, 0.461456298828125, 0.48883056640625, 0.516204833984375, 0.5435791015625, 0.570953369140625, 0.59832763671875, 0.625701904296875, 0.653076171875, 0.680450439453125, 0.70782470703125, 0.735198974609375, 0.7625732421875, 0.789947509765625, 0.81732177734375, 0.844696044921875, 0.8720703125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 6.0, 11.0, 22.0, 13.0, 19.0, 24.0, 34.0, 49.0, 76.0, 105.0, 123.0, 124.0, 99.0, 60.0, 53.0, 26.0, 21.0, 13.0, 14.0, 10.0, 8.0, 10.0, 4.0, 7.0, 7.0, 4.0, 2.0, 3.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007624626159667969, -0.0007386058568954468, -0.0007147490978240967, -0.0006908923387527466, -0.0006670355796813965, -0.0006431788206100464, -0.0006193220615386963, -0.0005954653024673462, -0.0005716085433959961, -0.000547751784324646, -0.0005238950252532959, -0.0005000382661819458, -0.0004761815071105957, -0.0004523247480392456, -0.0004284679889678955, -0.0004046112298965454, -0.0003807544708251953, -0.0003568977117538452, -0.0003330409526824951, -0.000309184193611145, -0.0002853274345397949, -0.0002614706754684448, -0.00023761391639709473, -0.00021375715732574463, -0.00018990039825439453, -0.00016604363918304443, -0.00014218688011169434, -0.00011833012104034424, -9.447336196899414e-05, -7.061660289764404e-05, -4.6759843826293945e-05, -2.2903084754943848e-05, 9.5367431640625e-07, 2.4810433387756348e-05, 4.8667192459106445e-05, 7.252395153045654e-05, 9.638071060180664e-05, 0.00012023746967315674, 0.00014409422874450684, 0.00016795098781585693, 0.00019180774688720703, 0.00021566450595855713, 0.00023952126502990723, 0.0002633780241012573, 0.0002872347831726074, 0.0003110915422439575, 0.0003349483013153076, 0.0003588050603866577, 0.0003826618194580078, 0.0004065185785293579, 0.000430375337600708, 0.0004542320966720581, 0.0004780888557434082, 0.0005019456148147583, 0.0005258023738861084, 0.0005496591329574585, 0.0005735158920288086, 0.0005973726511001587, 0.0006212294101715088, 0.0006450861692428589, 0.000668942928314209, 0.0006927996873855591, 0.0007166564464569092, 0.0007405132055282593, 0.0007643699645996094]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 1.0, 2.0, 4.0, 10.0, 11.0, 6.0, 7.0, 28.0, 14.0, 31.0, 39.0, 50.0, 89.0, 168.0, 311.0, 757.0, 42285.0, 1001775.0, 1915.0, 395.0, 235.0, 132.0, 74.0, 52.0, 40.0, 24.0, 25.0, 15.0, 7.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0153045654296875, -0.014814615249633789, -0.014324665069580078, -0.013834714889526367, -0.013344764709472656, -0.012854814529418945, -0.012364864349365234, -0.011874914169311523, -0.011384963989257812, -0.010895013809204102, -0.01040506362915039, -0.00991511344909668, -0.009425163269042969, -0.008935213088989258, -0.008445262908935547, -0.007955312728881836, -0.007465362548828125, -0.006975412368774414, -0.006485462188720703, -0.005995512008666992, -0.005505561828613281, -0.00501561164855957, -0.004525661468505859, -0.0040357112884521484, -0.0035457611083984375, -0.0030558109283447266, -0.0025658607482910156, -0.0020759105682373047, -0.0015859603881835938, -0.0010960102081298828, -0.0006060600280761719, -0.00011610984802246094, 0.00037384033203125, 0.0008637905120849609, 0.0013537406921386719, 0.0018436908721923828, 0.0023336410522460938, 0.0028235912322998047, 0.0033135414123535156, 0.0038034915924072266, 0.0042934417724609375, 0.0047833919525146484, 0.005273342132568359, 0.00576329231262207, 0.006253242492675781, 0.006743192672729492, 0.007233142852783203, 0.007723093032836914, 0.008213043212890625, 0.008702993392944336, 0.009192943572998047, 0.009682893753051758, 0.010172843933105469, 0.01066279411315918, 0.01115274429321289, 0.011642694473266602, 0.012132644653320312, 0.012622594833374023, 0.013112545013427734, 0.013602495193481445, 0.014092445373535156, 0.014582395553588867, 0.015072345733642578, 0.015562295913696289, 0.01605224609375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 80.0, 432.0, 405.0, 82.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002764529548585415, -0.002709224121645093, -0.002653918694704771, -0.0025986130349338055, -0.0025433076079934835, -0.0024880021810531616, -0.0024326967541128397, -0.002377391094341874, -0.002322085667401552, -0.0022667802404612303, -0.0022114748135209084, -0.0021561691537499428, -0.002100863726809621, -0.002045558299869299, -0.001990252872928977, -0.0019349473295733333, -0.0018796417862176895, -0.0018243363592773676, -0.0017690308159217238, -0.001713725388981402, -0.0016584198456257582, -0.0016031144186854362, -0.0015478088753297925, -0.0014925034483894706, -0.0014371980214491487, -0.0013818925945088267, -0.001326587051153183, -0.001271281624212861, -0.0012159760808572173, -0.0011606706539168954, -0.0011053651105612516, -0.0010500596836209297, -0.0009947542566806078, -0.000939448771532625, -0.0008841432863846421, -0.0008288378012366593, -0.0007735323160886765, -0.0007182268891483545, -0.0006629213457927108, -0.0006076159188523889, -0.0005523103754967451, -0.0004970048903487623, -0.00044169940520077944, -0.0003863939200527966, -0.00033108843490481377, -0.0002757829788606614, -0.00022047749371267855, -0.00016517200856469572, -0.00010986649431288242, -5.4561012802878395e-05, 7.44468707125634e-07, 5.6049946579150856e-05, 0.00011135543172713369, 0.0001666609023232013, 0.00022196638747118413, 0.00027727187261916697, 0.0003325773577671498, 0.00038788284291513264, 0.0004431883280631155, 0.0004984937841072679, 0.0005537992692552507, 0.0006091047544032335, 0.0006644102395512164, 0.0007197157246991992, 0.000775021209847182]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 7.0, 8.0, 8.0, 10.0, 17.0, 17.0, 15.0, 15.0, 20.0, 23.0, 21.0, 34.0, 37.0, 43.0, 35.0, 27.0, 43.0, 43.0, 36.0, 41.0, 30.0, 30.0, 28.0, 39.0, 34.0, 41.0, 28.0, 39.0, 27.0, 18.0, 30.0, 27.0, 19.0, 11.0, 11.0, 12.0, 8.0, 7.0, 9.0, 7.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.0003108978271484375, -0.000300760380923748, -0.00029062293469905853, -0.00028048548847436905, -0.00027034804224967957, -0.0002602105960249901, -0.0002500731498003006, -0.00023993570357561111, -0.00022979825735092163, -0.00021966081112623215, -0.00020952336490154266, -0.00019938591867685318, -0.0001892484724521637, -0.0001791110262274742, -0.00016897358000278473, -0.00015883613377809525, -0.00014869868755340576, -0.00013856124132871628, -0.0001284237951040268, -0.00011828634887933731, -0.00010814890265464783, -9.801145642995834e-05, -8.787401020526886e-05, -7.773656398057938e-05, -6.759911775588989e-05, -5.746167153120041e-05, -4.7324225306510925e-05, -3.718677908182144e-05, -2.7049332857131958e-05, -1.6911886632442474e-05, -6.774440407752991e-06, 3.363005816936493e-06, 1.3500452041625977e-05, 2.363789826631546e-05, 3.3775344491004944e-05, 4.391279071569443e-05, 5.405023694038391e-05, 6.41876831650734e-05, 7.432512938976288e-05, 8.446257561445236e-05, 9.460002183914185e-05, 0.00010473746806383133, 0.00011487491428852081, 0.0001250123605132103, 0.00013514980673789978, 0.00014528725296258926, 0.00015542469918727875, 0.00016556214541196823, 0.00017569959163665771, 0.0001858370378613472, 0.00019597448408603668, 0.00020611193031072617, 0.00021624937653541565, 0.00022638682276010513, 0.00023652426898479462, 0.0002466617152094841, 0.0002567991614341736, 0.00026693660765886307, 0.00027707405388355255, 0.00028721150010824203, 0.0002973489463329315, 0.000307486392557621, 0.0003176238387823105, 0.00032776128500699997, 0.00033789873123168945]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 10.0, 7.0, 20.0, 11.0, 24.0, 31.0, 29.0, 25.0, 33.0, 38.0, 25.0, 32.0, 31.0, 30.0, 40.0, 41.0, 49.0, 39.0, 45.0, 59.0, 31.0, 36.0, 33.0, 24.0, 31.0, 17.0, 24.0, 22.0, 21.0, 22.0, 17.0, 16.0, 10.0, 12.0, 6.0, 7.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.259765625, -3.160186767578125, -3.06060791015625, -2.961029052734375, -2.8614501953125, -2.761871337890625, -2.66229248046875, -2.562713623046875, -2.463134765625, -2.363555908203125, -2.26397705078125, -2.164398193359375, -2.0648193359375, -1.965240478515625, -1.86566162109375, -1.766082763671875, -1.66650390625, -1.566925048828125, -1.46734619140625, -1.367767333984375, -1.2681884765625, -1.168609619140625, -1.06903076171875, -0.969451904296875, -0.869873046875, -0.770294189453125, -0.67071533203125, -0.571136474609375, -0.4715576171875, -0.371978759765625, -0.27239990234375, -0.172821044921875, -0.0732421875, 0.026336669921875, 0.12591552734375, 0.225494384765625, 0.3250732421875, 0.424652099609375, 0.52423095703125, 0.623809814453125, 0.723388671875, 0.822967529296875, 0.92254638671875, 1.022125244140625, 1.1217041015625, 1.221282958984375, 1.32086181640625, 1.420440673828125, 1.52001953125, 1.619598388671875, 1.71917724609375, 1.818756103515625, 1.9183349609375, 2.017913818359375, 2.11749267578125, 2.217071533203125, 2.316650390625, 2.416229248046875, 2.51580810546875, 2.615386962890625, 2.7149658203125, 2.814544677734375, 2.91412353515625, 3.013702392578125, 3.11328125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 8.0, 14.0, 16.0, 23.0, 35.0, 30.0, 55.0, 76.0, 115.0, 174.0, 310.0, 503.0, 873.0, 1482.0, 2619.0, 4645.0, 8413.0, 15156.0, 27127.0, 49520.0, 95872.0, 208725.0, 309103.0, 157274.0, 75221.0, 40423.0, 22120.0, 12516.0, 6920.0, 3918.0, 2195.0, 1204.0, 713.0, 403.0, 287.0, 151.0, 97.0, 70.0, 58.0, 28.0, 12.0, 11.0, 14.0, 5.0, 6.0, 4.0, 0.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.5, -2.42266845703125, -2.3453369140625, -2.26800537109375, -2.190673828125, -2.11334228515625, -2.0360107421875, -1.95867919921875, -1.88134765625, -1.80401611328125, -1.7266845703125, -1.64935302734375, -1.572021484375, -1.49468994140625, -1.4173583984375, -1.34002685546875, -1.2626953125, -1.18536376953125, -1.1080322265625, -1.03070068359375, -0.953369140625, -0.87603759765625, -0.7987060546875, -0.72137451171875, -0.64404296875, -0.56671142578125, -0.4893798828125, -0.41204833984375, -0.334716796875, -0.25738525390625, -0.1800537109375, -0.10272216796875, -0.025390625, 0.05194091796875, 0.1292724609375, 0.20660400390625, 0.283935546875, 0.36126708984375, 0.4385986328125, 0.51593017578125, 0.59326171875, 0.67059326171875, 0.7479248046875, 0.82525634765625, 0.902587890625, 0.97991943359375, 1.0572509765625, 1.13458251953125, 1.2119140625, 1.28924560546875, 1.3665771484375, 1.44390869140625, 1.521240234375, 1.59857177734375, 1.6759033203125, 1.75323486328125, 1.83056640625, 1.90789794921875, 1.9852294921875, 2.06256103515625, 2.139892578125, 2.21722412109375, 2.2945556640625, 2.37188720703125, 2.44921875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 7.0, 8.0, 6.0, 9.0, 13.0, 13.0, 15.0, 14.0, 20.0, 29.0, 28.0, 29.0, 40.0, 37.0, 36.0, 41.0, 51.0, 76.0, 144.0, 1461.0, 358.0, 123.0, 65.0, 55.0, 44.0, 35.0, 39.0, 39.0, 24.0, 19.0, 16.0, 20.0, 25.0, 21.0, 16.0, 12.0, 15.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5390625, -11.1883544921875, -10.837646484375, -10.4869384765625, -10.13623046875, -9.7855224609375, -9.434814453125, -9.0841064453125, -8.7333984375, -8.3826904296875, -8.031982421875, -7.6812744140625, -7.33056640625, -6.9798583984375, -6.629150390625, -6.2784423828125, -5.927734375, -5.5770263671875, -5.226318359375, -4.8756103515625, -4.52490234375, -4.1741943359375, -3.823486328125, -3.4727783203125, -3.1220703125, -2.7713623046875, -2.420654296875, -2.0699462890625, -1.71923828125, -1.3685302734375, -1.017822265625, -0.6671142578125, -0.31640625, 0.0343017578125, 0.385009765625, 0.7357177734375, 1.08642578125, 1.4371337890625, 1.787841796875, 2.1385498046875, 2.4892578125, 2.8399658203125, 3.190673828125, 3.5413818359375, 3.89208984375, 4.2427978515625, 4.593505859375, 4.9442138671875, 5.294921875, 5.6456298828125, 5.996337890625, 6.3470458984375, 6.69775390625, 7.0484619140625, 7.399169921875, 7.7498779296875, 8.1005859375, 8.4512939453125, 8.802001953125, 9.1527099609375, 9.50341796875, 9.8541259765625, 10.204833984375, 10.5555419921875, 10.90625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 6.0, 4.0, 4.0, 4.0, 8.0, 15.0, 14.0, 17.0, 23.0, 30.0, 67.0, 97.0, 131.0, 273.0, 707.0, 9884.0, 3126108.0, 6962.0, 632.0, 273.0, 146.0, 94.0, 63.0, 42.0, 31.0, 22.0, 16.0, 5.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-65.3125, -63.5693359375, -61.826171875, -60.0830078125, -58.33984375, -56.5966796875, -54.853515625, -53.1103515625, -51.3671875, -49.6240234375, -47.880859375, -46.1376953125, -44.39453125, -42.6513671875, -40.908203125, -39.1650390625, -37.421875, -35.6787109375, -33.935546875, -32.1923828125, -30.44921875, -28.7060546875, -26.962890625, -25.2197265625, -23.4765625, -21.7333984375, -19.990234375, -18.2470703125, -16.50390625, -14.7607421875, -13.017578125, -11.2744140625, -9.53125, -7.7880859375, -6.044921875, -4.3017578125, -2.55859375, -0.8154296875, 0.927734375, 2.6708984375, 4.4140625, 6.1572265625, 7.900390625, 9.6435546875, 11.38671875, 13.1298828125, 14.873046875, 16.6162109375, 18.359375, 20.1025390625, 21.845703125, 23.5888671875, 25.33203125, 27.0751953125, 28.818359375, 30.5615234375, 32.3046875, 34.0478515625, 35.791015625, 37.5341796875, 39.27734375, 41.0205078125, 42.763671875, 44.5068359375, 46.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 74.0, 937.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.73299026489258, -25.17411231994629, -17.615234375, -10.056354522705078, -2.497476577758789, 5.0614013671875, 12.620281219482422, 20.179157257080078, 27.738037109375, 35.29691696166992, 42.85579299926758, 50.4146728515625, 57.973548889160156, 65.53242492675781, 73.09130859375, 80.65018463134766, 88.20906066894531, 95.76793670654297, 103.32682037353516, 110.88569641113281, 118.44457244873047, 126.00344848632812, 133.5623321533203, 141.1212158203125, 148.68008422851562, 156.2389678955078, 163.79783630371094, 171.35671997070312, 178.9156036376953, 186.47447204589844, 194.03335571289062, 201.59222412109375, 209.15110778808594, 216.70999145507812, 224.26885986328125, 231.82774353027344, 239.38662719726562, 246.94549560546875, 254.50437927246094, 262.0632629394531, 269.62213134765625, 277.1809997558594, 284.7398986816406, 292.29876708984375, 299.8576354980469, 307.4165344238281, 314.97540283203125, 322.5342712402344, 330.0931701660156, 337.65203857421875, 345.2109375, 352.7698059082031, 360.32867431640625, 367.8875732421875, 375.4464416503906, 383.00531005859375, 390.5641784667969, 398.123046875, 405.68194580078125, 413.2408142089844, 420.7996826171875, 428.35858154296875, 435.9174499511719, 443.476318359375, 451.03521728515625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 7.0, 8.0, 10.0, 9.0, 19.0, 23.0, 26.0, 33.0, 23.0, 30.0, 37.0, 31.0, 36.0, 42.0, 49.0, 51.0, 45.0, 39.0, 38.0, 48.0, 52.0, 32.0, 32.0, 30.0, 33.0, 34.0, 26.0, 13.0, 29.0, 13.0, 15.0, 14.0, 9.0, 11.0, 12.0, 8.0, 10.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.23344421386719, -35.129539489746094, -34.025634765625, -32.921730041503906, -31.81782341003418, -30.713916778564453, -29.61001205444336, -28.506107330322266, -27.402202606201172, -26.298297882080078, -25.19439125061035, -24.090486526489258, -22.986581802368164, -21.882675170898438, -20.778770446777344, -19.67486572265625, -18.570959091186523, -17.46705436706543, -16.363147735595703, -15.25924301147461, -14.155338287353516, -13.051432609558105, -11.947526931762695, -10.843622207641602, -9.739716529846191, -8.635810852050781, -7.5319061279296875, -6.428000450134277, -5.324095249176025, -4.220190048217773, -3.1162843704223633, -2.0123791694641113, -0.9084739685058594, 0.19543135166168213, 1.2993366718292236, 2.4032421112060547, 3.5071473121643066, 4.611052513122559, 5.714958190917969, 6.818863391876221, 7.922768592834473, 9.026674270629883, 10.130578994750977, 11.234484672546387, 12.338390350341797, 13.44229507446289, 14.5462007522583, 15.650106430053711, 16.754011154174805, 17.8579158782959, 18.961822509765625, 20.06572723388672, 21.169631958007812, 22.273536682128906, 23.377443313598633, 24.481348037719727, 25.585254669189453, 26.689159393310547, 27.793066024780273, 28.896970748901367, 30.00087547302246, 31.104782104492188, 32.20868682861328, 33.312591552734375, 34.41649627685547]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 5.0, 18.0, 6.0, 16.0, 16.0, 12.0, 23.0, 34.0, 29.0, 28.0, 32.0, 44.0, 23.0, 33.0, 43.0, 38.0, 42.0, 41.0, 43.0, 43.0, 45.0, 48.0, 38.0, 34.0, 35.0, 28.0, 25.0, 22.0, 18.0, 26.0, 15.0, 14.0, 17.0, 12.0, 8.0, 11.0, 8.0, 8.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8828125, -3.76837158203125, -3.6539306640625, -3.53948974609375, -3.425048828125, -3.31060791015625, -3.1961669921875, -3.08172607421875, -2.96728515625, -2.85284423828125, -2.7384033203125, -2.62396240234375, -2.509521484375, -2.39508056640625, -2.2806396484375, -2.16619873046875, -2.0517578125, -1.93731689453125, -1.8228759765625, -1.70843505859375, -1.593994140625, -1.47955322265625, -1.3651123046875, -1.25067138671875, -1.13623046875, -1.02178955078125, -0.9073486328125, -0.79290771484375, -0.678466796875, -0.56402587890625, -0.4495849609375, -0.33514404296875, -0.220703125, -0.10626220703125, 0.0081787109375, 0.12261962890625, 0.237060546875, 0.35150146484375, 0.4659423828125, 0.58038330078125, 0.69482421875, 0.80926513671875, 0.9237060546875, 1.03814697265625, 1.152587890625, 1.26702880859375, 1.3814697265625, 1.49591064453125, 1.6103515625, 1.72479248046875, 1.8392333984375, 1.95367431640625, 2.068115234375, 2.18255615234375, 2.2969970703125, 2.41143798828125, 2.52587890625, 2.64031982421875, 2.7547607421875, 2.86920166015625, 2.983642578125, 3.09808349609375, 3.2125244140625, 3.32696533203125, 3.44140625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 10.0, 6.0, 19.0, 18.0, 20.0, 32.0, 40.0, 44.0, 60.0, 98.0, 106.0, 145.0, 241.0, 386.0, 697.0, 1661.0, 4418.0, 14453.0, 59029.0, 278023.0, 998928.0, 1634334.0, 896934.0, 233446.0, 50653.0, 13018.0, 3982.0, 1489.0, 694.0, 401.0, 272.0, 173.0, 124.0, 66.0, 65.0, 45.0, 31.0, 30.0, 17.0, 18.0, 11.0, 10.0, 6.0, 4.0, 9.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.015625, -4.86566162109375, -4.7156982421875, -4.56573486328125, -4.415771484375, -4.26580810546875, -4.1158447265625, -3.96588134765625, -3.81591796875, -3.66595458984375, -3.5159912109375, -3.36602783203125, -3.216064453125, -3.06610107421875, -2.9161376953125, -2.76617431640625, -2.6162109375, -2.46624755859375, -2.3162841796875, -2.16632080078125, -2.016357421875, -1.86639404296875, -1.7164306640625, -1.56646728515625, -1.41650390625, -1.26654052734375, -1.1165771484375, -0.96661376953125, -0.816650390625, -0.66668701171875, -0.5167236328125, -0.36676025390625, -0.216796875, -0.06683349609375, 0.0831298828125, 0.23309326171875, 0.383056640625, 0.53302001953125, 0.6829833984375, 0.83294677734375, 0.98291015625, 1.13287353515625, 1.2828369140625, 1.43280029296875, 1.582763671875, 1.73272705078125, 1.8826904296875, 2.03265380859375, 2.1826171875, 2.33258056640625, 2.4825439453125, 2.63250732421875, 2.782470703125, 2.93243408203125, 3.0823974609375, 3.23236083984375, 3.38232421875, 3.53228759765625, 3.6822509765625, 3.83221435546875, 3.982177734375, 4.13214111328125, 4.2821044921875, 4.43206787109375, 4.58203125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 12.0, 8.0, 21.0, 32.0, 48.0, 86.0, 122.0, 226.0, 357.0, 476.0, 658.0, 600.0, 490.0, 335.0, 197.0, 155.0, 82.0, 68.0, 45.0, 18.0, 16.0, 12.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6328125, -13.243408203125, -12.85400390625, -12.464599609375, -12.0751953125, -11.685791015625, -11.29638671875, -10.906982421875, -10.517578125, -10.128173828125, -9.73876953125, -9.349365234375, -8.9599609375, -8.570556640625, -8.18115234375, -7.791748046875, -7.40234375, -7.012939453125, -6.62353515625, -6.234130859375, -5.8447265625, -5.455322265625, -5.06591796875, -4.676513671875, -4.287109375, -3.897705078125, -3.50830078125, -3.118896484375, -2.7294921875, -2.340087890625, -1.95068359375, -1.561279296875, -1.171875, -0.782470703125, -0.39306640625, -0.003662109375, 0.3857421875, 0.775146484375, 1.16455078125, 1.553955078125, 1.943359375, 2.332763671875, 2.72216796875, 3.111572265625, 3.5009765625, 3.890380859375, 4.27978515625, 4.669189453125, 5.05859375, 5.447998046875, 5.83740234375, 6.226806640625, 6.6162109375, 7.005615234375, 7.39501953125, 7.784423828125, 8.173828125, 8.563232421875, 8.95263671875, 9.342041015625, 9.7314453125, 10.120849609375, 10.51025390625, 10.899658203125, 11.2890625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 9.0, 4.0, 15.0, 18.0, 16.0, 39.0, 59.0, 66.0, 66.0, 134.0, 178.0, 294.0, 548.0, 1541.0, 17613.0, 2139127.0, 2015109.0, 16535.0, 1454.0, 563.0, 308.0, 150.0, 118.0, 81.0, 53.0, 44.0, 29.0, 25.0, 11.0, 16.0, 13.0, 7.0, 9.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.642333984375, -17.83154296875, -17.020751953125, -16.2099609375, -15.399169921875, -14.58837890625, -13.777587890625, -12.966796875, -12.156005859375, -11.34521484375, -10.534423828125, -9.7236328125, -8.912841796875, -8.10205078125, -7.291259765625, -6.48046875, -5.669677734375, -4.85888671875, -4.048095703125, -3.2373046875, -2.426513671875, -1.61572265625, -0.804931640625, 0.005859375, 0.816650390625, 1.62744140625, 2.438232421875, 3.2490234375, 4.059814453125, 4.87060546875, 5.681396484375, 6.4921875, 7.302978515625, 8.11376953125, 8.924560546875, 9.7353515625, 10.546142578125, 11.35693359375, 12.167724609375, 12.978515625, 13.789306640625, 14.60009765625, 15.410888671875, 16.2216796875, 17.032470703125, 17.84326171875, 18.654052734375, 19.46484375, 20.275634765625, 21.08642578125, 21.897216796875, 22.7080078125, 23.518798828125, 24.32958984375, 25.140380859375, 25.951171875, 26.761962890625, 27.57275390625, 28.383544921875, 29.1943359375, 30.005126953125, 30.81591796875, 31.626708984375, 32.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 137.0, 392.0, 366.0, 97.0, 12.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.17577362060547, -76.65739440917969, -72.13900756835938, -67.6206283569336, -63.10224533081055, -58.5838623046875, -54.06548309326172, -49.54710006713867, -45.028717041015625, -40.51033401489258, -35.99195098876953, -31.47357177734375, -26.955188751220703, -22.436805725097656, -17.918424606323242, -13.400043487548828, -8.881660461425781, -4.363278388977051, 0.1551036834716797, 4.67348575592041, 9.19186782836914, 13.710250854492188, 18.2286319732666, 22.747013092041016, 27.265396118164062, 31.78377914428711, 36.302162170410156, 40.82054138183594, 45.338924407958984, 49.85730743408203, 54.37568664550781, 58.89406967163086, 63.41246032714844, 67.93083953857422, 72.44922637939453, 76.96760559082031, 81.48599243164062, 86.0043716430664, 90.52275085449219, 95.0411376953125, 99.55951690673828, 104.07789611816406, 108.59628295898438, 113.11466217041016, 117.63304138183594, 122.15142822265625, 126.66980743408203, 131.1881866455078, 135.70657348632812, 140.22496032714844, 144.7433319091797, 149.26171875, 153.7801055908203, 158.29849243164062, 162.81686401367188, 167.3352508544922, 171.8536376953125, 176.3720245361328, 180.89039611816406, 185.40878295898438, 189.9271697998047, 194.445556640625, 198.96392822265625, 203.48231506347656, 208.0006866455078]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 3.0, 9.0, 4.0, 13.0, 19.0, 21.0, 20.0, 23.0, 21.0, 21.0, 30.0, 27.0, 35.0, 38.0, 49.0, 42.0, 42.0, 54.0, 47.0, 47.0, 39.0, 43.0, 35.0, 33.0, 41.0, 30.0, 27.0, 25.0, 23.0, 18.0, 15.0, 23.0, 14.0, 14.0, 12.0, 9.0, 7.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.767471313476562, -26.87171745300293, -25.975963592529297, -25.080211639404297, -24.184457778930664, -23.28870391845703, -22.3929500579834, -21.497196197509766, -20.601444244384766, -19.705690383911133, -18.8099365234375, -17.9141845703125, -17.018430709838867, -16.122676849365234, -15.226922988891602, -14.331170082092285, -13.435416221618652, -12.53966236114502, -11.643909454345703, -10.74815559387207, -9.852402687072754, -8.956648826599121, -8.060895919799805, -7.165142059326172, -6.269388675689697, -5.373635292053223, -4.477881908416748, -3.5821282863616943, -2.6863749027252197, -1.790621280670166, -0.8948678970336914, 0.0008854866027832031, 0.8966388702392578, 1.7923922538757324, 2.688145637512207, 3.5838992595672607, 4.479652404785156, 5.375406265258789, 6.271159648895264, 7.166913032531738, 8.062665939331055, 8.958419799804688, 9.854172706604004, 10.749926567077637, 11.645679473876953, 12.541433334350586, 13.437187194824219, 14.332940101623535, 15.228693962097168, 16.124446868896484, 17.020200729370117, 17.91595458984375, 18.811708450317383, 19.707462310791016, 20.603214263916016, 21.49896812438965, 22.39472198486328, 23.290475845336914, 24.186229705810547, 25.081981658935547, 25.97773551940918, 26.873489379882812, 27.769243240356445, 28.664997100830078, 29.560749053955078]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 5.0, 6.0, 5.0, 3.0, 13.0, 12.0, 15.0, 15.0, 15.0, 14.0, 21.0, 25.0, 22.0, 33.0, 30.0, 33.0, 35.0, 44.0, 36.0, 34.0, 40.0, 42.0, 50.0, 51.0, 37.0, 45.0, 45.0, 25.0, 24.0, 34.0, 27.0, 23.0, 22.0, 24.0, 16.0, 12.0, 14.0, 20.0, 10.0, 4.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.904296875, -3.79156494140625, -3.6788330078125, -3.56610107421875, -3.453369140625, -3.34063720703125, -3.2279052734375, -3.11517333984375, -3.00244140625, -2.88970947265625, -2.7769775390625, -2.66424560546875, -2.551513671875, -2.43878173828125, -2.3260498046875, -2.21331787109375, -2.1005859375, -1.98785400390625, -1.8751220703125, -1.76239013671875, -1.649658203125, -1.53692626953125, -1.4241943359375, -1.31146240234375, -1.19873046875, -1.08599853515625, -0.9732666015625, -0.86053466796875, -0.747802734375, -0.63507080078125, -0.5223388671875, -0.40960693359375, -0.296875, -0.18414306640625, -0.0714111328125, 0.04132080078125, 0.154052734375, 0.26678466796875, 0.3795166015625, 0.49224853515625, 0.60498046875, 0.71771240234375, 0.8304443359375, 0.94317626953125, 1.055908203125, 1.16864013671875, 1.2813720703125, 1.39410400390625, 1.5068359375, 1.61956787109375, 1.7322998046875, 1.84503173828125, 1.957763671875, 2.07049560546875, 2.1832275390625, 2.29595947265625, 2.40869140625, 2.52142333984375, 2.6341552734375, 2.74688720703125, 2.859619140625, 2.97235107421875, 3.0850830078125, 3.19781494140625, 3.310546875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 18.0, 14.0, 26.0, 58.0, 86.0, 115.0, 140.0, 232.0, 353.0, 511.0, 747.0, 1154.0, 1776.0, 2589.0, 4108.0, 6507.0, 9645.0, 15128.0, 23262.0, 38184.0, 64814.0, 121477.0, 323482.0, 202583.0, 92369.0, 52044.0, 31270.0, 19795.0, 12345.0, 8078.0, 5356.0, 3473.0, 2300.0, 1515.0, 1016.0, 656.0, 432.0, 299.0, 176.0, 118.0, 90.0, 77.0, 43.0, 23.0, 17.0, 14.0, 9.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.89892578125, -0.8723297119140625, -0.845733642578125, -0.8191375732421875, -0.79254150390625, -0.7659454345703125, -0.739349365234375, -0.7127532958984375, -0.6861572265625, -0.6595611572265625, -0.632965087890625, -0.6063690185546875, -0.57977294921875, -0.5531768798828125, -0.526580810546875, -0.4999847412109375, -0.473388671875, -0.4467926025390625, -0.420196533203125, -0.3936004638671875, -0.36700439453125, -0.3404083251953125, -0.313812255859375, -0.2872161865234375, -0.2606201171875, -0.2340240478515625, -0.207427978515625, -0.1808319091796875, -0.15423583984375, -0.1276397705078125, -0.101043701171875, -0.0744476318359375, -0.0478515625, -0.0212554931640625, 0.005340576171875, 0.0319366455078125, 0.05853271484375, 0.0851287841796875, 0.111724853515625, 0.1383209228515625, 0.1649169921875, 0.1915130615234375, 0.218109130859375, 0.2447052001953125, 0.27130126953125, 0.2978973388671875, 0.324493408203125, 0.3510894775390625, 0.377685546875, 0.4042816162109375, 0.430877685546875, 0.4574737548828125, 0.48406982421875, 0.5106658935546875, 0.537261962890625, 0.5638580322265625, 0.5904541015625, 0.6170501708984375, 0.643646240234375, 0.6702423095703125, 0.69683837890625, 0.7234344482421875, 0.750030517578125, 0.7766265869140625, 0.80322265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 5.0, 10.0, 11.0, 10.0, 20.0, 18.0, 18.0, 22.0, 20.0, 32.0, 23.0, 28.0, 38.0, 40.0, 33.0, 48.0, 38.0, 31.0, 34.0, 1057.0, 37.0, 40.0, 41.0, 38.0, 41.0, 39.0, 32.0, 37.0, 25.0, 20.0, 24.0, 17.0, 13.0, 5.0, 9.0, 13.0, 7.0, 3.0, 9.0, 4.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.115081787109375, -2.04461669921875, -1.974151611328125, -1.9036865234375, -1.833221435546875, -1.76275634765625, -1.692291259765625, -1.621826171875, -1.551361083984375, -1.48089599609375, -1.410430908203125, -1.3399658203125, -1.269500732421875, -1.19903564453125, -1.128570556640625, -1.05810546875, -0.987640380859375, -0.91717529296875, -0.846710205078125, -0.7762451171875, -0.705780029296875, -0.63531494140625, -0.564849853515625, -0.494384765625, -0.423919677734375, -0.35345458984375, -0.282989501953125, -0.2125244140625, -0.142059326171875, -0.07159423828125, -0.001129150390625, 0.0693359375, 0.139801025390625, 0.21026611328125, 0.280731201171875, 0.3511962890625, 0.421661376953125, 0.49212646484375, 0.562591552734375, 0.633056640625, 0.703521728515625, 0.77398681640625, 0.844451904296875, 0.9149169921875, 0.985382080078125, 1.05584716796875, 1.126312255859375, 1.19677734375, 1.267242431640625, 1.33770751953125, 1.408172607421875, 1.4786376953125, 1.549102783203125, 1.61956787109375, 1.690032958984375, 1.760498046875, 1.830963134765625, 1.90142822265625, 1.971893310546875, 2.0423583984375, 2.112823486328125, 2.18328857421875, 2.253753662109375, 2.32421875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 8.0, 5.0, 6.0, 8.0, 30.0, 26.0, 47.0, 82.0, 106.0, 156.0, 170.0, 336.0, 506.0, 713.0, 1194.0, 1757.0, 2823.0, 4562.0, 7335.0, 11939.0, 19848.0, 33605.0, 60072.0, 114278.0, 1346599.0, 250285.0, 104873.0, 56236.0, 31583.0, 18122.0, 10904.0, 6849.0, 4161.0, 2817.0, 1759.0, 1157.0, 783.0, 503.0, 289.0, 221.0, 125.0, 89.0, 51.0, 32.0, 26.0, 31.0, 8.0, 9.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.93603515625, -0.9076156616210938, -0.8791961669921875, -0.8507766723632812, -0.822357177734375, -0.7939376831054688, -0.7655181884765625, -0.7370986938476562, -0.70867919921875, -0.6802597045898438, -0.6518402099609375, -0.6234207153320312, -0.595001220703125, -0.5665817260742188, -0.5381622314453125, -0.5097427368164062, -0.4813232421875, -0.45290374755859375, -0.4244842529296875, -0.39606475830078125, -0.367645263671875, -0.33922576904296875, -0.3108062744140625, -0.28238677978515625, -0.25396728515625, -0.22554779052734375, -0.1971282958984375, -0.16870880126953125, -0.140289306640625, -0.11186981201171875, -0.0834503173828125, -0.05503082275390625, -0.026611328125, 0.00180816650390625, 0.0302276611328125, 0.05864715576171875, 0.087066650390625, 0.11548614501953125, 0.1439056396484375, 0.17232513427734375, 0.20074462890625, 0.22916412353515625, 0.2575836181640625, 0.28600311279296875, 0.314422607421875, 0.34284210205078125, 0.3712615966796875, 0.39968109130859375, 0.4281005859375, 0.45652008056640625, 0.4849395751953125, 0.5133590698242188, 0.541778564453125, 0.5701980590820312, 0.5986175537109375, 0.6270370483398438, 0.65545654296875, 0.6838760375976562, 0.7122955322265625, 0.7407150268554688, 0.769134521484375, 0.7975540161132812, 0.8259735107421875, 0.8543930053710938, 0.8828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 2.0, 4.0, 7.0, 8.0, 3.0, 15.0, 12.0, 17.0, 21.0, 24.0, 38.0, 41.0, 46.0, 63.0, 71.0, 73.0, 85.0, 82.0, 74.0, 64.0, 43.0, 39.0, 36.0, 24.0, 16.0, 19.0, 14.0, 9.0, 8.0, 3.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006814002990722656, -0.0006605237722396851, -0.0006396472454071045, -0.0006187707185745239, -0.0005978941917419434, -0.0005770176649093628, -0.0005561411380767822, -0.0005352646112442017, -0.0005143880844116211, -0.0004935115575790405, -0.00047263503074645996, -0.0004517585039138794, -0.00043088197708129883, -0.00041000545024871826, -0.0003891289234161377, -0.00036825239658355713, -0.00034737586975097656, -0.000326499342918396, -0.00030562281608581543, -0.00028474628925323486, -0.0002638697624206543, -0.00024299323558807373, -0.00022211670875549316, -0.0002012401819229126, -0.00018036365509033203, -0.00015948712825775146, -0.0001386106014251709, -0.00011773407459259033, -9.685754776000977e-05, -7.59810209274292e-05, -5.510449409484863e-05, -3.4227967262268066e-05, -1.33514404296875e-05, 7.525086402893066e-06, 2.8401613235473633e-05, 4.92781400680542e-05, 7.015466690063477e-05, 9.103119373321533e-05, 0.0001119077205657959, 0.00013278424739837646, 0.00015366077423095703, 0.0001745373010635376, 0.00019541382789611816, 0.00021629035472869873, 0.0002371668815612793, 0.00025804340839385986, 0.00027891993522644043, 0.000299796462059021, 0.00032067298889160156, 0.00034154951572418213, 0.0003624260425567627, 0.00038330256938934326, 0.00040417909622192383, 0.0004250556230545044, 0.00044593214988708496, 0.00046680867671966553, 0.0004876852035522461, 0.0005085617303848267, 0.0005294382572174072, 0.0005503147840499878, 0.0005711913108825684, 0.0005920678377151489, 0.0006129443645477295, 0.0006338208913803101, 0.0006546974182128906]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 4.0, 5.0, 10.0, 9.0, 18.0, 19.0, 27.0, 45.0, 58.0, 90.0, 179.0, 354.0, 814.0, 29872.0, 1012999.0, 2798.0, 566.0, 255.0, 123.0, 89.0, 62.0, 37.0, 24.0, 13.0, 14.0, 12.0, 4.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01558685302734375, -0.015118718147277832, -0.014650583267211914, -0.014182448387145996, -0.013714313507080078, -0.01324617862701416, -0.012778043746948242, -0.012309908866882324, -0.011841773986816406, -0.011373639106750488, -0.01090550422668457, -0.010437369346618652, -0.009969234466552734, -0.009501099586486816, -0.009032964706420898, -0.00856482982635498, -0.008096694946289062, -0.0076285600662231445, -0.0071604251861572266, -0.006692290306091309, -0.006224155426025391, -0.005756020545959473, -0.005287885665893555, -0.004819750785827637, -0.004351615905761719, -0.0038834810256958008, -0.003415346145629883, -0.002947211265563965, -0.002479076385498047, -0.002010941505432129, -0.001542806625366211, -0.001074671745300293, -0.000606536865234375, -0.00013840198516845703, 0.00032973289489746094, 0.0007978677749633789, 0.0012660026550292969, 0.0017341375350952148, 0.002202272415161133, 0.0026704072952270508, 0.0031385421752929688, 0.0036066770553588867, 0.004074811935424805, 0.004542946815490723, 0.005011081695556641, 0.005479216575622559, 0.0059473514556884766, 0.0064154863357543945, 0.0068836212158203125, 0.0073517560958862305, 0.007819890975952148, 0.008288025856018066, 0.008756160736083984, 0.009224295616149902, 0.00969243049621582, 0.010160565376281738, 0.010628700256347656, 0.011096835136413574, 0.011564970016479492, 0.01203310489654541, 0.012501239776611328, 0.012969374656677246, 0.013437509536743164, 0.013905644416809082, 0.014373779296875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 75.0, 221.0, 352.0, 247.0, 84.0, 19.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001797436154447496, -0.0017618568381294608, -0.0017262775218114257, -0.0016906982054933906, -0.0016551188891753554, -0.0016195395728573203, -0.0015839602565392852, -0.00154838094022125, -0.001512801623903215, -0.0014772223075851798, -0.0014416429912671447, -0.0014060636749491096, -0.0013704843586310744, -0.0013349050423130393, -0.0012993257259950042, -0.001263746409676969, -0.001228167093358934, -0.0011925877770408988, -0.0011570084607228637, -0.0011214291444048285, -0.0010858498280867934, -0.0010502705117687583, -0.0010146911954507232, -0.000979111879132688, -0.0009435325628146529, -0.0009079532464966178, -0.0008723739301785827, -0.0008367946138605475, -0.0008012152975425124, -0.0007656359812244773, -0.0007300566649064422, -0.000694477348588407, -0.0006588980322703719, -0.0006233187159523368, -0.0005877393996343017, -0.0005521600833162665, -0.0005165807669982314, -0.0004810014506801963, -0.00044542213436216116, -0.00040984281804412603, -0.0003742635017260909, -0.0003386841854080558, -0.00030310486909002066, -0.00026752555277198553, -0.0002319462364539504, -0.00019636692013591528, -0.00016078760381788015, -0.00012520828749984503, -8.96289711818099e-05, -5.4049654863774776e-05, -1.847033854573965e-05, 1.7108977772295475e-05, 5.26882940903306e-05, 8.826761040836573e-05, 0.00012384692672640085, 0.00015942624304443598, 0.0001950055593624711, 0.00023058487568050623, 0.00026616419199854136, 0.0003017435083165765, 0.0003373228246346116, 0.00037290214095264673, 0.00040848145727068186, 0.000444060773588717, 0.0004796400899067521]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 3.0, 9.0, 16.0, 10.0, 24.0, 8.0, 15.0, 27.0, 20.0, 27.0, 24.0, 35.0, 31.0, 37.0, 38.0, 38.0, 33.0, 44.0, 31.0, 38.0, 38.0, 30.0, 38.0, 36.0, 34.0, 30.0, 24.0, 38.0, 35.0, 17.0, 31.0, 14.0, 19.0, 12.0, 15.0, 10.0, 7.0, 9.0, 14.0, 7.0, 4.0, 12.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0003033876419067383, -0.0002940865233540535, -0.0002847854048013687, -0.00027548428624868393, -0.00026618316769599915, -0.00025688204914331436, -0.0002475809305906296, -0.0002382798120379448, -0.00022897869348526, -0.00021967757493257523, -0.00021037645637989044, -0.00020107533782720566, -0.00019177421927452087, -0.0001824731007218361, -0.0001731719821691513, -0.00016387086361646652, -0.00015456974506378174, -0.00014526862651109695, -0.00013596750795841217, -0.0001266663894057274, -0.0001173652708530426, -0.00010806415230035782, -9.876303374767303e-05, -8.946191519498825e-05, -8.016079664230347e-05, -7.085967808961868e-05, -6.15585595369339e-05, -5.2257440984249115e-05, -4.295632243156433e-05, -3.365520387887955e-05, -2.4354085326194763e-05, -1.505296677350998e-05, -5.751848220825195e-06, 3.5492703318595886e-06, 1.2850388884544373e-05, 2.2151507437229156e-05, 3.145262598991394e-05, 4.0753744542598724e-05, 5.005486309528351e-05, 5.935598164796829e-05, 6.865710020065308e-05, 7.795821875333786e-05, 8.725933730602264e-05, 9.656045585870743e-05, 0.00010586157441139221, 0.000115162692964077, 0.00012446381151676178, 0.00013376493006944656, 0.00014306604862213135, 0.00015236716717481613, 0.00016166828572750092, 0.0001709694042801857, 0.00018027052283287048, 0.00018957164138555527, 0.00019887275993824005, 0.00020817387849092484, 0.00021747499704360962, 0.0002267761155962944, 0.0002360772341489792, 0.00024537835270166397, 0.00025467947125434875, 0.00026398058980703354, 0.0002732817083597183, 0.0002825828269124031, 0.0002918839454650879]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 5.0, 6.0, 5.0, 3.0, 13.0, 12.0, 15.0, 15.0, 15.0, 14.0, 21.0, 25.0, 22.0, 33.0, 30.0, 33.0, 35.0, 44.0, 36.0, 34.0, 40.0, 42.0, 50.0, 51.0, 37.0, 46.0, 44.0, 25.0, 24.0, 34.0, 27.0, 23.0, 22.0, 24.0, 16.0, 12.0, 14.0, 20.0, 10.0, 4.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.904296875, -3.79156494140625, -3.6788330078125, -3.56610107421875, -3.453369140625, -3.34063720703125, -3.2279052734375, -3.11517333984375, -3.00244140625, -2.88970947265625, -2.7769775390625, -2.66424560546875, -2.551513671875, -2.43878173828125, -2.3260498046875, -2.21331787109375, -2.1005859375, -1.98785400390625, -1.8751220703125, -1.76239013671875, -1.649658203125, -1.53692626953125, -1.4241943359375, -1.31146240234375, -1.19873046875, -1.08599853515625, -0.9732666015625, -0.86053466796875, -0.747802734375, -0.63507080078125, -0.5223388671875, -0.40960693359375, -0.296875, -0.18414306640625, -0.0714111328125, 0.04132080078125, 0.154052734375, 0.26678466796875, 0.3795166015625, 0.49224853515625, 0.60498046875, 0.71771240234375, 0.8304443359375, 0.94317626953125, 1.055908203125, 1.16864013671875, 1.2813720703125, 1.39410400390625, 1.5068359375, 1.61956787109375, 1.7322998046875, 1.84503173828125, 1.957763671875, 2.07049560546875, 2.1832275390625, 2.29595947265625, 2.40869140625, 2.52142333984375, 2.6341552734375, 2.74688720703125, 2.859619140625, 2.97235107421875, 3.0850830078125, 3.19781494140625, 3.310546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 5.0, 10.0, 15.0, 26.0, 39.0, 42.0, 68.0, 82.0, 149.0, 230.0, 315.0, 521.0, 879.0, 1452.0, 2719.0, 5154.0, 10025.0, 19005.0, 36478.0, 70618.0, 138808.0, 247586.0, 240357.0, 132232.0, 67479.0, 34853.0, 18198.0, 9637.0, 5040.0, 2736.0, 1491.0, 832.0, 497.0, 305.0, 218.0, 138.0, 104.0, 74.0, 52.0, 35.0, 21.0, 9.0, 8.0, 10.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.03515625, -2.94580078125, -2.8564453125, -2.76708984375, -2.677734375, -2.58837890625, -2.4990234375, -2.40966796875, -2.3203125, -2.23095703125, -2.1416015625, -2.05224609375, -1.962890625, -1.87353515625, -1.7841796875, -1.69482421875, -1.60546875, -1.51611328125, -1.4267578125, -1.33740234375, -1.248046875, -1.15869140625, -1.0693359375, -0.97998046875, -0.890625, -0.80126953125, -0.7119140625, -0.62255859375, -0.533203125, -0.44384765625, -0.3544921875, -0.26513671875, -0.17578125, -0.08642578125, 0.0029296875, 0.09228515625, 0.181640625, 0.27099609375, 0.3603515625, 0.44970703125, 0.5390625, 0.62841796875, 0.7177734375, 0.80712890625, 0.896484375, 0.98583984375, 1.0751953125, 1.16455078125, 1.25390625, 1.34326171875, 1.4326171875, 1.52197265625, 1.611328125, 1.70068359375, 1.7900390625, 1.87939453125, 1.96875, 2.05810546875, 2.1474609375, 2.23681640625, 2.326171875, 2.41552734375, 2.5048828125, 2.59423828125, 2.68359375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 8.0, 6.0, 7.0, 12.0, 7.0, 12.0, 12.0, 23.0, 17.0, 33.0, 28.0, 35.0, 34.0, 45.0, 45.0, 59.0, 71.0, 114.0, 221.0, 1392.0, 254.0, 124.0, 75.0, 56.0, 47.0, 39.0, 39.0, 36.0, 30.0, 24.0, 19.0, 11.0, 25.0, 15.0, 17.0, 12.0, 6.0, 3.0, 7.0, 6.0, 7.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.704833984375, -13.28466796875, -12.864501953125, -12.4443359375, -12.024169921875, -11.60400390625, -11.183837890625, -10.763671875, -10.343505859375, -9.92333984375, -9.503173828125, -9.0830078125, -8.662841796875, -8.24267578125, -7.822509765625, -7.40234375, -6.982177734375, -6.56201171875, -6.141845703125, -5.7216796875, -5.301513671875, -4.88134765625, -4.461181640625, -4.041015625, -3.620849609375, -3.20068359375, -2.780517578125, -2.3603515625, -1.940185546875, -1.52001953125, -1.099853515625, -0.6796875, -0.259521484375, 0.16064453125, 0.580810546875, 1.0009765625, 1.421142578125, 1.84130859375, 2.261474609375, 2.681640625, 3.101806640625, 3.52197265625, 3.942138671875, 4.3623046875, 4.782470703125, 5.20263671875, 5.622802734375, 6.04296875, 6.463134765625, 6.88330078125, 7.303466796875, 7.7236328125, 8.143798828125, 8.56396484375, 8.984130859375, 9.404296875, 9.824462890625, 10.24462890625, 10.664794921875, 11.0849609375, 11.505126953125, 11.92529296875, 12.345458984375, 12.765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 9.0, 16.0, 33.0, 46.0, 73.0, 113.0, 173.0, 295.0, 662.0, 8434.0, 3129426.0, 5036.0, 629.0, 301.0, 175.0, 103.0, 55.0, 40.0, 27.0, 17.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.875, -59.7001953125, -57.525390625, -55.3505859375, -53.17578125, -51.0009765625, -48.826171875, -46.6513671875, -44.4765625, -42.3017578125, -40.126953125, -37.9521484375, -35.77734375, -33.6025390625, -31.427734375, -29.2529296875, -27.078125, -24.9033203125, -22.728515625, -20.5537109375, -18.37890625, -16.2041015625, -14.029296875, -11.8544921875, -9.6796875, -7.5048828125, -5.330078125, -3.1552734375, -0.98046875, 1.1943359375, 3.369140625, 5.5439453125, 7.71875, 9.8935546875, 12.068359375, 14.2431640625, 16.41796875, 18.5927734375, 20.767578125, 22.9423828125, 25.1171875, 27.2919921875, 29.466796875, 31.6416015625, 33.81640625, 35.9912109375, 38.166015625, 40.3408203125, 42.515625, 44.6904296875, 46.865234375, 49.0400390625, 51.21484375, 53.3896484375, 55.564453125, 57.7392578125, 59.9140625, 62.0888671875, 64.263671875, 66.4384765625, 68.61328125, 70.7880859375, 72.962890625, 75.1376953125, 77.3125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 12.0, 854.0, 150.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.3556137084961, -70.14604187011719, -62.93647003173828, -55.726898193359375, -48.51732635498047, -41.30775833129883, -34.09818649291992, -26.888614654541016, -19.67904281616211, -12.469470977783203, -5.259900093078613, 1.9496707916259766, 9.159242630004883, 16.368812561035156, 23.578384399414062, 30.78795623779297, 37.997528076171875, 45.20709991455078, 52.41667175292969, 59.626243591308594, 66.8358154296875, 74.04537963867188, 81.25495910644531, 88.46452331542969, 95.67410278320312, 102.88367462158203, 110.09324645996094, 117.30281829833984, 124.51239013671875, 131.72195434570312, 138.93153381347656, 146.14109802246094, 153.3506622314453, 160.5602264404297, 167.76980590820312, 174.9793701171875, 182.18894958496094, 189.3985137939453, 196.60809326171875, 203.81765747070312, 211.02723693847656, 218.23680114746094, 225.44638061523438, 232.65594482421875, 239.8655242919922, 247.07508850097656, 254.28466796875, 261.4942321777344, 268.70379638671875, 275.9133605957031, 283.1229248046875, 290.33251953125, 297.5420837402344, 304.75164794921875, 311.9612121582031, 319.1708068847656, 326.38037109375, 333.5899353027344, 340.79949951171875, 348.00909423828125, 355.2186584472656, 362.42822265625, 369.6377868652344, 376.8473815917969, 384.05694580078125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 6.0, 16.0, 15.0, 15.0, 18.0, 10.0, 14.0, 20.0, 34.0, 21.0, 31.0, 34.0, 30.0, 41.0, 42.0, 32.0, 37.0, 32.0, 45.0, 34.0, 35.0, 41.0, 37.0, 35.0, 34.0, 24.0, 24.0, 21.0, 21.0, 19.0, 21.0, 15.0, 22.0, 17.0, 18.0, 12.0, 7.0, 7.0, 7.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.411911010742188, -26.490345001220703, -25.56878089904785, -24.647214889526367, -23.725650787353516, -22.80408477783203, -21.88252067565918, -20.960954666137695, -20.039390563964844, -19.11782455444336, -18.196260452270508, -17.274694442749023, -16.353130340576172, -15.431564331054688, -14.510000228881836, -13.588434219360352, -12.666869163513184, -11.745304107666016, -10.823739051818848, -9.90217399597168, -8.980608940124512, -8.059043884277344, -7.137478351593018, -6.21591329574585, -5.294348239898682, -4.372783184051514, -3.4512181282043457, -2.5296528339385986, -1.6080877780914307, -0.6865224838256836, 0.23504257202148438, 1.1566076278686523, 2.0781726837158203, 2.9997377395629883, 3.9213027954101562, 4.842867851257324, 5.764432907104492, 6.685998439788818, 7.607563495635986, 8.529129028320312, 9.450693130493164, 10.372258186340332, 11.2938232421875, 12.215388298034668, 13.136953353881836, 14.05851936340332, 14.980083465576172, 15.901649475097656, 16.82321548461914, 17.744781494140625, 18.666345596313477, 19.58791160583496, 20.509475708007812, 21.431041717529297, 22.35260581970215, 23.274171829223633, 24.195735931396484, 25.11730194091797, 26.03886604309082, 26.960432052612305, 27.881996154785156, 28.80356216430664, 29.725126266479492, 30.646692276000977, 31.568256378173828]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 7.0, 10.0, 7.0, 14.0, 6.0, 8.0, 16.0, 18.0, 18.0, 17.0, 19.0, 26.0, 28.0, 31.0, 33.0, 39.0, 34.0, 48.0, 34.0, 39.0, 33.0, 30.0, 54.0, 34.0, 37.0, 46.0, 38.0, 38.0, 27.0, 24.0, 26.0, 25.0, 21.0, 19.0, 21.0, 9.0, 17.0, 12.0, 11.0, 5.0, 6.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.97265625, -3.85247802734375, -3.7322998046875, -3.61212158203125, -3.491943359375, -3.37176513671875, -3.2515869140625, -3.13140869140625, -3.01123046875, -2.89105224609375, -2.7708740234375, -2.65069580078125, -2.530517578125, -2.41033935546875, -2.2901611328125, -2.16998291015625, -2.0498046875, -1.92962646484375, -1.8094482421875, -1.68927001953125, -1.569091796875, -1.44891357421875, -1.3287353515625, -1.20855712890625, -1.08837890625, -0.96820068359375, -0.8480224609375, -0.72784423828125, -0.607666015625, -0.48748779296875, -0.3673095703125, -0.24713134765625, -0.126953125, -0.00677490234375, 0.1134033203125, 0.23358154296875, 0.353759765625, 0.47393798828125, 0.5941162109375, 0.71429443359375, 0.83447265625, 0.95465087890625, 1.0748291015625, 1.19500732421875, 1.315185546875, 1.43536376953125, 1.5555419921875, 1.67572021484375, 1.7958984375, 1.91607666015625, 2.0362548828125, 2.15643310546875, 2.276611328125, 2.39678955078125, 2.5169677734375, 2.63714599609375, 2.75732421875, 2.87750244140625, 2.9976806640625, 3.11785888671875, 3.238037109375, 3.35821533203125, 3.4783935546875, 3.59857177734375, 3.71875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 6.0, 12.0, 8.0, 18.0, 12.0, 14.0, 14.0, 24.0, 30.0, 30.0, 40.0, 64.0, 98.0, 146.0, 296.0, 1002.0, 8398.0, 492083.0, 3447118.0, 237655.0, 5494.0, 851.0, 318.0, 149.0, 91.0, 42.0, 43.0, 36.0, 30.0, 27.0, 30.0, 17.0, 13.0, 10.0, 10.0, 8.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.640625, -16.1707763671875, -15.700927734375, -15.2310791015625, -14.76123046875, -14.2913818359375, -13.821533203125, -13.3516845703125, -12.8818359375, -12.4119873046875, -11.942138671875, -11.4722900390625, -11.00244140625, -10.5325927734375, -10.062744140625, -9.5928955078125, -9.123046875, -8.6531982421875, -8.183349609375, -7.7135009765625, -7.24365234375, -6.7738037109375, -6.303955078125, -5.8341064453125, -5.3642578125, -4.8944091796875, -4.424560546875, -3.9547119140625, -3.48486328125, -3.0150146484375, -2.545166015625, -2.0753173828125, -1.60546875, -1.1356201171875, -0.665771484375, -0.1959228515625, 0.27392578125, 0.7437744140625, 1.213623046875, 1.6834716796875, 2.1533203125, 2.6231689453125, 3.093017578125, 3.5628662109375, 4.03271484375, 4.5025634765625, 4.972412109375, 5.4422607421875, 5.912109375, 6.3819580078125, 6.851806640625, 7.3216552734375, 7.79150390625, 8.2613525390625, 8.731201171875, 9.2010498046875, 9.6708984375, 10.1407470703125, 10.610595703125, 11.0804443359375, 11.55029296875, 12.0201416015625, 12.489990234375, 12.9598388671875, 13.4296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 8.0, 14.0, 18.0, 37.0, 44.0, 56.0, 87.0, 139.0, 162.0, 231.0, 321.0, 438.0, 498.0, 484.0, 380.0, 285.0, 254.0, 179.0, 116.0, 85.0, 73.0, 46.0, 31.0, 15.0, 15.0, 11.0, 7.0, 7.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1484375, -7.855712890625, -7.56298828125, -7.270263671875, -6.9775390625, -6.684814453125, -6.39208984375, -6.099365234375, -5.806640625, -5.513916015625, -5.22119140625, -4.928466796875, -4.6357421875, -4.343017578125, -4.05029296875, -3.757568359375, -3.46484375, -3.172119140625, -2.87939453125, -2.586669921875, -2.2939453125, -2.001220703125, -1.70849609375, -1.415771484375, -1.123046875, -0.830322265625, -0.53759765625, -0.244873046875, 0.0478515625, 0.340576171875, 0.63330078125, 0.926025390625, 1.21875, 1.511474609375, 1.80419921875, 2.096923828125, 2.3896484375, 2.682373046875, 2.97509765625, 3.267822265625, 3.560546875, 3.853271484375, 4.14599609375, 4.438720703125, 4.7314453125, 5.024169921875, 5.31689453125, 5.609619140625, 5.90234375, 6.195068359375, 6.48779296875, 6.780517578125, 7.0732421875, 7.365966796875, 7.65869140625, 7.951416015625, 8.244140625, 8.536865234375, 8.82958984375, 9.122314453125, 9.4150390625, 9.707763671875, 10.00048828125, 10.293212890625, 10.5859375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 6.0, 8.0, 21.0, 15.0, 40.0, 58.0, 66.0, 96.0, 160.0, 213.0, 440.0, 1088.0, 18330.0, 3847561.0, 322302.0, 2464.0, 582.0, 288.0, 172.0, 118.0, 79.0, 50.0, 32.0, 22.0, 18.0, 10.0, 12.0, 7.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.109375, -27.016845703125, -25.92431640625, -24.831787109375, -23.7392578125, -22.646728515625, -21.55419921875, -20.461669921875, -19.369140625, -18.276611328125, -17.18408203125, -16.091552734375, -14.9990234375, -13.906494140625, -12.81396484375, -11.721435546875, -10.62890625, -9.536376953125, -8.44384765625, -7.351318359375, -6.2587890625, -5.166259765625, -4.07373046875, -2.981201171875, -1.888671875, -0.796142578125, 0.29638671875, 1.388916015625, 2.4814453125, 3.573974609375, 4.66650390625, 5.759033203125, 6.8515625, 7.944091796875, 9.03662109375, 10.129150390625, 11.2216796875, 12.314208984375, 13.40673828125, 14.499267578125, 15.591796875, 16.684326171875, 17.77685546875, 18.869384765625, 19.9619140625, 21.054443359375, 22.14697265625, 23.239501953125, 24.33203125, 25.424560546875, 26.51708984375, 27.609619140625, 28.7021484375, 29.794677734375, 30.88720703125, 31.979736328125, 33.072265625, 34.164794921875, 35.25732421875, 36.349853515625, 37.4423828125, 38.534912109375, 39.62744140625, 40.719970703125, 41.8125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 40.0, 115.0, 245.0, 318.0, 208.0, 72.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.05057144165039, -43.94791793823242, -40.84526824951172, -37.74261474609375, -34.63996124267578, -31.537309646606445, -28.43465805053711, -25.33200454711914, -22.229352951049805, -19.12670135498047, -16.0240478515625, -12.921396255493164, -9.818743705749512, -6.716091156005859, -3.6134395599365234, -0.5107860565185547, 2.5918655395507812, 5.694518089294434, 8.797170639038086, 11.899822235107422, 15.002474784851074, 18.105127334594727, 21.207778930664062, 24.31043243408203, 27.413084030151367, 30.515735626220703, 33.61838912963867, 36.721038818359375, 39.823692321777344, 42.92634582519531, 46.02899932861328, 49.13165283203125, 52.23430633544922, 55.33695983886719, 58.43960952758789, 61.54226303100586, 64.64491271972656, 67.74756622314453, 70.8502197265625, 73.95287322998047, 77.05552673339844, 80.1581802368164, 83.26083374023438, 86.36347961425781, 89.46613311767578, 92.56878662109375, 95.67144012451172, 98.77409362792969, 101.87673950195312, 104.9793930053711, 108.08204650878906, 111.1846923828125, 114.28734588623047, 117.38999938964844, 120.4926528930664, 123.59530639648438, 126.69795989990234, 129.8006134033203, 132.90325927734375, 136.00592041015625, 139.1085662841797, 142.2112274169922, 145.31387329101562, 148.41653442382812, 151.51918029785156]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 8.0, 5.0, 7.0, 7.0, 6.0, 9.0, 9.0, 12.0, 15.0, 19.0, 15.0, 13.0, 24.0, 27.0, 30.0, 23.0, 30.0, 32.0, 47.0, 37.0, 30.0, 48.0, 41.0, 36.0, 44.0, 46.0, 29.0, 31.0, 28.0, 31.0, 31.0, 26.0, 21.0, 23.0, 19.0, 23.0, 24.0, 14.0, 5.0, 21.0, 11.0, 14.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.873661041259766, -24.083269119262695, -23.292877197265625, -22.502487182617188, -21.712095260620117, -20.921703338623047, -20.13131332397461, -19.34092140197754, -18.55052947998047, -17.7601375579834, -16.969745635986328, -16.17935562133789, -15.38896369934082, -14.59857177734375, -13.808180809020996, -13.017789840698242, -12.227397918701172, -11.437005996704102, -10.646615028381348, -9.856224060058594, -9.065832138061523, -8.275440216064453, -7.485049247741699, -6.694657802581787, -5.904266357421875, -5.113874912261963, -4.323483467102051, -3.5330920219421387, -2.7427005767822266, -1.9523091316223145, -1.1619176864624023, -0.37152624130249023, 0.4188652038574219, 1.209256649017334, 1.999648094177246, 2.790039539337158, 3.5804309844970703, 4.370822429656982, 5.1612138748168945, 5.951605319976807, 6.741996765136719, 7.532388210296631, 8.322779655456543, 9.113170623779297, 9.903562545776367, 10.693954467773438, 11.484345436096191, 12.274736404418945, 13.065128326416016, 13.855520248413086, 14.64591121673584, 15.436302185058594, 16.226694107055664, 17.017086029052734, 17.807476043701172, 18.597867965698242, 19.388259887695312, 20.178651809692383, 20.969043731689453, 21.75943374633789, 22.54982566833496, 23.34021759033203, 24.13060760498047, 24.92099952697754, 25.71139144897461]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 4.0, 3.0, 5.0, 11.0, 10.0, 11.0, 14.0, 17.0, 19.0, 16.0, 21.0, 20.0, 16.0, 21.0, 25.0, 36.0, 30.0, 33.0, 44.0, 37.0, 41.0, 35.0, 33.0, 42.0, 40.0, 46.0, 39.0, 40.0, 27.0, 29.0, 34.0, 34.0, 20.0, 18.0, 32.0, 16.0, 10.0, 13.0, 8.0, 9.0, 12.0, 6.0, 13.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.951171875, -3.836395263671875, -3.72161865234375, -3.606842041015625, -3.4920654296875, -3.377288818359375, -3.26251220703125, -3.147735595703125, -3.032958984375, -2.918182373046875, -2.80340576171875, -2.688629150390625, -2.5738525390625, -2.459075927734375, -2.34429931640625, -2.229522705078125, -2.11474609375, -1.999969482421875, -1.88519287109375, -1.770416259765625, -1.6556396484375, -1.540863037109375, -1.42608642578125, -1.311309814453125, -1.196533203125, -1.081756591796875, -0.96697998046875, -0.852203369140625, -0.7374267578125, -0.622650146484375, -0.50787353515625, -0.393096923828125, -0.2783203125, -0.163543701171875, -0.04876708984375, 0.066009521484375, 0.1807861328125, 0.295562744140625, 0.41033935546875, 0.525115966796875, 0.639892578125, 0.754669189453125, 0.86944580078125, 0.984222412109375, 1.0989990234375, 1.213775634765625, 1.32855224609375, 1.443328857421875, 1.55810546875, 1.672882080078125, 1.78765869140625, 1.902435302734375, 2.0172119140625, 2.131988525390625, 2.24676513671875, 2.361541748046875, 2.476318359375, 2.591094970703125, 2.70587158203125, 2.820648193359375, 2.9354248046875, 3.050201416015625, 3.16497802734375, 3.279754638671875, 3.39453125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 8.0, 15.0, 24.0, 45.0, 65.0, 126.0, 150.0, 261.0, 387.0, 748.0, 1214.0, 1841.0, 2764.0, 4221.0, 6556.0, 10006.0, 15991.0, 25732.0, 42078.0, 73314.0, 146270.0, 343422.0, 169965.0, 81611.0, 46165.0, 27627.0, 17039.0, 10920.0, 6981.0, 4658.0, 3129.0, 1963.0, 1217.0, 747.0, 498.0, 316.0, 173.0, 98.0, 68.0, 44.0, 27.0, 25.0, 15.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.03515625, -1.0052261352539062, -0.9752960205078125, -0.9453659057617188, -0.915435791015625, -0.8855056762695312, -0.8555755615234375, -0.8256454467773438, -0.79571533203125, -0.7657852172851562, -0.7358551025390625, -0.7059249877929688, -0.675994873046875, -0.6460647583007812, -0.6161346435546875, -0.5862045288085938, -0.5562744140625, -0.5263442993164062, -0.4964141845703125, -0.46648406982421875, -0.436553955078125, -0.40662384033203125, -0.3766937255859375, -0.34676361083984375, -0.31683349609375, -0.28690338134765625, -0.2569732666015625, -0.22704315185546875, -0.197113037109375, -0.16718292236328125, -0.1372528076171875, -0.10732269287109375, -0.077392578125, -0.04746246337890625, -0.0175323486328125, 0.01239776611328125, 0.042327880859375, 0.07225799560546875, 0.1021881103515625, 0.13211822509765625, 0.16204833984375, 0.19197845458984375, 0.2219085693359375, 0.25183868408203125, 0.281768798828125, 0.31169891357421875, 0.3416290283203125, 0.37155914306640625, 0.4014892578125, 0.43141937255859375, 0.4613494873046875, 0.49127960205078125, 0.521209716796875, 0.5511398315429688, 0.5810699462890625, 0.6110000610351562, 0.64093017578125, 0.6708602905273438, 0.7007904052734375, 0.7307205200195312, 0.760650634765625, 0.7905807495117188, 0.8205108642578125, 0.8504409790039062, 0.88037109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 7.0, 12.0, 12.0, 16.0, 15.0, 17.0, 32.0, 27.0, 29.0, 29.0, 30.0, 42.0, 37.0, 39.0, 33.0, 52.0, 49.0, 1066.0, 36.0, 44.0, 53.0, 43.0, 36.0, 33.0, 27.0, 35.0, 19.0, 22.0, 12.0, 23.0, 16.0, 14.0, 11.0, 12.0, 4.0, 4.0, 9.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.794921875, -2.7132568359375, -2.631591796875, -2.5499267578125, -2.46826171875, -2.3865966796875, -2.304931640625, -2.2232666015625, -2.1416015625, -2.0599365234375, -1.978271484375, -1.8966064453125, -1.81494140625, -1.7332763671875, -1.651611328125, -1.5699462890625, -1.48828125, -1.4066162109375, -1.324951171875, -1.2432861328125, -1.16162109375, -1.0799560546875, -0.998291015625, -0.9166259765625, -0.8349609375, -0.7532958984375, -0.671630859375, -0.5899658203125, -0.50830078125, -0.4266357421875, -0.344970703125, -0.2633056640625, -0.181640625, -0.0999755859375, -0.018310546875, 0.0633544921875, 0.14501953125, 0.2266845703125, 0.308349609375, 0.3900146484375, 0.4716796875, 0.5533447265625, 0.635009765625, 0.7166748046875, 0.79833984375, 0.8800048828125, 0.961669921875, 1.0433349609375, 1.125, 1.2066650390625, 1.288330078125, 1.3699951171875, 1.45166015625, 1.5333251953125, 1.614990234375, 1.6966552734375, 1.7783203125, 1.8599853515625, 1.941650390625, 2.0233154296875, 2.10498046875, 2.1866455078125, 2.268310546875, 2.3499755859375, 2.431640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 10.0, 10.0, 6.0, 19.0, 27.0, 43.0, 41.0, 83.0, 133.0, 143.0, 243.0, 374.0, 554.0, 828.0, 1333.0, 2127.0, 3454.0, 5872.0, 9813.0, 17078.0, 30213.0, 55291.0, 107327.0, 1358654.0, 278042.0, 103443.0, 52554.0, 28588.0, 16261.0, 9485.0, 5815.0, 3457.0, 2097.0, 1325.0, 874.0, 551.0, 352.0, 204.0, 156.0, 74.0, 65.0, 40.0, 18.0, 23.0, 15.0, 4.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.973236083984375, -0.93963623046875, -0.906036376953125, -0.8724365234375, -0.838836669921875, -0.80523681640625, -0.771636962890625, -0.738037109375, -0.704437255859375, -0.67083740234375, -0.637237548828125, -0.6036376953125, -0.570037841796875, -0.53643798828125, -0.502838134765625, -0.46923828125, -0.435638427734375, -0.40203857421875, -0.368438720703125, -0.3348388671875, -0.301239013671875, -0.26763916015625, -0.234039306640625, -0.200439453125, -0.166839599609375, -0.13323974609375, -0.099639892578125, -0.0660400390625, -0.032440185546875, 0.00115966796875, 0.034759521484375, 0.068359375, 0.101959228515625, 0.13555908203125, 0.169158935546875, 0.2027587890625, 0.236358642578125, 0.26995849609375, 0.303558349609375, 0.337158203125, 0.370758056640625, 0.40435791015625, 0.437957763671875, 0.4715576171875, 0.505157470703125, 0.53875732421875, 0.572357177734375, 0.60595703125, 0.639556884765625, 0.67315673828125, 0.706756591796875, 0.7403564453125, 0.773956298828125, 0.80755615234375, 0.841156005859375, 0.874755859375, 0.908355712890625, 0.94195556640625, 0.975555419921875, 1.0091552734375, 1.042755126953125, 1.07635498046875, 1.109954833984375, 1.1435546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 6.0, 7.0, 11.0, 17.0, 18.0, 20.0, 31.0, 44.0, 53.0, 81.0, 112.0, 116.0, 106.0, 97.0, 75.0, 55.0, 40.0, 25.0, 22.0, 21.0, 12.0, 10.0, 8.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00101470947265625, -0.0009866058826446533, -0.0009585022926330566, -0.00093039870262146, -0.0009022951126098633, -0.0008741915225982666, -0.0008460879325866699, -0.0008179843425750732, -0.0007898807525634766, -0.0007617771625518799, -0.0007336735725402832, -0.0007055699825286865, -0.0006774663925170898, -0.0006493628025054932, -0.0006212592124938965, -0.0005931556224822998, -0.0005650520324707031, -0.0005369484424591064, -0.0005088448524475098, -0.0004807412624359131, -0.0004526376724243164, -0.0004245340824127197, -0.00039643049240112305, -0.00036832690238952637, -0.0003402233123779297, -0.000312119722366333, -0.00028401613235473633, -0.00025591254234313965, -0.00022780895233154297, -0.0001997053623199463, -0.0001716017723083496, -0.00014349818229675293, -0.00011539459228515625, -8.729100227355957e-05, -5.918741226196289e-05, -3.108382225036621e-05, -2.9802322387695312e-06, 2.512335777282715e-05, 5.322694778442383e-05, 8.133053779602051e-05, 0.00010943412780761719, 0.00013753771781921387, 0.00016564130783081055, 0.00019374489784240723, 0.0002218484878540039, 0.0002499520778656006, 0.00027805566787719727, 0.00030615925788879395, 0.0003342628479003906, 0.0003623664379119873, 0.000390470027923584, 0.00041857361793518066, 0.00044667720794677734, 0.000474780797958374, 0.0005028843879699707, 0.0005309879779815674, 0.0005590915679931641, 0.0005871951580047607, 0.0006152987480163574, 0.0006434023380279541, 0.0006715059280395508, 0.0006996095180511475, 0.0007277131080627441, 0.0007558166980743408, 0.0007839202880859375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 8.0, 1.0, 12.0, 11.0, 16.0, 13.0, 32.0, 37.0, 50.0, 79.0, 156.0, 285.0, 1150.0, 970966.0, 74400.0, 702.0, 255.0, 138.0, 71.0, 43.0, 38.0, 32.0, 18.0, 11.0, 12.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169525146484375, -0.01634383201599121, -0.015735149383544922, -0.015126466751098633, -0.014517784118652344, -0.013909101486206055, -0.013300418853759766, -0.012691736221313477, -0.012083053588867188, -0.011474370956420898, -0.01086568832397461, -0.01025700569152832, -0.009648323059082031, -0.009039640426635742, -0.008430957794189453, -0.007822275161743164, -0.007213592529296875, -0.006604909896850586, -0.005996227264404297, -0.005387544631958008, -0.004778861999511719, -0.00417017936706543, -0.0035614967346191406, -0.0029528141021728516, -0.0023441314697265625, -0.0017354488372802734, -0.0011267662048339844, -0.0005180835723876953, 9.059906005859375e-05, 0.0006992816925048828, 0.0013079643249511719, 0.001916646957397461, 0.00252532958984375, 0.003134012222290039, 0.003742694854736328, 0.004351377487182617, 0.004960060119628906, 0.005568742752075195, 0.006177425384521484, 0.0067861080169677734, 0.0073947906494140625, 0.008003473281860352, 0.00861215591430664, 0.00922083854675293, 0.009829521179199219, 0.010438203811645508, 0.011046886444091797, 0.011655569076538086, 0.012264251708984375, 0.012872934341430664, 0.013481616973876953, 0.014090299606323242, 0.014698982238769531, 0.01530766487121582, 0.01591634750366211, 0.0165250301361084, 0.017133712768554688, 0.017742395401000977, 0.018351078033447266, 0.018959760665893555, 0.019568443298339844, 0.020177125930786133, 0.020785808563232422, 0.02139449119567871, 0.022003173828125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 33.0, 135.0, 313.0, 337.0, 149.0, 34.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001753966324031353, -0.0017149875639006495, -0.001676008803769946, -0.0016370301600545645, -0.001598051399923861, -0.0015590726397931576, -0.0015200938796624541, -0.0014811151195317507, -0.001442136475816369, -0.0014031577156856656, -0.0013641789555549622, -0.0013252003118395805, -0.001286221551708877, -0.0012472427915781736, -0.0012082640314474702, -0.0011692852713167667, -0.0011303066276013851, -0.0010913278674706817, -0.0010523491073399782, -0.0010133704636245966, -0.0009743917034938931, -0.0009354129433631897, -0.0008964341832324862, -0.0008574554813094437, -0.0008184766629710793, -0.0007794979028403759, -0.0007405192009173334, -0.0007015404407866299, -0.0006625617388635874, -0.0006235829787328839, -0.0005846042186021805, -0.0005456255166791379, -0.0005066467565484345, -0.0004676680255215615, -0.0004286892944946885, -0.00038971053436398506, -0.0003507318324409425, -0.0003117530723102391, -0.0002727743412833661, -0.0002337956102564931, -0.0001948168792296201, -0.0001558381482027471, -0.0001168594098999165, -7.788067159708589e-05, -3.89019405702129e-05, 7.679045666009188e-08, 3.905553603544831e-05, 7.80342670623213e-05, 0.0001170129980891943, 0.0001559917291160673, 0.00019497046014294028, 0.0002339492057217285, 0.00027292792219668627, 0.0003119066823273897, 0.0003508854133542627, 0.0003898641443811357, 0.0004288428754080087, 0.0004678216064348817, 0.0005068003665655851, 0.0005457790684886277, 0.0005847578286193311, 0.0006237365305423737, 0.0006627152906730771, 0.0007016940508037806, 0.0007406727527268231]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 7.0, 9.0, 7.0, 19.0, 16.0, 16.0, 21.0, 17.0, 23.0, 22.0, 33.0, 33.0, 31.0, 38.0, 47.0, 36.0, 43.0, 36.0, 40.0, 46.0, 35.0, 37.0, 47.0, 44.0, 38.0, 35.0, 32.0, 25.0, 24.0, 21.0, 24.0, 17.0, 10.0, 10.0, 12.0, 9.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003139972686767578, -0.00030429940670728683, -0.00029460154473781586, -0.0002849036827683449, -0.0002752058207988739, -0.0002655079588294029, -0.00025581009685993195, -0.00024611223489046097, -0.00023641437292099, -0.000226716510951519, -0.00021701864898204803, -0.00020732078701257706, -0.00019762292504310608, -0.0001879250630736351, -0.00017822720110416412, -0.00016852933913469315, -0.00015883147716522217, -0.0001491336151957512, -0.0001394357532262802, -0.00012973789125680923, -0.00012004002928733826, -0.00011034216731786728, -0.0001006443053483963, -9.094644337892532e-05, -8.124858140945435e-05, -7.155071943998337e-05, -6.185285747051239e-05, -5.215499550104141e-05, -4.2457133531570435e-05, -3.275927156209946e-05, -2.306140959262848e-05, -1.3363547623157501e-05, -3.6656856536865234e-06, 6.032176315784454e-06, 1.5730038285255432e-05, 2.542790025472641e-05, 3.512576222419739e-05, 4.4823624193668365e-05, 5.452148616313934e-05, 6.421934813261032e-05, 7.39172101020813e-05, 8.361507207155228e-05, 9.331293404102325e-05, 0.00010301079601049423, 0.00011270865797996521, 0.0001224065199494362, 0.00013210438191890717, 0.00014180224388837814, 0.00015150010585784912, 0.0001611979678273201, 0.00017089582979679108, 0.00018059369176626205, 0.00019029155373573303, 0.000199989415705204, 0.000209687277674675, 0.00021938513964414597, 0.00022908300161361694, 0.00023878086358308792, 0.0002484787255525589, 0.0002581765875220299, 0.00026787444949150085, 0.00027757231146097183, 0.0002872701734304428, 0.0002969680353999138, 0.00030666589736938477]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 4.0, 3.0, 5.0, 11.0, 10.0, 11.0, 14.0, 17.0, 19.0, 16.0, 21.0, 20.0, 16.0, 21.0, 25.0, 36.0, 30.0, 33.0, 44.0, 37.0, 41.0, 35.0, 33.0, 42.0, 40.0, 46.0, 39.0, 40.0, 27.0, 29.0, 34.0, 34.0, 20.0, 18.0, 32.0, 16.0, 10.0, 13.0, 8.0, 9.0, 12.0, 6.0, 13.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.951171875, -3.836395263671875, -3.72161865234375, -3.606842041015625, -3.4920654296875, -3.377288818359375, -3.26251220703125, -3.147735595703125, -3.032958984375, -2.918182373046875, -2.80340576171875, -2.688629150390625, -2.5738525390625, -2.459075927734375, -2.34429931640625, -2.229522705078125, -2.11474609375, -1.999969482421875, -1.88519287109375, -1.770416259765625, -1.6556396484375, -1.540863037109375, -1.42608642578125, -1.311309814453125, -1.196533203125, -1.081756591796875, -0.96697998046875, -0.852203369140625, -0.7374267578125, -0.622650146484375, -0.50787353515625, -0.393096923828125, -0.2783203125, -0.163543701171875, -0.04876708984375, 0.066009521484375, 0.1807861328125, 0.295562744140625, 0.41033935546875, 0.525115966796875, 0.639892578125, 0.754669189453125, 0.86944580078125, 0.984222412109375, 1.0989990234375, 1.213775634765625, 1.32855224609375, 1.443328857421875, 1.55810546875, 1.672882080078125, 1.78765869140625, 1.902435302734375, 2.0172119140625, 2.131988525390625, 2.24676513671875, 2.361541748046875, 2.476318359375, 2.591094970703125, 2.70587158203125, 2.820648193359375, 2.9354248046875, 3.050201416015625, 3.16497802734375, 3.279754638671875, 3.39453125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 9.0, 7.0, 17.0, 16.0, 26.0, 35.0, 60.0, 62.0, 126.0, 183.0, 329.0, 494.0, 1013.0, 2399.0, 6633.0, 21911.0, 73697.0, 251660.0, 466608.0, 154978.0, 46332.0, 13836.0, 4409.0, 1760.0, 817.0, 429.0, 233.0, 152.0, 109.0, 56.0, 47.0, 34.0, 19.0, 17.0, 15.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-7.1640625, -6.986328125, -6.80859375, -6.630859375, -6.453125, -6.275390625, -6.09765625, -5.919921875, -5.7421875, -5.564453125, -5.38671875, -5.208984375, -5.03125, -4.853515625, -4.67578125, -4.498046875, -4.3203125, -4.142578125, -3.96484375, -3.787109375, -3.609375, -3.431640625, -3.25390625, -3.076171875, -2.8984375, -2.720703125, -2.54296875, -2.365234375, -2.1875, -2.009765625, -1.83203125, -1.654296875, -1.4765625, -1.298828125, -1.12109375, -0.943359375, -0.765625, -0.587890625, -0.41015625, -0.232421875, -0.0546875, 0.123046875, 0.30078125, 0.478515625, 0.65625, 0.833984375, 1.01171875, 1.189453125, 1.3671875, 1.544921875, 1.72265625, 1.900390625, 2.078125, 2.255859375, 2.43359375, 2.611328125, 2.7890625, 2.966796875, 3.14453125, 3.322265625, 3.5, 3.677734375, 3.85546875, 4.033203125, 4.2109375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 8.0, 13.0, 11.0, 14.0, 17.0, 9.0, 25.0, 28.0, 30.0, 33.0, 44.0, 37.0, 55.0, 59.0, 95.0, 203.0, 1543.0, 256.0, 106.0, 67.0, 64.0, 38.0, 53.0, 42.0, 35.0, 32.0, 32.0, 20.0, 13.0, 14.0, 9.0, 10.0, 6.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.859375, -15.400634765625, -14.94189453125, -14.483154296875, -14.0244140625, -13.565673828125, -13.10693359375, -12.648193359375, -12.189453125, -11.730712890625, -11.27197265625, -10.813232421875, -10.3544921875, -9.895751953125, -9.43701171875, -8.978271484375, -8.51953125, -8.060791015625, -7.60205078125, -7.143310546875, -6.6845703125, -6.225830078125, -5.76708984375, -5.308349609375, -4.849609375, -4.390869140625, -3.93212890625, -3.473388671875, -3.0146484375, -2.555908203125, -2.09716796875, -1.638427734375, -1.1796875, -0.720947265625, -0.26220703125, 0.196533203125, 0.6552734375, 1.114013671875, 1.57275390625, 2.031494140625, 2.490234375, 2.948974609375, 3.40771484375, 3.866455078125, 4.3251953125, 4.783935546875, 5.24267578125, 5.701416015625, 6.16015625, 6.618896484375, 7.07763671875, 7.536376953125, 7.9951171875, 8.453857421875, 8.91259765625, 9.371337890625, 9.830078125, 10.288818359375, 10.74755859375, 11.206298828125, 11.6650390625, 12.123779296875, 12.58251953125, 13.041259765625, 13.5]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 16.0, 19.0, 24.0, 42.0, 64.0, 80.0, 159.0, 289.0, 736.0, 12369.0, 3128561.0, 2291.0, 490.0, 216.0, 102.0, 89.0, 45.0, 28.0, 26.0, 14.0, 12.0, 10.0, 6.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -36.76025390625, -34.3642578125, -31.96826171875, -29.572265625, -27.17626953125, -24.7802734375, -22.38427734375, -19.98828125, -17.59228515625, -15.1962890625, -12.80029296875, -10.404296875, -8.00830078125, -5.6123046875, -3.21630859375, -0.8203125, 1.57568359375, 3.9716796875, 6.36767578125, 8.763671875, 11.15966796875, 13.5556640625, 15.95166015625, 18.34765625, 20.74365234375, 23.1396484375, 25.53564453125, 27.931640625, 30.32763671875, 32.7236328125, 35.11962890625, 37.515625, 39.91162109375, 42.3076171875, 44.70361328125, 47.099609375, 49.49560546875, 51.8916015625, 54.28759765625, 56.68359375, 59.07958984375, 61.4755859375, 63.87158203125, 66.267578125, 68.66357421875, 71.0595703125, 73.45556640625, 75.8515625, 78.24755859375, 80.6435546875, 83.03955078125, 85.435546875, 87.83154296875, 90.2275390625, 92.62353515625, 95.01953125, 97.41552734375, 99.8115234375, 102.20751953125, 104.603515625, 106.99951171875, 109.3955078125, 111.79150390625, 114.1875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 21.0, 64.0, 96.0, 139.0, 184.0, 200.0, 140.0, 80.0, 40.0, 21.0, 13.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.113792419433594, -41.10508346557617, -40.09637451171875, -39.08766555786133, -38.078956604003906, -37.070247650146484, -36.06153869628906, -35.052833557128906, -34.04412078857422, -33.0354118347168, -32.026702880859375, -31.017993927001953, -30.00928497314453, -29.00057601928711, -27.99186897277832, -26.9831600189209, -25.97445297241211, -24.965744018554688, -23.957035064697266, -22.948326110839844, -21.939617156982422, -20.930908203125, -19.92220115661621, -18.91349220275879, -17.904783248901367, -16.896074295043945, -15.887365341186523, -14.878657341003418, -13.869948387145996, -12.861239433288574, -11.852531433105469, -10.843822479248047, -9.835115432739258, -8.826406478881836, -7.817698001861572, -6.808989524841309, -5.800280570983887, -4.791571617126465, -3.782863140106201, -2.7741546630859375, -1.7654457092285156, -0.7567369937896729, 0.2519717216491699, 1.2606804370880127, 2.2693891525268555, 3.2780981063842773, 4.286806583404541, 5.295515060424805, 6.304224014282227, 7.312932968139648, 8.32164192199707, 9.330349922180176, 10.339058876037598, 11.34776782989502, 12.356475830078125, 13.365184783935547, 14.373893737792969, 15.38260269165039, 16.391311645507812, 17.400020599365234, 18.408729553222656, 19.417438507080078, 20.426145553588867, 21.43485450744629, 22.44356346130371]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 8.0, 7.0, 7.0, 10.0, 15.0, 17.0, 18.0, 24.0, 35.0, 31.0, 36.0, 45.0, 37.0, 46.0, 43.0, 42.0, 39.0, 39.0, 46.0, 42.0, 34.0, 44.0, 33.0, 27.0, 33.0, 23.0, 25.0, 27.0, 24.0, 31.0, 18.0, 17.0, 13.0, 11.0, 6.0, 13.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-44.56050109863281, -43.31117630004883, -42.06185531616211, -40.812530517578125, -39.563209533691406, -38.31388473510742, -37.0645637512207, -35.81523895263672, -34.56591796875, -33.316593170166016, -32.0672721862793, -30.817949295043945, -29.568626403808594, -28.319303512573242, -27.06998062133789, -25.820655822753906, -24.571332931518555, -23.322010040283203, -22.07268714904785, -20.8233642578125, -19.57404136657715, -18.324718475341797, -17.075393676757812, -15.826071739196777, -14.576748847961426, -13.327425956726074, -12.078103065490723, -10.828779220581055, -9.579456329345703, -8.330133438110352, -7.080810546875, -5.831487655639648, -4.582164764404297, -3.3328418731689453, -2.0835187435150146, -0.834195613861084, 0.4151272773742676, 1.6644501686096191, 2.913773536682129, 4.1630964279174805, 5.412419319152832, 6.661742210388184, 7.911065101623535, 9.160388946533203, 10.409711837768555, 11.659034729003906, 12.908357620239258, 14.15768051147461, 15.407003402709961, 16.656326293945312, 17.905649185180664, 19.154972076416016, 20.404294967651367, 21.65361785888672, 22.902942657470703, 24.152263641357422, 25.401588439941406, 26.650911331176758, 27.90023422241211, 29.14955711364746, 30.398880004882812, 31.648202896118164, 32.897525787353516, 34.1468505859375, 35.39617156982422]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 2.0, 6.0, 6.0, 3.0, 6.0, 8.0, 13.0, 14.0, 10.0, 16.0, 18.0, 25.0, 10.0, 16.0, 22.0, 23.0, 27.0, 27.0, 16.0, 26.0, 25.0, 48.0, 33.0, 44.0, 40.0, 43.0, 41.0, 26.0, 36.0, 36.0, 40.0, 34.0, 27.0, 24.0, 20.0, 20.0, 24.0, 23.0, 18.0, 20.0, 14.0, 14.0, 6.0, 8.0, 9.0, 7.0, 7.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.900390625, -3.77899169921875, -3.6575927734375, -3.53619384765625, -3.414794921875, -3.29339599609375, -3.1719970703125, -3.05059814453125, -2.92919921875, -2.80780029296875, -2.6864013671875, -2.56500244140625, -2.443603515625, -2.32220458984375, -2.2008056640625, -2.07940673828125, -1.9580078125, -1.83660888671875, -1.7152099609375, -1.59381103515625, -1.472412109375, -1.35101318359375, -1.2296142578125, -1.10821533203125, -0.98681640625, -0.86541748046875, -0.7440185546875, -0.62261962890625, -0.501220703125, -0.37982177734375, -0.2584228515625, -0.13702392578125, -0.015625, 0.10577392578125, 0.2271728515625, 0.34857177734375, 0.469970703125, 0.59136962890625, 0.7127685546875, 0.83416748046875, 0.95556640625, 1.07696533203125, 1.1983642578125, 1.31976318359375, 1.441162109375, 1.56256103515625, 1.6839599609375, 1.80535888671875, 1.9267578125, 2.04815673828125, 2.1695556640625, 2.29095458984375, 2.412353515625, 2.53375244140625, 2.6551513671875, 2.77655029296875, 2.89794921875, 3.01934814453125, 3.1407470703125, 3.26214599609375, 3.383544921875, 3.50494384765625, 3.6263427734375, 3.74774169921875, 3.869140625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 10.0, 8.0, 10.0, 15.0, 12.0, 7.0, 13.0, 22.0, 20.0, 21.0, 22.0, 27.0, 26.0, 42.0, 51.0, 86.0, 216.0, 548.0, 1941.0, 20722.0, 958425.0, 3006934.0, 196833.0, 6241.0, 1091.0, 379.0, 158.0, 82.0, 51.0, 42.0, 31.0, 26.0, 26.0, 20.0, 18.0, 19.0, 11.0, 11.0, 13.0, 8.0, 11.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.4765625, -14.0281982421875, -13.579833984375, -13.1314697265625, -12.68310546875, -12.2347412109375, -11.786376953125, -11.3380126953125, -10.8896484375, -10.4412841796875, -9.992919921875, -9.5445556640625, -9.09619140625, -8.6478271484375, -8.199462890625, -7.7510986328125, -7.302734375, -6.8543701171875, -6.406005859375, -5.9576416015625, -5.50927734375, -5.0609130859375, -4.612548828125, -4.1641845703125, -3.7158203125, -3.2674560546875, -2.819091796875, -2.3707275390625, -1.92236328125, -1.4739990234375, -1.025634765625, -0.5772705078125, -0.12890625, 0.3194580078125, 0.767822265625, 1.2161865234375, 1.66455078125, 2.1129150390625, 2.561279296875, 3.0096435546875, 3.4580078125, 3.9063720703125, 4.354736328125, 4.8031005859375, 5.25146484375, 5.6998291015625, 6.148193359375, 6.5965576171875, 7.044921875, 7.4932861328125, 7.941650390625, 8.3900146484375, 8.83837890625, 9.2867431640625, 9.735107421875, 10.1834716796875, 10.6318359375, 11.0802001953125, 11.528564453125, 11.9769287109375, 12.42529296875, 12.8736572265625, 13.322021484375, 13.7703857421875, 14.21875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 3.0, 3.0, 5.0, 7.0, 11.0, 19.0, 27.0, 41.0, 44.0, 47.0, 65.0, 95.0, 127.0, 163.0, 228.0, 311.0, 363.0, 413.0, 422.0, 425.0, 301.0, 233.0, 176.0, 142.0, 100.0, 83.0, 53.0, 45.0, 31.0, 28.0, 16.0, 10.0, 12.0, 12.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.9306640625, -7.658203125, -7.3857421875, -7.11328125, -6.8408203125, -6.568359375, -6.2958984375, -6.0234375, -5.7509765625, -5.478515625, -5.2060546875, -4.93359375, -4.6611328125, -4.388671875, -4.1162109375, -3.84375, -3.5712890625, -3.298828125, -3.0263671875, -2.75390625, -2.4814453125, -2.208984375, -1.9365234375, -1.6640625, -1.3916015625, -1.119140625, -0.8466796875, -0.57421875, -0.3017578125, -0.029296875, 0.2431640625, 0.515625, 0.7880859375, 1.060546875, 1.3330078125, 1.60546875, 1.8779296875, 2.150390625, 2.4228515625, 2.6953125, 2.9677734375, 3.240234375, 3.5126953125, 3.78515625, 4.0576171875, 4.330078125, 4.6025390625, 4.875, 5.1474609375, 5.419921875, 5.6923828125, 5.96484375, 6.2373046875, 6.509765625, 6.7822265625, 7.0546875, 7.3271484375, 7.599609375, 7.8720703125, 8.14453125, 8.4169921875, 8.689453125, 8.9619140625, 9.234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 14.0, 15.0, 13.0, 27.0, 30.0, 38.0, 44.0, 65.0, 79.0, 113.0, 145.0, 186.0, 236.0, 340.0, 627.0, 3140.0, 266331.0, 3870769.0, 48714.0, 1635.0, 509.0, 280.0, 215.0, 148.0, 135.0, 85.0, 89.0, 75.0, 42.0, 39.0, 29.0, 25.0, 16.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.75, -31.796630859375, -30.84326171875, -29.889892578125, -28.9365234375, -27.983154296875, -27.02978515625, -26.076416015625, -25.123046875, -24.169677734375, -23.21630859375, -22.262939453125, -21.3095703125, -20.356201171875, -19.40283203125, -18.449462890625, -17.49609375, -16.542724609375, -15.58935546875, -14.635986328125, -13.6826171875, -12.729248046875, -11.77587890625, -10.822509765625, -9.869140625, -8.915771484375, -7.96240234375, -7.009033203125, -6.0556640625, -5.102294921875, -4.14892578125, -3.195556640625, -2.2421875, -1.288818359375, -0.33544921875, 0.617919921875, 1.5712890625, 2.524658203125, 3.47802734375, 4.431396484375, 5.384765625, 6.338134765625, 7.29150390625, 8.244873046875, 9.1982421875, 10.151611328125, 11.10498046875, 12.058349609375, 13.01171875, 13.965087890625, 14.91845703125, 15.871826171875, 16.8251953125, 17.778564453125, 18.73193359375, 19.685302734375, 20.638671875, 21.592041015625, 22.54541015625, 23.498779296875, 24.4521484375, 25.405517578125, 26.35888671875, 27.312255859375, 28.265625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 45.0, 195.0, 380.0, 286.0, 95.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.7434844970703, -178.9963836669922, -175.24929809570312, -171.502197265625, -167.75509643554688, -164.00799560546875, -160.2609100341797, -156.51380920410156, -152.76670837402344, -149.0196075439453, -145.27252197265625, -141.52542114257812, -137.7783203125, -134.03121948242188, -130.2841339111328, -126.53703308105469, -122.78993225097656, -119.04283905029297, -115.29573822021484, -111.54864501953125, -107.80154418945312, -104.05445098876953, -100.3073501586914, -96.56025695800781, -92.81316375732422, -89.06607055664062, -85.3189697265625, -81.5718765258789, -77.82477569580078, -74.07768249511719, -70.33058166503906, -66.58348846435547, -62.83638381958008, -59.08928680419922, -55.34218978881836, -51.5950927734375, -47.84799575805664, -44.10089874267578, -40.35380554199219, -36.60670471191406, -32.85961151123047, -29.11251449584961, -25.36541748046875, -21.61832046508789, -17.87122344970703, -14.124128341674805, -10.377031326293945, -6.629934310913086, -2.8828353881835938, 0.8642613887786865, 4.611358165740967, 8.358454704284668, 12.105551719665527, 15.85264778137207, 19.59974479675293, 23.34684181213379, 27.09393882751465, 30.841035842895508, 34.588130950927734, 38.335227966308594, 42.08232498168945, 45.82942199707031, 49.57651901245117, 53.32361602783203, 57.07071304321289]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 5.0, 13.0, 8.0, 12.0, 16.0, 15.0, 17.0, 17.0, 13.0, 31.0, 33.0, 21.0, 39.0, 27.0, 30.0, 35.0, 33.0, 51.0, 41.0, 39.0, 33.0, 25.0, 29.0, 29.0, 41.0, 33.0, 41.0, 30.0, 25.0, 22.0, 28.0, 28.0, 17.0, 18.0, 22.0, 14.0, 9.0, 10.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.10993194580078, -23.26485824584961, -22.419784545898438, -21.574710845947266, -20.729637145996094, -19.884563446044922, -19.03948974609375, -18.194416046142578, -17.349342346191406, -16.504268646240234, -15.659194946289062, -14.81412124633789, -13.969047546386719, -13.123973846435547, -12.278899192810059, -11.433825492858887, -10.588750839233398, -9.743677139282227, -8.898603439331055, -8.053529739379883, -7.208455562591553, -6.363381862640381, -5.518307685852051, -4.673233985900879, -3.828160285949707, -2.983086585998535, -2.138012647628784, -1.2929387092590332, -0.44786500930786133, 0.39720869064331055, 1.2422828674316406, 2.0873565673828125, 2.9324302673339844, 3.7775039672851562, 4.622577667236328, 5.467651844024658, 6.31272554397583, 7.157799243927002, 8.002873420715332, 8.847947120666504, 9.693020820617676, 10.538094520568848, 11.38316822052002, 12.228242874145508, 13.07331657409668, 13.918390274047852, 14.763463973999023, 15.608537673950195, 16.453611373901367, 17.29868507385254, 18.14375877380371, 18.988832473754883, 19.833906173706055, 20.678979873657227, 21.52405548095703, 22.369129180908203, 23.214202880859375, 24.059276580810547, 24.90435028076172, 25.74942398071289, 26.594497680664062, 27.439571380615234, 28.284645080566406, 29.129718780517578, 29.97479248046875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 7.0, 10.0, 10.0, 9.0, 9.0, 8.0, 19.0, 23.0, 18.0, 20.0, 18.0, 17.0, 31.0, 24.0, 29.0, 42.0, 32.0, 38.0, 38.0, 36.0, 48.0, 51.0, 56.0, 49.0, 38.0, 32.0, 32.0, 25.0, 31.0, 29.0, 20.0, 33.0, 20.0, 13.0, 22.0, 15.0, 13.0, 11.0, 4.0, 6.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.76068115234375, -3.6307373046875, -3.50079345703125, -3.370849609375, -3.24090576171875, -3.1109619140625, -2.98101806640625, -2.85107421875, -2.72113037109375, -2.5911865234375, -2.46124267578125, -2.331298828125, -2.20135498046875, -2.0714111328125, -1.94146728515625, -1.8115234375, -1.68157958984375, -1.5516357421875, -1.42169189453125, -1.291748046875, -1.16180419921875, -1.0318603515625, -0.90191650390625, -0.77197265625, -0.64202880859375, -0.5120849609375, -0.38214111328125, -0.252197265625, -0.12225341796875, 0.0076904296875, 0.13763427734375, 0.267578125, 0.39752197265625, 0.5274658203125, 0.65740966796875, 0.787353515625, 0.91729736328125, 1.0472412109375, 1.17718505859375, 1.30712890625, 1.43707275390625, 1.5670166015625, 1.69696044921875, 1.826904296875, 1.95684814453125, 2.0867919921875, 2.21673583984375, 2.3466796875, 2.47662353515625, 2.6065673828125, 2.73651123046875, 2.866455078125, 2.99639892578125, 3.1263427734375, 3.25628662109375, 3.38623046875, 3.51617431640625, 3.6461181640625, 3.77606201171875, 3.906005859375, 4.03594970703125, 4.1658935546875, 4.29583740234375, 4.42578125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 14.0, 25.0, 37.0, 61.0, 86.0, 106.0, 185.0, 225.0, 376.0, 513.0, 795.0, 1142.0, 1672.0, 2312.0, 3415.0, 5095.0, 7324.0, 10500.0, 16051.0, 23769.0, 36053.0, 56112.0, 95801.0, 219123.0, 281075.0, 107063.0, 61402.0, 38884.0, 25740.0, 17101.0, 11564.0, 7904.0, 5348.0, 3637.0, 2528.0, 1704.0, 1128.0, 794.0, 601.0, 382.0, 295.0, 189.0, 145.0, 88.0, 66.0, 42.0, 20.0, 26.0, 10.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.93408203125, -0.905853271484375, -0.87762451171875, -0.849395751953125, -0.8211669921875, -0.792938232421875, -0.76470947265625, -0.736480712890625, -0.708251953125, -0.680023193359375, -0.65179443359375, -0.623565673828125, -0.5953369140625, -0.567108154296875, -0.53887939453125, -0.510650634765625, -0.482421875, -0.454193115234375, -0.42596435546875, -0.397735595703125, -0.3695068359375, -0.341278076171875, -0.31304931640625, -0.284820556640625, -0.256591796875, -0.228363037109375, -0.20013427734375, -0.171905517578125, -0.1436767578125, -0.115447998046875, -0.08721923828125, -0.058990478515625, -0.03076171875, -0.002532958984375, 0.02569580078125, 0.053924560546875, 0.0821533203125, 0.110382080078125, 0.13861083984375, 0.166839599609375, 0.195068359375, 0.223297119140625, 0.25152587890625, 0.279754638671875, 0.3079833984375, 0.336212158203125, 0.36444091796875, 0.392669677734375, 0.4208984375, 0.449127197265625, 0.47735595703125, 0.505584716796875, 0.5338134765625, 0.562042236328125, 0.59027099609375, 0.618499755859375, 0.646728515625, 0.674957275390625, 0.70318603515625, 0.731414794921875, 0.7596435546875, 0.787872314453125, 0.81610107421875, 0.844329833984375, 0.87255859375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 10.0, 8.0, 11.0, 19.0, 19.0, 31.0, 33.0, 33.0, 37.0, 51.0, 36.0, 49.0, 35.0, 45.0, 32.0, 1079.0, 52.0, 50.0, 55.0, 44.0, 39.0, 31.0, 28.0, 27.0, 25.0, 20.0, 23.0, 17.0, 13.0, 9.0, 12.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921875, -2.895782470703125, -2.79937744140625, -2.702972412109375, -2.6065673828125, -2.510162353515625, -2.41375732421875, -2.317352294921875, -2.220947265625, -2.124542236328125, -2.02813720703125, -1.931732177734375, -1.8353271484375, -1.738922119140625, -1.64251708984375, -1.546112060546875, -1.44970703125, -1.353302001953125, -1.25689697265625, -1.160491943359375, -1.0640869140625, -0.967681884765625, -0.87127685546875, -0.774871826171875, -0.678466796875, -0.582061767578125, -0.48565673828125, -0.389251708984375, -0.2928466796875, -0.196441650390625, -0.10003662109375, -0.003631591796875, 0.0927734375, 0.189178466796875, 0.28558349609375, 0.381988525390625, 0.4783935546875, 0.574798583984375, 0.67120361328125, 0.767608642578125, 0.864013671875, 0.960418701171875, 1.05682373046875, 1.153228759765625, 1.2496337890625, 1.346038818359375, 1.44244384765625, 1.538848876953125, 1.63525390625, 1.731658935546875, 1.82806396484375, 1.924468994140625, 2.0208740234375, 2.117279052734375, 2.21368408203125, 2.310089111328125, 2.406494140625, 2.502899169921875, 2.59930419921875, 2.695709228515625, 2.7921142578125, 2.888519287109375, 2.98492431640625, 3.081329345703125, 3.177734375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 20.0, 15.0, 32.0, 51.0, 77.0, 110.0, 172.0, 264.0, 432.0, 717.0, 1122.0, 1861.0, 3096.0, 5204.0, 9042.0, 16512.0, 30901.0, 60401.0, 124593.0, 1428050.0, 222574.0, 91512.0, 45276.0, 23808.0, 13167.0, 7510.0, 4246.0, 2489.0, 1444.0, 900.0, 525.0, 354.0, 219.0, 142.0, 97.0, 67.0, 39.0, 25.0, 12.0, 12.0, 13.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.245025634765625, -1.20587158203125, -1.166717529296875, -1.1275634765625, -1.088409423828125, -1.04925537109375, -1.010101318359375, -0.970947265625, -0.931793212890625, -0.89263916015625, -0.853485107421875, -0.8143310546875, -0.775177001953125, -0.73602294921875, -0.696868896484375, -0.65771484375, -0.618560791015625, -0.57940673828125, -0.540252685546875, -0.5010986328125, -0.461944580078125, -0.42279052734375, -0.383636474609375, -0.344482421875, -0.305328369140625, -0.26617431640625, -0.227020263671875, -0.1878662109375, -0.148712158203125, -0.10955810546875, -0.070404052734375, -0.03125, 0.007904052734375, 0.04705810546875, 0.086212158203125, 0.1253662109375, 0.164520263671875, 0.20367431640625, 0.242828369140625, 0.281982421875, 0.321136474609375, 0.36029052734375, 0.399444580078125, 0.4385986328125, 0.477752685546875, 0.51690673828125, 0.556060791015625, 0.59521484375, 0.634368896484375, 0.67352294921875, 0.712677001953125, 0.7518310546875, 0.790985107421875, 0.83013916015625, 0.869293212890625, 0.908447265625, 0.947601318359375, 0.98675537109375, 1.025909423828125, 1.0650634765625, 1.104217529296875, 1.14337158203125, 1.182525634765625, 1.2216796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 10.0, 9.0, 11.0, 21.0, 22.0, 35.0, 33.0, 54.0, 49.0, 76.0, 129.0, 112.0, 113.0, 60.0, 50.0, 44.0, 21.0, 31.0, 19.0, 27.0, 15.0, 10.0, 11.0, 12.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00054168701171875, -0.0005183443427085876, -0.0004950016736984253, -0.00047165900468826294, -0.0004483163356781006, -0.00042497366666793823, -0.0004016309976577759, -0.0003782883286476135, -0.00035494565963745117, -0.0003316029906272888, -0.00030826032161712646, -0.0002849176526069641, -0.00026157498359680176, -0.0002382323145866394, -0.00021488964557647705, -0.0001915469765663147, -0.00016820430755615234, -0.00014486163854599, -0.00012151896953582764, -9.817630052566528e-05, -7.483363151550293e-05, -5.1490962505340576e-05, -2.8148293495178223e-05, -4.805624485015869e-06, 1.8537044525146484e-05, 4.187971353530884e-05, 6.522238254547119e-05, 8.856505155563354e-05, 0.0001119077205657959, 0.00013525038957595825, 0.0001585930585861206, 0.00018193572759628296, 0.0002052783966064453, 0.00022862106561660767, 0.00025196373462677, 0.0002753064036369324, 0.0002986490726470947, 0.0003219917416572571, 0.00034533441066741943, 0.0003686770796775818, 0.00039201974868774414, 0.0004153624176979065, 0.00043870508670806885, 0.0004620477557182312, 0.00048539042472839355, 0.0005087330937385559, 0.0005320757627487183, 0.0005554184317588806, 0.000578761100769043, 0.0006021037697792053, 0.0006254464387893677, 0.00064878910779953, 0.0006721317768096924, 0.0006954744458198547, 0.0007188171148300171, 0.0007421597838401794, 0.0007655024528503418, 0.0007888451218605042, 0.0008121877908706665, 0.0008355304598808289, 0.0008588731288909912, 0.0008822157979011536, 0.0009055584669113159, 0.0009289011359214783, 0.0009522438049316406]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 9.0, 9.0, 20.0, 17.0, 32.0, 38.0, 48.0, 48.0, 95.0, 112.0, 208.0, 476.0, 1754.0, 550032.0, 492798.0, 1711.0, 469.0, 222.0, 114.0, 76.0, 57.0, 40.0, 34.0, 24.0, 17.0, 15.0, 16.0, 9.0, 6.0, 5.0, 6.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0165863037109375, -0.016171574592590332, -0.015756845474243164, -0.015342116355895996, -0.014927387237548828, -0.01451265811920166, -0.014097929000854492, -0.013683199882507324, -0.013268470764160156, -0.012853741645812988, -0.01243901252746582, -0.012024283409118652, -0.011609554290771484, -0.011194825172424316, -0.010780096054077148, -0.01036536693572998, -0.009950637817382812, -0.009535908699035645, -0.009121179580688477, -0.008706450462341309, -0.00829172134399414, -0.007876992225646973, -0.007462263107299805, -0.007047533988952637, -0.006632804870605469, -0.006218075752258301, -0.005803346633911133, -0.005388617515563965, -0.004973888397216797, -0.004559159278869629, -0.004144430160522461, -0.003729701042175293, -0.003314971923828125, -0.002900242805480957, -0.002485513687133789, -0.002070784568786621, -0.0016560554504394531, -0.0012413263320922852, -0.0008265972137451172, -0.0004118680953979492, 2.86102294921875e-06, 0.0004175901412963867, 0.0008323192596435547, 0.0012470483779907227, 0.0016617774963378906, 0.0020765066146850586, 0.0024912357330322266, 0.0029059648513793945, 0.0033206939697265625, 0.0037354230880737305, 0.0041501522064208984, 0.004564881324768066, 0.004979610443115234, 0.005394339561462402, 0.00580906867980957, 0.006223797798156738, 0.006638526916503906, 0.007053256034851074, 0.007467985153198242, 0.00788271427154541, 0.008297443389892578, 0.008712172508239746, 0.009126901626586914, 0.009541630744934082, 0.00995635986328125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 61.0, 210.0, 326.0, 288.0, 87.0, 29.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001050880760885775, -0.0010099856881424785, -0.0009690905571915209, -0.0009281954844482243, -0.0008873003534972668, -0.0008464052807539701, -0.0008055102080106735, -0.0007646151352673769, -0.0007237200043164194, -0.0006828249315731227, -0.0006419298006221652, -0.0006010347278788686, -0.000560139655135572, -0.0005192445241846144, -0.0004783494514413178, -0.0004374543495941907, -0.00039655924774706364, -0.00035566414589993656, -0.0003147690440528095, -0.00027387397130951285, -0.00023297886946238577, -0.0001920837676152587, -0.00015118869487196207, -0.00011029359302483499, -6.939849117770791e-05, -2.8503396606538445e-05, 1.2391697964631021e-05, 5.328678525984287e-05, 9.418188710696995e-05, 0.00013507698895409703, 0.00017597206169739366, 0.00021686716354452074, 0.00025776238180696964, 0.0002986574836540967, 0.0003395525855012238, 0.0003804476582445204, 0.0004213427600916475, 0.0004622378619387746, 0.0005031329346820712, 0.0005440280074253678, 0.0005849231383763254, 0.000625818211119622, 0.0006667133420705795, 0.0007076084148138762, 0.0007485034875571728, 0.0007893986185081303, 0.0008302936912514269, 0.0008711888222023845, 0.0009120838949456811, 0.0009529789676889777, 0.0009938740404322743, 0.0010347692295908928, 0.0010756643023341894, 0.001116559375077486, 0.0011574544478207827, 0.0011983495205640793, 0.001239244593307376, 0.0012801396660506725, 0.0013210347387939692, 0.0013619298115372658, 0.0014028250006958842, 0.0014437200734391809, 0.0014846151461824775, 0.001525510218925774, 0.0015664054080843925]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 3.0, 7.0, 10.0, 3.0, 17.0, 31.0, 13.0, 24.0, 25.0, 21.0, 33.0, 30.0, 37.0, 44.0, 36.0, 53.0, 52.0, 34.0, 32.0, 40.0, 32.0, 33.0, 46.0, 32.0, 51.0, 33.0, 34.0, 26.0, 28.0, 17.0, 16.0, 13.0, 21.0, 15.0, 11.0, 12.0, 7.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0002950429916381836, -0.00028582941740751266, -0.00027661584317684174, -0.0002674022689461708, -0.0002581886947154999, -0.00024897512048482895, -0.00023976154625415802, -0.0002305479720234871, -0.00022133439779281616, -0.00021212082356214523, -0.0002029072493314743, -0.00019369367510080338, -0.00018448010087013245, -0.00017526652663946152, -0.0001660529524087906, -0.00015683937817811966, -0.00014762580394744873, -0.0001384122297167778, -0.00012919865548610687, -0.00011998508125543594, -0.00011077150702476501, -0.00010155793279409409, -9.234435856342316e-05, -8.313078433275223e-05, -7.39172101020813e-05, -6.470363587141037e-05, -5.549006164073944e-05, -4.627648741006851e-05, -3.706291317939758e-05, -2.7849338948726654e-05, -1.8635764718055725e-05, -9.422190487384796e-06, -2.086162567138672e-07, 9.004957973957062e-06, 1.821853220462799e-05, 2.743210643529892e-05, 3.664568066596985e-05, 4.585925489664078e-05, 5.5072829127311707e-05, 6.428640335798264e-05, 7.349997758865356e-05, 8.27135518193245e-05, 9.192712604999542e-05, 0.00010114070028066635, 0.00011035427451133728, 0.00011956784874200821, 0.00012878142297267914, 0.00013799499720335007, 0.000147208571434021, 0.00015642214566469193, 0.00016563571989536285, 0.00017484929412603378, 0.0001840628683567047, 0.00019327644258737564, 0.00020249001681804657, 0.0002117035910487175, 0.00022091716527938843, 0.00023013073951005936, 0.00023934431374073029, 0.0002485578879714012, 0.00025777146220207214, 0.00026698503643274307, 0.000276198610663414, 0.00028541218489408493, 0.00029462575912475586]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 7.0, 10.0, 10.0, 9.0, 9.0, 8.0, 19.0, 23.0, 18.0, 20.0, 18.0, 17.0, 31.0, 24.0, 29.0, 42.0, 32.0, 38.0, 38.0, 36.0, 48.0, 51.0, 56.0, 49.0, 38.0, 32.0, 32.0, 25.0, 31.0, 29.0, 20.0, 33.0, 20.0, 13.0, 22.0, 15.0, 13.0, 11.0, 4.0, 6.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.76068115234375, -3.6307373046875, -3.50079345703125, -3.370849609375, -3.24090576171875, -3.1109619140625, -2.98101806640625, -2.85107421875, -2.72113037109375, -2.5911865234375, -2.46124267578125, -2.331298828125, -2.20135498046875, -2.0714111328125, -1.94146728515625, -1.8115234375, -1.68157958984375, -1.5516357421875, -1.42169189453125, -1.291748046875, -1.16180419921875, -1.0318603515625, -0.90191650390625, -0.77197265625, -0.64202880859375, -0.5120849609375, -0.38214111328125, -0.252197265625, -0.12225341796875, 0.0076904296875, 0.13763427734375, 0.267578125, 0.39752197265625, 0.5274658203125, 0.65740966796875, 0.787353515625, 0.91729736328125, 1.0472412109375, 1.17718505859375, 1.30712890625, 1.43707275390625, 1.5670166015625, 1.69696044921875, 1.826904296875, 1.95684814453125, 2.0867919921875, 2.21673583984375, 2.3466796875, 2.47662353515625, 2.6065673828125, 2.73651123046875, 2.866455078125, 2.99639892578125, 3.1263427734375, 3.25628662109375, 3.38623046875, 3.51617431640625, 3.6461181640625, 3.77606201171875, 3.906005859375, 4.03594970703125, 4.1658935546875, 4.29583740234375, 4.42578125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 5.0, 22.0, 26.0, 19.0, 33.0, 38.0, 70.0, 89.0, 132.0, 183.0, 289.0, 479.0, 834.0, 1440.0, 2923.0, 6245.0, 13893.0, 32270.0, 78282.0, 192074.0, 375377.0, 199909.0, 82389.0, 33916.0, 14408.0, 6311.0, 3031.0, 1553.0, 844.0, 503.0, 287.0, 195.0, 136.0, 96.0, 74.0, 54.0, 31.0, 24.0, 12.0, 14.0, 15.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.861328125, -3.734832763671875, -3.60833740234375, -3.481842041015625, -3.3553466796875, -3.228851318359375, -3.10235595703125, -2.975860595703125, -2.849365234375, -2.722869873046875, -2.59637451171875, -2.469879150390625, -2.3433837890625, -2.216888427734375, -2.09039306640625, -1.963897705078125, -1.83740234375, -1.710906982421875, -1.58441162109375, -1.457916259765625, -1.3314208984375, -1.204925537109375, -1.07843017578125, -0.951934814453125, -0.825439453125, -0.698944091796875, -0.57244873046875, -0.445953369140625, -0.3194580078125, -0.192962646484375, -0.06646728515625, 0.060028076171875, 0.1865234375, 0.313018798828125, 0.43951416015625, 0.566009521484375, 0.6925048828125, 0.819000244140625, 0.94549560546875, 1.071990966796875, 1.198486328125, 1.324981689453125, 1.45147705078125, 1.577972412109375, 1.7044677734375, 1.830963134765625, 1.95745849609375, 2.083953857421875, 2.21044921875, 2.336944580078125, 2.46343994140625, 2.589935302734375, 2.7164306640625, 2.842926025390625, 2.96942138671875, 3.095916748046875, 3.222412109375, 3.348907470703125, 3.47540283203125, 3.601898193359375, 3.7283935546875, 3.854888916015625, 3.98138427734375, 4.107879638671875, 4.234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 3.0, 6.0, 15.0, 10.0, 10.0, 13.0, 18.0, 24.0, 38.0, 31.0, 34.0, 46.0, 48.0, 61.0, 82.0, 150.0, 353.0, 1427.0, 172.0, 89.0, 61.0, 42.0, 58.0, 51.0, 34.0, 38.0, 26.0, 26.0, 9.0, 19.0, 12.0, 11.0, 5.0, 4.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.1527099609375, -16.649169921875, -16.1456298828125, -15.64208984375, -15.1385498046875, -14.635009765625, -14.1314697265625, -13.6279296875, -13.1243896484375, -12.620849609375, -12.1173095703125, -11.61376953125, -11.1102294921875, -10.606689453125, -10.1031494140625, -9.599609375, -9.0960693359375, -8.592529296875, -8.0889892578125, -7.58544921875, -7.0819091796875, -6.578369140625, -6.0748291015625, -5.5712890625, -5.0677490234375, -4.564208984375, -4.0606689453125, -3.55712890625, -3.0535888671875, -2.550048828125, -2.0465087890625, -1.54296875, -1.0394287109375, -0.535888671875, -0.0323486328125, 0.47119140625, 0.9747314453125, 1.478271484375, 1.9818115234375, 2.4853515625, 2.9888916015625, 3.492431640625, 3.9959716796875, 4.49951171875, 5.0030517578125, 5.506591796875, 6.0101318359375, 6.513671875, 7.0172119140625, 7.520751953125, 8.0242919921875, 8.52783203125, 9.0313720703125, 9.534912109375, 10.0384521484375, 10.5419921875, 11.0455322265625, 11.549072265625, 12.0526123046875, 12.55615234375, 13.0596923828125, 13.563232421875, 14.0667724609375, 14.5703125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 6.0, 6.0, 9.0, 13.0, 16.0, 17.0, 25.0, 35.0, 63.0, 94.0, 146.0, 254.0, 467.0, 1335.0, 512714.0, 2627833.0, 1453.0, 467.0, 273.0, 151.0, 96.0, 63.0, 42.0, 27.0, 19.0, 11.0, 12.0, 9.0, 9.0, 10.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-87.0625, -84.7744140625, -82.486328125, -80.1982421875, -77.91015625, -75.6220703125, -73.333984375, -71.0458984375, -68.7578125, -66.4697265625, -64.181640625, -61.8935546875, -59.60546875, -57.3173828125, -55.029296875, -52.7412109375, -50.453125, -48.1650390625, -45.876953125, -43.5888671875, -41.30078125, -39.0126953125, -36.724609375, -34.4365234375, -32.1484375, -29.8603515625, -27.572265625, -25.2841796875, -22.99609375, -20.7080078125, -18.419921875, -16.1318359375, -13.84375, -11.5556640625, -9.267578125, -6.9794921875, -4.69140625, -2.4033203125, -0.115234375, 2.1728515625, 4.4609375, 6.7490234375, 9.037109375, 11.3251953125, 13.61328125, 15.9013671875, 18.189453125, 20.4775390625, 22.765625, 25.0537109375, 27.341796875, 29.6298828125, 31.91796875, 34.2060546875, 36.494140625, 38.7822265625, 41.0703125, 43.3583984375, 45.646484375, 47.9345703125, 50.22265625, 52.5107421875, 54.798828125, 57.0869140625, 59.375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.0, 962.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-452.3536376953125, -444.18548583984375, -436.0173034667969, -427.84912109375, -419.68096923828125, -411.5128173828125, -403.3446350097656, -395.17645263671875, -387.00830078125, -378.84014892578125, -370.6719665527344, -362.5037841796875, -354.33563232421875, -346.16748046875, -337.9992980957031, -329.83111572265625, -321.6629638671875, -313.49481201171875, -305.3266296386719, -297.158447265625, -288.99029541015625, -280.8221435546875, -272.6539611816406, -264.48577880859375, -256.317626953125, -248.1494598388672, -239.98129272460938, -231.81312561035156, -223.64495849609375, -215.47679138183594, -207.30862426757812, -199.1404571533203, -190.9722900390625, -182.8041229248047, -174.63595581054688, -166.46778869628906, -158.29962158203125, -150.13145446777344, -141.96328735351562, -133.7951202392578, -125.626953125, -117.45878601074219, -109.29061889648438, -101.12245178222656, -92.95428466796875, -84.78611755371094, -76.61795043945312, -68.44978332519531, -60.2816162109375, -52.11344909667969, -43.945281982421875, -35.77711486816406, -27.60894775390625, -19.440780639648438, -11.272613525390625, -3.1044464111328125, 5.063720703125, 13.231887817382812, 21.400054931640625, 29.568222045898438, 37.73638916015625, 45.90455627441406, 54.072723388671875, 62.24089050292969, 70.4090576171875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 5.0, 6.0, 10.0, 13.0, 20.0, 21.0, 20.0, 18.0, 22.0, 22.0, 24.0, 30.0, 20.0, 27.0, 41.0, 47.0, 25.0, 36.0, 38.0, 48.0, 32.0, 36.0, 49.0, 37.0, 35.0, 38.0, 34.0, 34.0, 32.0, 28.0, 15.0, 21.0, 13.0, 11.0, 17.0, 11.0, 9.0, 7.0, 10.0, 5.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0], "bins": [-37.644283294677734, -36.58751678466797, -35.5307502746582, -34.47398376464844, -33.41721725463867, -32.360450744628906, -31.30368423461914, -30.246917724609375, -29.19015121459961, -28.133384704589844, -27.076618194580078, -26.019851684570312, -24.963085174560547, -23.90631866455078, -22.849552154541016, -21.79278564453125, -20.736019134521484, -19.67925262451172, -18.622486114501953, -17.565719604492188, -16.508953094482422, -15.452186584472656, -14.39542007446289, -13.338653564453125, -12.28188705444336, -11.225120544433594, -10.168354034423828, -9.111587524414062, -8.054821014404297, -6.998054504394531, -5.941287994384766, -4.884521484375, -3.8277549743652344, -2.7709884643554688, -1.7142219543457031, -0.6574554443359375, 0.3993110656738281, 1.4560775756835938, 2.5128440856933594, 3.569610595703125, 4.626377105712891, 5.683143615722656, 6.739910125732422, 7.7966766357421875, 8.853443145751953, 9.910209655761719, 10.966976165771484, 12.02374267578125, 13.080509185791016, 14.137275695800781, 15.194042205810547, 16.250808715820312, 17.307575225830078, 18.364341735839844, 19.42110824584961, 20.477874755859375, 21.53464126586914, 22.591407775878906, 23.648174285888672, 24.704940795898438, 25.761707305908203, 26.81847381591797, 27.875240325927734, 28.9320068359375, 29.988773345947266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 9.0, 4.0, 7.0, 10.0, 10.0, 18.0, 9.0, 15.0, 17.0, 26.0, 16.0, 21.0, 23.0, 21.0, 35.0, 29.0, 41.0, 31.0, 44.0, 51.0, 38.0, 41.0, 54.0, 50.0, 46.0, 42.0, 33.0, 38.0, 25.0, 22.0, 26.0, 27.0, 20.0, 12.0, 18.0, 17.0, 9.0, 12.0, 9.0, 5.0, 4.0, 8.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.3214111328125, -4.174072265625, -4.0267333984375, -3.87939453125, -3.7320556640625, -3.584716796875, -3.4373779296875, -3.2900390625, -3.1427001953125, -2.995361328125, -2.8480224609375, -2.70068359375, -2.5533447265625, -2.406005859375, -2.2586669921875, -2.111328125, -1.9639892578125, -1.816650390625, -1.6693115234375, -1.52197265625, -1.3746337890625, -1.227294921875, -1.0799560546875, -0.9326171875, -0.7852783203125, -0.637939453125, -0.4906005859375, -0.34326171875, -0.1959228515625, -0.048583984375, 0.0987548828125, 0.24609375, 0.3934326171875, 0.540771484375, 0.6881103515625, 0.83544921875, 0.9827880859375, 1.130126953125, 1.2774658203125, 1.4248046875, 1.5721435546875, 1.719482421875, 1.8668212890625, 2.01416015625, 2.1614990234375, 2.308837890625, 2.4561767578125, 2.603515625, 2.7508544921875, 2.898193359375, 3.0455322265625, 3.19287109375, 3.3402099609375, 3.487548828125, 3.6348876953125, 3.7822265625, 3.9295654296875, 4.076904296875, 4.2242431640625, 4.37158203125, 4.5189208984375, 4.666259765625, 4.8135986328125, 4.9609375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 2.0, 6.0, 3.0, 12.0, 9.0, 13.0, 19.0, 16.0, 19.0, 20.0, 32.0, 20.0, 63.0, 77.0, 108.0, 224.0, 370.0, 977.0, 5220.0, 98294.0, 1869728.0, 2086873.0, 124052.0, 6013.0, 1037.0, 431.0, 198.0, 115.0, 68.0, 62.0, 42.0, 20.0, 34.0, 16.0, 18.0, 19.0, 9.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.8671875, -12.4776611328125, -12.088134765625, -11.6986083984375, -11.30908203125, -10.9195556640625, -10.530029296875, -10.1405029296875, -9.7509765625, -9.3614501953125, -8.971923828125, -8.5823974609375, -8.19287109375, -7.8033447265625, -7.413818359375, -7.0242919921875, -6.634765625, -6.2452392578125, -5.855712890625, -5.4661865234375, -5.07666015625, -4.6871337890625, -4.297607421875, -3.9080810546875, -3.5185546875, -3.1290283203125, -2.739501953125, -2.3499755859375, -1.96044921875, -1.5709228515625, -1.181396484375, -0.7918701171875, -0.40234375, -0.0128173828125, 0.376708984375, 0.7662353515625, 1.15576171875, 1.5452880859375, 1.934814453125, 2.3243408203125, 2.7138671875, 3.1033935546875, 3.492919921875, 3.8824462890625, 4.27197265625, 4.6614990234375, 5.051025390625, 5.4405517578125, 5.830078125, 6.2196044921875, 6.609130859375, 6.9986572265625, 7.38818359375, 7.7777099609375, 8.167236328125, 8.5567626953125, 8.9462890625, 9.3358154296875, 9.725341796875, 10.1148681640625, 10.50439453125, 10.8939208984375, 11.283447265625, 11.6729736328125, 12.0625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 3.0, 9.0, 7.0, 15.0, 16.0, 19.0, 24.0, 42.0, 39.0, 48.0, 91.0, 101.0, 123.0, 180.0, 221.0, 279.0, 344.0, 444.0, 390.0, 389.0, 320.0, 256.0, 173.0, 140.0, 101.0, 71.0, 61.0, 50.0, 31.0, 26.0, 12.0, 14.0, 8.0, 8.0, 7.0, 5.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.523193359375, -8.25732421875, -7.991455078125, -7.7255859375, -7.459716796875, -7.19384765625, -6.927978515625, -6.662109375, -6.396240234375, -6.13037109375, -5.864501953125, -5.5986328125, -5.332763671875, -5.06689453125, -4.801025390625, -4.53515625, -4.269287109375, -4.00341796875, -3.737548828125, -3.4716796875, -3.205810546875, -2.93994140625, -2.674072265625, -2.408203125, -2.142333984375, -1.87646484375, -1.610595703125, -1.3447265625, -1.078857421875, -0.81298828125, -0.547119140625, -0.28125, -0.015380859375, 0.25048828125, 0.516357421875, 0.7822265625, 1.048095703125, 1.31396484375, 1.579833984375, 1.845703125, 2.111572265625, 2.37744140625, 2.643310546875, 2.9091796875, 3.175048828125, 3.44091796875, 3.706787109375, 3.97265625, 4.238525390625, 4.50439453125, 4.770263671875, 5.0361328125, 5.302001953125, 5.56787109375, 5.833740234375, 6.099609375, 6.365478515625, 6.63134765625, 6.897216796875, 7.1630859375, 7.428955078125, 7.69482421875, 7.960693359375, 8.2265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 8.0, 11.0, 14.0, 21.0, 29.0, 33.0, 47.0, 60.0, 95.0, 101.0, 134.0, 202.0, 258.0, 363.0, 680.0, 5480.0, 1759094.0, 2418456.0, 7071.0, 669.0, 376.0, 255.0, 194.0, 160.0, 106.0, 93.0, 70.0, 49.0, 38.0, 35.0, 14.0, 19.0, 15.0, 4.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.315185546875, -29.27099609375, -28.226806640625, -27.1826171875, -26.138427734375, -25.09423828125, -24.050048828125, -23.005859375, -21.961669921875, -20.91748046875, -19.873291015625, -18.8291015625, -17.784912109375, -16.74072265625, -15.696533203125, -14.65234375, -13.608154296875, -12.56396484375, -11.519775390625, -10.4755859375, -9.431396484375, -8.38720703125, -7.343017578125, -6.298828125, -5.254638671875, -4.21044921875, -3.166259765625, -2.1220703125, -1.077880859375, -0.03369140625, 1.010498046875, 2.0546875, 3.098876953125, 4.14306640625, 5.187255859375, 6.2314453125, 7.275634765625, 8.31982421875, 9.364013671875, 10.408203125, 11.452392578125, 12.49658203125, 13.540771484375, 14.5849609375, 15.629150390625, 16.67333984375, 17.717529296875, 18.76171875, 19.805908203125, 20.85009765625, 21.894287109375, 22.9384765625, 23.982666015625, 25.02685546875, 26.071044921875, 27.115234375, 28.159423828125, 29.20361328125, 30.247802734375, 31.2919921875, 32.336181640625, 33.38037109375, 34.424560546875, 35.46875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 14.0, 31.0, 64.0, 121.0, 179.0, 178.0, 188.0, 114.0, 65.0, 34.0, 13.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.81599044799805, -40.04401397705078, -38.27203369140625, -36.50005340576172, -34.72807693481445, -32.95610046386719, -31.184120178222656, -29.412141799926758, -27.64016342163086, -25.86818504333496, -24.096206665039062, -22.324228286743164, -20.552249908447266, -18.780271530151367, -17.00829315185547, -15.23631477355957, -13.464336395263672, -11.692358016967773, -9.920379638671875, -8.148401260375977, -6.376422882080078, -4.60444450378418, -2.8324661254882812, -1.0604877471923828, 0.7114906311035156, 2.483469009399414, 4.2554473876953125, 6.027425765991211, 7.799404144287109, 9.571382522583008, 11.343360900878906, 13.115339279174805, 14.887313842773438, 16.659292221069336, 18.431270599365234, 20.203248977661133, 21.97522735595703, 23.74720573425293, 25.519184112548828, 27.291162490844727, 29.063140869140625, 30.835119247436523, 32.60709762573242, 34.37907409667969, 36.15105438232422, 37.92303466796875, 39.695011138916016, 41.46698760986328, 43.23896789550781, 45.010948181152344, 46.78292465209961, 48.554901123046875, 50.326881408691406, 52.09886169433594, 53.8708381652832, 55.64281463623047, 57.414794921875, 59.18677520751953, 60.9587516784668, 62.73072814941406, 64.5027084350586, 66.27468872070312, 68.04666137695312, 69.81864166259766, 71.59062194824219]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 5.0, 11.0, 8.0, 12.0, 15.0, 24.0, 27.0, 21.0, 29.0, 33.0, 32.0, 30.0, 24.0, 41.0, 46.0, 39.0, 36.0, 43.0, 37.0, 32.0, 47.0, 38.0, 36.0, 37.0, 37.0, 28.0, 38.0, 34.0, 20.0, 20.0, 15.0, 20.0, 22.0, 10.0, 5.0, 18.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.399795532226562, -28.469858169555664, -27.539920806884766, -26.6099853515625, -25.6800479888916, -24.750110626220703, -23.820175170898438, -22.89023780822754, -21.96030044555664, -21.030363082885742, -20.100425720214844, -19.170490264892578, -18.24055290222168, -17.31061553955078, -16.380680084228516, -15.450742721557617, -14.520805358886719, -13.59086799621582, -12.660931587219238, -11.730995178222656, -10.801057815551758, -9.87112045288086, -8.941184043884277, -8.011247634887695, -7.081310272216797, -6.151373386383057, -5.221436500549316, -4.291499614715576, -3.361562728881836, -2.4316258430480957, -1.5016889572143555, -0.5717520713806152, 0.358184814453125, 1.2881217002868652, 2.2180585861206055, 3.1479954719543457, 4.077932357788086, 5.007869243621826, 5.937806129455566, 6.867743015289307, 7.797679901123047, 8.727617263793945, 9.657553672790527, 10.58749008178711, 11.517427444458008, 12.447364807128906, 13.377301216125488, 14.30723762512207, 15.237174987792969, 16.167112350463867, 17.097049713134766, 18.02698516845703, 18.95692253112793, 19.886859893798828, 20.816795349121094, 21.746732711791992, 22.67667007446289, 23.60660743713379, 24.536544799804688, 25.466480255126953, 26.39641761779785, 27.32635498046875, 28.256290435791016, 29.186227798461914, 30.116165161132812]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 9.0, 5.0, 5.0, 9.0, 10.0, 4.0, 12.0, 11.0, 14.0, 11.0, 8.0, 17.0, 39.0, 41.0, 26.0, 22.0, 29.0, 25.0, 41.0, 34.0, 34.0, 47.0, 35.0, 36.0, 43.0, 46.0, 44.0, 35.0, 34.0, 30.0, 40.0, 24.0, 38.0, 18.0, 18.0, 13.0, 17.0, 9.0, 12.0, 11.0, 8.0, 11.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.728546142578125, -3.59576416015625, -3.462982177734375, -3.3302001953125, -3.197418212890625, -3.06463623046875, -2.931854248046875, -2.799072265625, -2.666290283203125, -2.53350830078125, -2.400726318359375, -2.2679443359375, -2.135162353515625, -2.00238037109375, -1.869598388671875, -1.73681640625, -1.604034423828125, -1.47125244140625, -1.338470458984375, -1.2056884765625, -1.072906494140625, -0.94012451171875, -0.807342529296875, -0.674560546875, -0.541778564453125, -0.40899658203125, -0.276214599609375, -0.1434326171875, -0.010650634765625, 0.12213134765625, 0.254913330078125, 0.3876953125, 0.520477294921875, 0.65325927734375, 0.786041259765625, 0.9188232421875, 1.051605224609375, 1.18438720703125, 1.317169189453125, 1.449951171875, 1.582733154296875, 1.71551513671875, 1.848297119140625, 1.9810791015625, 2.113861083984375, 2.24664306640625, 2.379425048828125, 2.51220703125, 2.644989013671875, 2.77777099609375, 2.910552978515625, 3.0433349609375, 3.176116943359375, 3.30889892578125, 3.441680908203125, 3.574462890625, 3.707244873046875, 3.84002685546875, 3.972808837890625, 4.1055908203125, 4.238372802734375, 4.37115478515625, 4.503936767578125, 4.63671875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 13.0, 25.0, 39.0, 59.0, 83.0, 111.0, 155.0, 250.0, 350.0, 467.0, 703.0, 1000.0, 1347.0, 2019.0, 2722.0, 3922.0, 5713.0, 8270.0, 12410.0, 19051.0, 28639.0, 44799.0, 73694.0, 137419.0, 310961.0, 165824.0, 83009.0, 50037.0, 31513.0, 20614.0, 13564.0, 9198.0, 6257.0, 4246.0, 2952.0, 2065.0, 1465.0, 1015.0, 786.0, 547.0, 379.0, 263.0, 202.0, 129.0, 100.0, 60.0, 32.0, 24.0, 15.0, 11.0, 12.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.87744140625, -0.8487777709960938, -0.8201141357421875, -0.7914505004882812, -0.762786865234375, -0.7341232299804688, -0.7054595947265625, -0.6767959594726562, -0.64813232421875, -0.6194686889648438, -0.5908050537109375, -0.5621414184570312, -0.533477783203125, -0.5048141479492188, -0.4761505126953125, -0.44748687744140625, -0.4188232421875, -0.39015960693359375, -0.3614959716796875, -0.33283233642578125, -0.304168701171875, -0.27550506591796875, -0.2468414306640625, -0.21817779541015625, -0.18951416015625, -0.16085052490234375, -0.1321868896484375, -0.10352325439453125, -0.074859619140625, -0.04619598388671875, -0.0175323486328125, 0.01113128662109375, 0.039794921875, 0.06845855712890625, 0.0971221923828125, 0.12578582763671875, 0.154449462890625, 0.18311309814453125, 0.2117767333984375, 0.24044036865234375, 0.26910400390625, 0.29776763916015625, 0.3264312744140625, 0.35509490966796875, 0.383758544921875, 0.41242218017578125, 0.4410858154296875, 0.46974945068359375, 0.4984130859375, 0.5270767211914062, 0.5557403564453125, 0.5844039916992188, 0.613067626953125, 0.6417312622070312, 0.6703948974609375, 0.6990585327148438, 0.72772216796875, 0.7563858032226562, 0.7850494384765625, 0.8137130737304688, 0.842376708984375, 0.8710403442382812, 0.8997039794921875, 0.9283676147460938, 0.95703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 3.0, 8.0, 10.0, 7.0, 9.0, 24.0, 17.0, 22.0, 26.0, 31.0, 28.0, 34.0, 30.0, 34.0, 40.0, 36.0, 39.0, 47.0, 1057.0, 42.0, 32.0, 34.0, 41.0, 44.0, 34.0, 32.0, 34.0, 27.0, 34.0, 19.0, 17.0, 17.0, 18.0, 12.0, 12.0, 22.0, 12.0, 9.0, 3.0, 1.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.998046875, -2.909332275390625, -2.82061767578125, -2.731903076171875, -2.6431884765625, -2.554473876953125, -2.46575927734375, -2.377044677734375, -2.288330078125, -2.199615478515625, -2.11090087890625, -2.022186279296875, -1.9334716796875, -1.844757080078125, -1.75604248046875, -1.667327880859375, -1.57861328125, -1.489898681640625, -1.40118408203125, -1.312469482421875, -1.2237548828125, -1.135040283203125, -1.04632568359375, -0.957611083984375, -0.868896484375, -0.780181884765625, -0.69146728515625, -0.602752685546875, -0.5140380859375, -0.425323486328125, -0.33660888671875, -0.247894287109375, -0.1591796875, -0.070465087890625, 0.01824951171875, 0.106964111328125, 0.1956787109375, 0.284393310546875, 0.37310791015625, 0.461822509765625, 0.550537109375, 0.639251708984375, 0.72796630859375, 0.816680908203125, 0.9053955078125, 0.994110107421875, 1.08282470703125, 1.171539306640625, 1.26025390625, 1.348968505859375, 1.43768310546875, 1.526397705078125, 1.6151123046875, 1.703826904296875, 1.79254150390625, 1.881256103515625, 1.969970703125, 2.058685302734375, 2.14739990234375, 2.236114501953125, 2.3248291015625, 2.413543701171875, 2.50225830078125, 2.590972900390625, 2.6796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 11.0, 5.0, 22.0, 17.0, 31.0, 51.0, 87.0, 100.0, 159.0, 243.0, 327.0, 578.0, 816.0, 1274.0, 1870.0, 2927.0, 4654.0, 7543.0, 12751.0, 21658.0, 37212.0, 66674.0, 126885.0, 1393476.0, 201651.0, 93263.0, 50274.0, 28609.0, 16714.0, 10304.0, 6235.0, 3988.0, 2446.0, 1475.0, 981.0, 581.0, 408.0, 290.0, 172.0, 109.0, 89.0, 44.0, 36.0, 28.0, 22.0, 12.0, 15.0, 5.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0693359375, -1.033416748046875, -0.99749755859375, -0.961578369140625, -0.9256591796875, -0.889739990234375, -0.85382080078125, -0.817901611328125, -0.781982421875, -0.746063232421875, -0.71014404296875, -0.674224853515625, -0.6383056640625, -0.602386474609375, -0.56646728515625, -0.530548095703125, -0.49462890625, -0.458709716796875, -0.42279052734375, -0.386871337890625, -0.3509521484375, -0.315032958984375, -0.27911376953125, -0.243194580078125, -0.207275390625, -0.171356201171875, -0.13543701171875, -0.099517822265625, -0.0635986328125, -0.027679443359375, 0.00823974609375, 0.044158935546875, 0.080078125, 0.115997314453125, 0.15191650390625, 0.187835693359375, 0.2237548828125, 0.259674072265625, 0.29559326171875, 0.331512451171875, 0.367431640625, 0.403350830078125, 0.43927001953125, 0.475189208984375, 0.5111083984375, 0.547027587890625, 0.58294677734375, 0.618865966796875, 0.65478515625, 0.690704345703125, 0.72662353515625, 0.762542724609375, 0.7984619140625, 0.834381103515625, 0.87030029296875, 0.906219482421875, 0.942138671875, 0.978057861328125, 1.01397705078125, 1.049896240234375, 1.0858154296875, 1.121734619140625, 1.15765380859375, 1.193572998046875, 1.2294921875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 10.0, 17.0, 16.0, 19.0, 19.0, 28.0, 31.0, 45.0, 58.0, 71.0, 62.0, 65.0, 69.0, 79.0, 63.0, 55.0, 36.0, 40.0, 28.0, 23.0, 21.0, 12.0, 19.0, 13.0, 18.0, 8.0, 7.0, 6.0, 1.0, 4.0, 5.0, 4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.0004944801330566406, -0.00047635287046432495, -0.0004582256078720093, -0.0004400983452796936, -0.00042197108268737793, -0.00040384382009506226, -0.0003857165575027466, -0.0003675892949104309, -0.00034946203231811523, -0.00033133476972579956, -0.0003132075071334839, -0.0002950802445411682, -0.00027695298194885254, -0.00025882571935653687, -0.0002406984567642212, -0.00022257119417190552, -0.00020444393157958984, -0.00018631666898727417, -0.0001681894063949585, -0.00015006214380264282, -0.00013193488121032715, -0.00011380761861801147, -9.56803560256958e-05, -7.755309343338013e-05, -5.942583084106445e-05, -4.129856824874878e-05, -2.3171305656433105e-05, -5.044043064117432e-06, 1.3083219528198242e-05, 3.1210482120513916e-05, 4.933774471282959e-05, 6.746500730514526e-05, 8.559226989746094e-05, 0.00010371953248977661, 0.00012184679508209229, 0.00013997405767440796, 0.00015810132026672363, 0.0001762285828590393, 0.00019435584545135498, 0.00021248310804367065, 0.00023061037063598633, 0.000248737633228302, 0.0002668648958206177, 0.00028499215841293335, 0.000303119421005249, 0.0003212466835975647, 0.00033937394618988037, 0.00035750120878219604, 0.0003756284713745117, 0.0003937557339668274, 0.00041188299655914307, 0.00043001025915145874, 0.0004481375217437744, 0.0004662647843360901, 0.00048439204692840576, 0.0005025193095207214, 0.0005206465721130371, 0.0005387738347053528, 0.0005569010972976685, 0.0005750283598899841, 0.0005931556224822998, 0.0006112828850746155, 0.0006294101476669312, 0.0006475374102592468, 0.0006656646728515625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 4.0, 9.0, 12.0, 17.0, 17.0, 23.0, 26.0, 36.0, 63.0, 78.0, 119.0, 221.0, 604.0, 6864.0, 1019553.0, 19406.0, 743.0, 287.0, 129.0, 88.0, 53.0, 54.0, 29.0, 28.0, 14.0, 12.0, 9.0, 7.0, 6.0, 5.0, 1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.01690673828125, -0.016456961631774902, -0.016007184982299805, -0.015557408332824707, -0.01510763168334961, -0.014657855033874512, -0.014208078384399414, -0.013758301734924316, -0.013308525085449219, -0.012858748435974121, -0.012408971786499023, -0.011959195137023926, -0.011509418487548828, -0.01105964183807373, -0.010609865188598633, -0.010160088539123535, -0.009710311889648438, -0.00926053524017334, -0.008810758590698242, -0.008360981941223145, -0.007911205291748047, -0.007461428642272949, -0.0070116519927978516, -0.006561875343322754, -0.006112098693847656, -0.005662322044372559, -0.005212545394897461, -0.004762768745422363, -0.004312992095947266, -0.003863215446472168, -0.0034134387969970703, -0.0029636621475219727, -0.002513885498046875, -0.0020641088485717773, -0.0016143321990966797, -0.001164555549621582, -0.0007147789001464844, -0.0002650022506713867, 0.00018477439880371094, 0.0006345510482788086, 0.0010843276977539062, 0.001534104347229004, 0.0019838809967041016, 0.0024336576461791992, 0.002883434295654297, 0.0033332109451293945, 0.003782987594604492, 0.00423276424407959, 0.0046825408935546875, 0.005132317543029785, 0.005582094192504883, 0.0060318708419799805, 0.006481647491455078, 0.006931424140930176, 0.0073812007904052734, 0.007830977439880371, 0.008280754089355469, 0.008730530738830566, 0.009180307388305664, 0.009630084037780762, 0.01007986068725586, 0.010529637336730957, 0.010979413986206055, 0.011429190635681152, 0.01187896728515625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 11.0, 55.0, 130.0, 179.0, 256.0, 196.0, 113.0, 48.0, 14.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020932972256559879, -0.0001813946000766009, -0.00015345949213951826, -0.0001255243842024356, -9.758926171343774e-05, -6.965415377635509e-05, -4.171903128735721e-05, -1.3783908798359334e-05, 1.4151199138723314e-05, 4.2086314351763576e-05, 7.002142956480384e-05, 9.79565447778441e-05, 0.00012589165999088436, 0.000153826767927967, 0.0001817618904169649, 0.00020969701290596277, 0.0002376321208430454, 0.0002655672433320433, 0.00029350235126912594, 0.0003214374592062086, 0.00034937256714329123, 0.00037730770418420434, 0.000405242812121287, 0.00043317792005836964, 0.00046111305709928274, 0.0004890481941401958, 0.000516983272973448, 0.0005449184100143611, 0.0005728534888476133, 0.0006007886258885264, 0.0006287237629294395, 0.0006566588999703526, 0.0006845939205959439, 0.000712529057636857, 0.0007404641364701092, 0.0007683992735110223, 0.0007963343523442745, 0.0008242694893851876, 0.0008522046264261007, 0.0008801397634670138, 0.000908074842300266, 0.0009360099793411791, 0.0009639450581744313, 0.0009918801952153444, 0.0010198153322562575, 0.0010477504692971706, 0.001075685489922762, 0.001103620626963675, 0.0011315557640045881, 0.0011594909010455012, 0.0011874260380864143, 0.0012153610587120056, 0.0012432961957529187, 0.0012712313327938318, 0.001299166469834745, 0.001327101606875658, 0.0013550366275012493, 0.0013829717645421624, 0.0014109069015830755, 0.0014388419222086668, 0.00146677705924958, 0.001494712196290493, 0.0015226473333314061, 0.0015505824703723192, 0.0015785176074132323]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 7.0, 7.0, 4.0, 8.0, 10.0, 12.0, 13.0, 15.0, 24.0, 24.0, 28.0, 29.0, 34.0, 33.0, 34.0, 29.0, 37.0, 40.0, 39.0, 42.0, 51.0, 45.0, 46.0, 41.0, 34.0, 36.0, 33.0, 35.0, 29.0, 26.0, 21.0, 26.0, 12.0, 14.0, 12.0, 19.0, 17.0, 8.0, 11.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002823472023010254, -0.00027278438210487366, -0.0002632215619087219, -0.0002536587417125702, -0.00024409592151641846, -0.00023453310132026672, -0.000224970281124115, -0.00021540746092796326, -0.00020584464073181152, -0.0001962818205356598, -0.00018671900033950806, -0.00017715618014335632, -0.0001675933599472046, -0.00015803053975105286, -0.00014846771955490112, -0.0001389048993587494, -0.00012934207916259766, -0.00011977925896644592, -0.00011021643877029419, -0.00010065361857414246, -9.109079837799072e-05, -8.152797818183899e-05, -7.196515798568726e-05, -6.240233778953552e-05, -5.283951759338379e-05, -4.3276697397232056e-05, -3.371387720108032e-05, -2.415105700492859e-05, -1.4588236808776855e-05, -5.025416612625122e-06, 4.537403583526611e-06, 1.4100223779678345e-05, 2.3663043975830078e-05, 3.322586417198181e-05, 4.2788684368133545e-05, 5.235150456428528e-05, 6.191432476043701e-05, 7.147714495658875e-05, 8.103996515274048e-05, 9.060278534889221e-05, 0.00010016560554504395, 0.00010972842574119568, 0.00011929124593734741, 0.00012885406613349915, 0.00013841688632965088, 0.0001479797065258026, 0.00015754252672195435, 0.00016710534691810608, 0.0001766681671142578, 0.00018623098731040955, 0.00019579380750656128, 0.000205356627702713, 0.00021491944789886475, 0.00022448226809501648, 0.0002340450882911682, 0.00024360790848731995, 0.0002531707286834717, 0.0002627335488796234, 0.00027229636907577515, 0.0002818591892719269, 0.0002914220094680786, 0.00030098482966423035, 0.0003105476498603821, 0.0003201104700565338, 0.00032967329025268555]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 9.0, 5.0, 5.0, 9.0, 10.0, 4.0, 12.0, 11.0, 14.0, 11.0, 8.0, 17.0, 39.0, 41.0, 26.0, 22.0, 29.0, 25.0, 41.0, 34.0, 34.0, 47.0, 35.0, 36.0, 43.0, 46.0, 44.0, 35.0, 34.0, 30.0, 40.0, 24.0, 38.0, 18.0, 18.0, 13.0, 17.0, 9.0, 12.0, 11.0, 8.0, 11.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.728546142578125, -3.59576416015625, -3.462982177734375, -3.3302001953125, -3.197418212890625, -3.06463623046875, -2.931854248046875, -2.799072265625, -2.666290283203125, -2.53350830078125, -2.400726318359375, -2.2679443359375, -2.135162353515625, -2.00238037109375, -1.869598388671875, -1.73681640625, -1.604034423828125, -1.47125244140625, -1.338470458984375, -1.2056884765625, -1.072906494140625, -0.94012451171875, -0.807342529296875, -0.674560546875, -0.541778564453125, -0.40899658203125, -0.276214599609375, -0.1434326171875, -0.010650634765625, 0.12213134765625, 0.254913330078125, 0.3876953125, 0.520477294921875, 0.65325927734375, 0.786041259765625, 0.9188232421875, 1.051605224609375, 1.18438720703125, 1.317169189453125, 1.449951171875, 1.582733154296875, 1.71551513671875, 1.848297119140625, 1.9810791015625, 2.113861083984375, 2.24664306640625, 2.379425048828125, 2.51220703125, 2.644989013671875, 2.77777099609375, 2.910552978515625, 3.0433349609375, 3.176116943359375, 3.30889892578125, 3.441680908203125, 3.574462890625, 3.707244873046875, 3.84002685546875, 3.972808837890625, 4.1055908203125, 4.238372802734375, 4.37115478515625, 4.503936767578125, 4.63671875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 13.0, 13.0, 11.0, 32.0, 29.0, 42.0, 51.0, 84.0, 89.0, 142.0, 257.0, 426.0, 852.0, 1909.0, 4649.0, 12598.0, 37491.0, 111973.0, 343340.0, 357805.0, 116041.0, 38558.0, 13209.0, 4871.0, 1981.0, 865.0, 435.0, 270.0, 158.0, 91.0, 73.0, 47.0, 46.0, 24.0, 26.0, 15.0, 12.0, 5.0, 11.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.25274658203125, -4.0953369140625, -3.93792724609375, -3.780517578125, -3.62310791015625, -3.4656982421875, -3.30828857421875, -3.15087890625, -2.99346923828125, -2.8360595703125, -2.67864990234375, -2.521240234375, -2.36383056640625, -2.2064208984375, -2.04901123046875, -1.8916015625, -1.73419189453125, -1.5767822265625, -1.41937255859375, -1.261962890625, -1.10455322265625, -0.9471435546875, -0.78973388671875, -0.63232421875, -0.47491455078125, -0.3175048828125, -0.16009521484375, -0.002685546875, 0.15472412109375, 0.3121337890625, 0.46954345703125, 0.626953125, 0.78436279296875, 0.9417724609375, 1.09918212890625, 1.256591796875, 1.41400146484375, 1.5714111328125, 1.72882080078125, 1.88623046875, 2.04364013671875, 2.2010498046875, 2.35845947265625, 2.515869140625, 2.67327880859375, 2.8306884765625, 2.98809814453125, 3.1455078125, 3.30291748046875, 3.4603271484375, 3.61773681640625, 3.775146484375, 3.93255615234375, 4.0899658203125, 4.24737548828125, 4.40478515625, 4.56219482421875, 4.7196044921875, 4.87701416015625, 5.034423828125, 5.19183349609375, 5.3492431640625, 5.50665283203125, 5.6640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 3.0, 8.0, 8.0, 7.0, 16.0, 18.0, 23.0, 22.0, 26.0, 25.0, 41.0, 39.0, 39.0, 49.0, 55.0, 84.0, 203.0, 1519.0, 299.0, 113.0, 64.0, 40.0, 44.0, 42.0, 42.0, 29.0, 27.0, 35.0, 24.0, 22.0, 12.0, 18.0, 11.0, 9.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.522705078125, -14.98291015625, -14.443115234375, -13.9033203125, -13.363525390625, -12.82373046875, -12.283935546875, -11.744140625, -11.204345703125, -10.66455078125, -10.124755859375, -9.5849609375, -9.045166015625, -8.50537109375, -7.965576171875, -7.42578125, -6.885986328125, -6.34619140625, -5.806396484375, -5.2666015625, -4.726806640625, -4.18701171875, -3.647216796875, -3.107421875, -2.567626953125, -2.02783203125, -1.488037109375, -0.9482421875, -0.408447265625, 0.13134765625, 0.671142578125, 1.2109375, 1.750732421875, 2.29052734375, 2.830322265625, 3.3701171875, 3.909912109375, 4.44970703125, 4.989501953125, 5.529296875, 6.069091796875, 6.60888671875, 7.148681640625, 7.6884765625, 8.228271484375, 8.76806640625, 9.307861328125, 9.84765625, 10.387451171875, 10.92724609375, 11.467041015625, 12.0068359375, 12.546630859375, 13.08642578125, 13.626220703125, 14.166015625, 14.705810546875, 15.24560546875, 15.785400390625, 16.3251953125, 16.864990234375, 17.40478515625, 17.944580078125, 18.484375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 21.0, 17.0, 18.0, 27.0, 46.0, 64.0, 105.0, 176.0, 315.0, 888.0, 9105.0, 3129714.0, 3889.0, 626.0, 276.0, 133.0, 93.0, 52.0, 34.0, 28.0, 20.0, 15.0, 8.0, 13.0, 8.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.875, -105.1357421875, -102.396484375, -99.6572265625, -96.91796875, -94.1787109375, -91.439453125, -88.7001953125, -85.9609375, -83.2216796875, -80.482421875, -77.7431640625, -75.00390625, -72.2646484375, -69.525390625, -66.7861328125, -64.046875, -61.3076171875, -58.568359375, -55.8291015625, -53.08984375, -50.3505859375, -47.611328125, -44.8720703125, -42.1328125, -39.3935546875, -36.654296875, -33.9150390625, -31.17578125, -28.4365234375, -25.697265625, -22.9580078125, -20.21875, -17.4794921875, -14.740234375, -12.0009765625, -9.26171875, -6.5224609375, -3.783203125, -1.0439453125, 1.6953125, 4.4345703125, 7.173828125, 9.9130859375, 12.65234375, 15.3916015625, 18.130859375, 20.8701171875, 23.609375, 26.3486328125, 29.087890625, 31.8271484375, 34.56640625, 37.3056640625, 40.044921875, 42.7841796875, 45.5234375, 48.2626953125, 51.001953125, 53.7412109375, 56.48046875, 59.2197265625, 61.958984375, 64.6982421875, 67.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 12.0, 42.0, 97.0, 232.0, 274.0, 225.0, 94.0, 25.0, 8.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.21437072753906, -65.99598693847656, -64.77759552001953, -63.559207916259766, -62.3408203125, -61.1224365234375, -59.90404510498047, -58.68566131591797, -57.4672737121582, -56.24888610839844, -55.03049850463867, -53.812110900878906, -52.59372329711914, -51.375335693359375, -50.156951904296875, -48.93856430053711, -47.720176696777344, -46.50178909301758, -45.28340148925781, -44.06501388549805, -42.84662628173828, -41.62824249267578, -40.40985107421875, -39.19146728515625, -37.97307586669922, -36.75468826293945, -35.53630065917969, -34.31791305541992, -33.099525451660156, -31.881139755249023, -30.662752151489258, -29.444366455078125, -28.225975036621094, -27.007587432861328, -25.789199829101562, -24.570812225341797, -23.352426528930664, -22.1340389251709, -20.915651321411133, -19.697265625, -18.478878021240234, -17.26049041748047, -16.042102813720703, -14.823716163635254, -13.605329513549805, -12.386941909790039, -11.168554306030273, -9.950167655944824, -8.731780052185059, -7.513392925262451, -6.295005798339844, -5.076618194580078, -3.8582310676574707, -2.6398439407348633, -1.4214563369750977, -0.20306968688964844, 1.0153179168701172, 2.2337050437927246, 3.452092409133911, 4.670479774475098, 5.888866901397705, 7.1072540283203125, 8.325641632080078, 9.544028282165527, 10.762415885925293]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 11.0, 11.0, 13.0, 6.0, 16.0, 18.0, 22.0, 15.0, 21.0, 17.0, 30.0, 37.0, 28.0, 39.0, 38.0, 27.0, 33.0, 34.0, 38.0, 34.0, 40.0, 44.0, 31.0, 35.0, 33.0, 31.0, 31.0, 32.0, 30.0, 19.0, 27.0, 25.0, 19.0, 22.0, 14.0, 15.0, 14.0, 11.0, 6.0, 7.0, 2.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-37.522613525390625, -36.37358474731445, -35.22455596923828, -34.075531005859375, -32.9265022277832, -31.77747344970703, -30.628446578979492, -29.479419708251953, -28.33039093017578, -27.18136215209961, -26.03233528137207, -24.88330841064453, -23.73427963256836, -22.585250854492188, -21.43622398376465, -20.28719711303711, -19.138168334960938, -17.989139556884766, -16.840112686157227, -15.691084861755371, -14.542057037353516, -13.39302921295166, -12.244001388549805, -11.09497356414795, -9.945945739746094, -8.796917915344238, -7.647890090942383, -6.498862266540527, -5.349834442138672, -4.200806617736816, -3.051778793334961, -1.9027509689331055, -0.75372314453125, 0.39530467987060547, 1.544332504272461, 2.6933603286743164, 3.842388153076172, 4.991415977478027, 6.140443801879883, 7.289471626281738, 8.438499450683594, 9.58752727508545, 10.736555099487305, 11.88558292388916, 13.034610748291016, 14.183638572692871, 15.332666397094727, 16.481693267822266, 17.630722045898438, 18.77975082397461, 19.92877769470215, 21.077804565429688, 22.22683334350586, 23.37586212158203, 24.52488899230957, 25.67391586303711, 26.82294464111328, 27.971973419189453, 29.121000289916992, 30.27002716064453, 31.419055938720703, 32.568084716796875, 33.71710968017578, 34.86613845825195, 36.015167236328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 2.0, 8.0, 6.0, 8.0, 10.0, 12.0, 15.0, 6.0, 18.0, 17.0, 16.0, 24.0, 26.0, 30.0, 33.0, 29.0, 26.0, 40.0, 49.0, 40.0, 35.0, 38.0, 35.0, 40.0, 40.0, 35.0, 47.0, 29.0, 33.0, 34.0, 40.0, 21.0, 17.0, 17.0, 22.0, 16.0, 18.0, 9.0, 4.0, 7.0, 9.0, 9.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.1077880859375, -3.965576171875, -3.8233642578125, -3.68115234375, -3.5389404296875, -3.396728515625, -3.2545166015625, -3.1123046875, -2.9700927734375, -2.827880859375, -2.6856689453125, -2.54345703125, -2.4012451171875, -2.259033203125, -2.1168212890625, -1.974609375, -1.8323974609375, -1.690185546875, -1.5479736328125, -1.40576171875, -1.2635498046875, -1.121337890625, -0.9791259765625, -0.8369140625, -0.6947021484375, -0.552490234375, -0.4102783203125, -0.26806640625, -0.1258544921875, 0.016357421875, 0.1585693359375, 0.30078125, 0.4429931640625, 0.585205078125, 0.7274169921875, 0.86962890625, 1.0118408203125, 1.154052734375, 1.2962646484375, 1.4384765625, 1.5806884765625, 1.722900390625, 1.8651123046875, 2.00732421875, 2.1495361328125, 2.291748046875, 2.4339599609375, 2.576171875, 2.7183837890625, 2.860595703125, 3.0028076171875, 3.14501953125, 3.2872314453125, 3.429443359375, 3.5716552734375, 3.7138671875, 3.8560791015625, 3.998291015625, 4.1405029296875, 4.28271484375, 4.4249267578125, 4.567138671875, 4.7093505859375, 4.8515625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 6.0, 12.0, 7.0, 12.0, 11.0, 10.0, 21.0, 19.0, 22.0, 33.0, 38.0, 38.0, 30.0, 48.0, 65.0, 91.0, 123.0, 180.0, 339.0, 646.0, 2158.0, 16028.0, 250781.0, 2046555.0, 1691085.0, 170778.0, 11605.0, 1862.0, 605.0, 299.0, 185.0, 115.0, 77.0, 71.0, 57.0, 48.0, 31.0, 32.0, 25.0, 22.0, 24.0, 16.0, 11.0, 12.0, 10.0, 9.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.4921875, -10.16357421875, -9.8349609375, -9.50634765625, -9.177734375, -8.84912109375, -8.5205078125, -8.19189453125, -7.86328125, -7.53466796875, -7.2060546875, -6.87744140625, -6.548828125, -6.22021484375, -5.8916015625, -5.56298828125, -5.234375, -4.90576171875, -4.5771484375, -4.24853515625, -3.919921875, -3.59130859375, -3.2626953125, -2.93408203125, -2.60546875, -2.27685546875, -1.9482421875, -1.61962890625, -1.291015625, -0.96240234375, -0.6337890625, -0.30517578125, 0.0234375, 0.35205078125, 0.6806640625, 1.00927734375, 1.337890625, 1.66650390625, 1.9951171875, 2.32373046875, 2.65234375, 2.98095703125, 3.3095703125, 3.63818359375, 3.966796875, 4.29541015625, 4.6240234375, 4.95263671875, 5.28125, 5.60986328125, 5.9384765625, 6.26708984375, 6.595703125, 6.92431640625, 7.2529296875, 7.58154296875, 7.91015625, 8.23876953125, 8.5673828125, 8.89599609375, 9.224609375, 9.55322265625, 9.8818359375, 10.21044921875, 10.5390625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 16.0, 20.0, 28.0, 29.0, 31.0, 53.0, 48.0, 74.0, 81.0, 122.0, 161.0, 202.0, 273.0, 339.0, 391.0, 398.0, 389.0, 301.0, 254.0, 203.0, 170.0, 118.0, 74.0, 52.0, 51.0, 29.0, 39.0, 21.0, 23.0, 15.0, 17.0, 6.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0234375, -8.76068115234375, -8.4979248046875, -8.23516845703125, -7.972412109375, -7.70965576171875, -7.4468994140625, -7.18414306640625, -6.92138671875, -6.65863037109375, -6.3958740234375, -6.13311767578125, -5.870361328125, -5.60760498046875, -5.3448486328125, -5.08209228515625, -4.8193359375, -4.55657958984375, -4.2938232421875, -4.03106689453125, -3.768310546875, -3.50555419921875, -3.2427978515625, -2.98004150390625, -2.71728515625, -2.45452880859375, -2.1917724609375, -1.92901611328125, -1.666259765625, -1.40350341796875, -1.1407470703125, -0.87799072265625, -0.615234375, -0.35247802734375, -0.0897216796875, 0.17303466796875, 0.435791015625, 0.69854736328125, 0.9613037109375, 1.22406005859375, 1.48681640625, 1.74957275390625, 2.0123291015625, 2.27508544921875, 2.537841796875, 2.80059814453125, 3.0633544921875, 3.32611083984375, 3.5888671875, 3.85162353515625, 4.1143798828125, 4.37713623046875, 4.639892578125, 4.90264892578125, 5.1654052734375, 5.42816162109375, 5.69091796875, 5.95367431640625, 6.2164306640625, 6.47918701171875, 6.741943359375, 7.00469970703125, 7.2674560546875, 7.53021240234375, 7.79296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 8.0, 17.0, 21.0, 28.0, 31.0, 40.0, 52.0, 64.0, 87.0, 122.0, 182.0, 219.0, 304.0, 422.0, 1140.0, 69319.0, 4082015.0, 37622.0, 1007.0, 405.0, 302.0, 210.0, 164.0, 102.0, 86.0, 70.0, 55.0, 53.0, 30.0, 18.0, 25.0, 13.0, 5.0, 12.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.15625, -36.86083984375, -35.5654296875, -34.27001953125, -32.974609375, -31.67919921875, -30.3837890625, -29.08837890625, -27.79296875, -26.49755859375, -25.2021484375, -23.90673828125, -22.611328125, -21.31591796875, -20.0205078125, -18.72509765625, -17.4296875, -16.13427734375, -14.8388671875, -13.54345703125, -12.248046875, -10.95263671875, -9.6572265625, -8.36181640625, -7.06640625, -5.77099609375, -4.4755859375, -3.18017578125, -1.884765625, -0.58935546875, 0.7060546875, 2.00146484375, 3.296875, 4.59228515625, 5.8876953125, 7.18310546875, 8.478515625, 9.77392578125, 11.0693359375, 12.36474609375, 13.66015625, 14.95556640625, 16.2509765625, 17.54638671875, 18.841796875, 20.13720703125, 21.4326171875, 22.72802734375, 24.0234375, 25.31884765625, 26.6142578125, 27.90966796875, 29.205078125, 30.50048828125, 31.7958984375, 33.09130859375, 34.38671875, 35.68212890625, 36.9775390625, 38.27294921875, 39.568359375, 40.86376953125, 42.1591796875, 43.45458984375, 44.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 24.0, 336.0, 531.0, 118.0, 7.0, 1.0, 1.0], "bins": [-378.9446716308594, -372.55291748046875, -366.1611328125, -359.7693786621094, -353.3775939941406, -346.98583984375, -340.59405517578125, -334.2023010253906, -327.8105163574219, -321.41876220703125, -315.0269775390625, -308.6352233886719, -302.2434387207031, -295.8516845703125, -289.45989990234375, -283.0681457519531, -276.6763916015625, -270.2846374511719, -263.8928527832031, -257.5010986328125, -251.10931396484375, -244.71755981445312, -238.32577514648438, -231.93402099609375, -225.542236328125, -219.1504669189453, -212.75869750976562, -206.36692810058594, -199.97515869140625, -193.58340454101562, -187.19161987304688, -180.79986572265625, -174.40809631347656, -168.01632690429688, -161.6245574951172, -155.2327880859375, -148.8410186767578, -142.44924926757812, -136.0574951171875, -129.6657257080078, -123.27395629882812, -116.88218688964844, -110.49041748046875, -104.09864807128906, -97.7068862915039, -91.31511688232422, -84.92334747314453, -78.53158569335938, -72.13980865478516, -65.74803924560547, -59.35627365112305, -52.96450424194336, -46.57273864746094, -40.18096923828125, -33.78919982910156, -27.39743423461914, -21.005666732788086, -14.613899230957031, -8.22213077545166, -1.830362319946289, 4.561405181884766, 10.95317268371582, 17.344942092895508, 23.73670768737793, 30.128477096557617]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 1.0, 6.0, 2.0, 12.0, 4.0, 15.0, 21.0, 19.0, 17.0, 16.0, 24.0, 24.0, 32.0, 35.0, 30.0, 33.0, 31.0, 47.0, 44.0, 42.0, 39.0, 32.0, 41.0, 36.0, 36.0, 34.0, 39.0, 21.0, 30.0, 25.0, 24.0, 26.0, 22.0, 29.0, 16.0, 15.0, 17.0, 14.0, 10.0, 4.0, 7.0, 3.0, 5.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.848724365234375, -25.951616287231445, -25.054508209228516, -24.157400131225586, -23.260292053222656, -22.363182067871094, -21.466073989868164, -20.568965911865234, -19.671857833862305, -18.774749755859375, -17.877641677856445, -16.980533599853516, -16.083423614501953, -15.18631649017334, -14.289207458496094, -13.392099380493164, -12.494991302490234, -11.597883224487305, -10.700775146484375, -9.803666114807129, -8.9065580368042, -8.00944995880127, -7.112341403961182, -6.215232849121094, -5.318124771118164, -4.421016693115234, -3.5239081382751465, -2.6267998218536377, -1.729691505432129, -0.8325834274291992, 0.06452512741088867, 0.9616336822509766, 1.8587398529052734, 2.7558481693267822, 3.652956485748291, 4.550065040588379, 5.447173118591309, 6.344281196594238, 7.241389751434326, 8.138498306274414, 9.035606384277344, 9.932714462280273, 10.829822540283203, 11.72693157196045, 12.624039649963379, 13.521147727966309, 14.418256759643555, 15.315364837646484, 16.212472915649414, 17.109580993652344, 18.006689071655273, 18.903797149658203, 19.800907135009766, 20.698013305664062, 21.595123291015625, 22.492231369018555, 23.389339447021484, 24.286447525024414, 25.183555603027344, 26.080663681030273, 26.977771759033203, 27.874881744384766, 28.771989822387695, 29.669097900390625, 30.566205978393555]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 0.0, 8.0, 4.0, 5.0, 9.0, 7.0, 6.0, 21.0, 16.0, 17.0, 14.0, 29.0, 32.0, 13.0, 34.0, 31.0, 26.0, 35.0, 40.0, 38.0, 38.0, 46.0, 36.0, 43.0, 34.0, 42.0, 39.0, 41.0, 29.0, 31.0, 21.0, 27.0, 26.0, 15.0, 22.0, 18.0, 13.0, 24.0, 11.0, 12.0, 8.0, 4.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.13812255859375, -4.0028076171875, -3.86749267578125, -3.732177734375, -3.59686279296875, -3.4615478515625, -3.32623291015625, -3.19091796875, -3.05560302734375, -2.9202880859375, -2.78497314453125, -2.649658203125, -2.51434326171875, -2.3790283203125, -2.24371337890625, -2.1083984375, -1.97308349609375, -1.8377685546875, -1.70245361328125, -1.567138671875, -1.43182373046875, -1.2965087890625, -1.16119384765625, -1.02587890625, -0.89056396484375, -0.7552490234375, -0.61993408203125, -0.484619140625, -0.34930419921875, -0.2139892578125, -0.07867431640625, 0.056640625, 0.19195556640625, 0.3272705078125, 0.46258544921875, 0.597900390625, 0.73321533203125, 0.8685302734375, 1.00384521484375, 1.13916015625, 1.27447509765625, 1.4097900390625, 1.54510498046875, 1.680419921875, 1.81573486328125, 1.9510498046875, 2.08636474609375, 2.2216796875, 2.35699462890625, 2.4923095703125, 2.62762451171875, 2.762939453125, 2.89825439453125, 3.0335693359375, 3.16888427734375, 3.30419921875, 3.43951416015625, 3.5748291015625, 3.71014404296875, 3.845458984375, 3.98077392578125, 4.1160888671875, 4.25140380859375, 4.38671875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 19.0, 11.0, 12.0, 23.0, 47.0, 59.0, 100.0, 140.0, 219.0, 344.0, 516.0, 785.0, 993.0, 1494.0, 2012.0, 3019.0, 4289.0, 6326.0, 9165.0, 13504.0, 20023.0, 29779.0, 45681.0, 72373.0, 127180.0, 301559.0, 163407.0, 86381.0, 53174.0, 34220.0, 22848.0, 15329.0, 10178.0, 7284.0, 4927.0, 3419.0, 2320.0, 1674.0, 1203.0, 840.0, 593.0, 365.0, 242.0, 187.0, 93.0, 66.0, 49.0, 33.0, 16.0, 12.0, 13.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9111328125, -0.8823623657226562, -0.8535919189453125, -0.8248214721679688, -0.796051025390625, -0.7672805786132812, -0.7385101318359375, -0.7097396850585938, -0.68096923828125, -0.6521987915039062, -0.6234283447265625, -0.5946578979492188, -0.565887451171875, -0.5371170043945312, -0.5083465576171875, -0.47957611083984375, -0.4508056640625, -0.42203521728515625, -0.3932647705078125, -0.36449432373046875, -0.335723876953125, -0.30695343017578125, -0.2781829833984375, -0.24941253662109375, -0.22064208984375, -0.19187164306640625, -0.1631011962890625, -0.13433074951171875, -0.105560302734375, -0.07678985595703125, -0.0480194091796875, -0.01924896240234375, 0.009521484375, 0.03829193115234375, 0.0670623779296875, 0.09583282470703125, 0.124603271484375, 0.15337371826171875, 0.1821441650390625, 0.21091461181640625, 0.23968505859375, 0.26845550537109375, 0.2972259521484375, 0.32599639892578125, 0.354766845703125, 0.38353729248046875, 0.4123077392578125, 0.44107818603515625, 0.4698486328125, 0.49861907958984375, 0.5273895263671875, 0.5561599731445312, 0.584930419921875, 0.6137008666992188, 0.6424713134765625, 0.6712417602539062, 0.70001220703125, 0.7287826538085938, 0.7575531005859375, 0.7863235473632812, 0.815093994140625, 0.8438644409179688, 0.8726348876953125, 0.9014053344726562, 0.93017578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 10.0, 8.0, 10.0, 18.0, 24.0, 20.0, 27.0, 30.0, 27.0, 29.0, 25.0, 40.0, 42.0, 35.0, 36.0, 38.0, 32.0, 1066.0, 37.0, 48.0, 37.0, 32.0, 35.0, 36.0, 46.0, 30.0, 31.0, 35.0, 19.0, 24.0, 14.0, 14.0, 12.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.9296875, -2.8397216796875, -2.749755859375, -2.6597900390625, -2.56982421875, -2.4798583984375, -2.389892578125, -2.2999267578125, -2.2099609375, -2.1199951171875, -2.030029296875, -1.9400634765625, -1.85009765625, -1.7601318359375, -1.670166015625, -1.5802001953125, -1.490234375, -1.4002685546875, -1.310302734375, -1.2203369140625, -1.13037109375, -1.0404052734375, -0.950439453125, -0.8604736328125, -0.7705078125, -0.6805419921875, -0.590576171875, -0.5006103515625, -0.41064453125, -0.3206787109375, -0.230712890625, -0.1407470703125, -0.05078125, 0.0391845703125, 0.129150390625, 0.2191162109375, 0.30908203125, 0.3990478515625, 0.489013671875, 0.5789794921875, 0.6689453125, 0.7589111328125, 0.848876953125, 0.9388427734375, 1.02880859375, 1.1187744140625, 1.208740234375, 1.2987060546875, 1.388671875, 1.4786376953125, 1.568603515625, 1.6585693359375, 1.74853515625, 1.8385009765625, 1.928466796875, 2.0184326171875, 2.1083984375, 2.1983642578125, 2.288330078125, 2.3782958984375, 2.46826171875, 2.5582275390625, 2.648193359375, 2.7381591796875, 2.828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 11.0, 22.0, 22.0, 34.0, 59.0, 70.0, 104.0, 165.0, 232.0, 377.0, 457.0, 819.0, 1242.0, 1934.0, 3176.0, 5300.0, 8866.0, 15227.0, 26460.0, 46965.0, 86744.0, 178607.0, 1411779.0, 140190.0, 73051.0, 40221.0, 22204.0, 12837.0, 7478.0, 4599.0, 2800.0, 1797.0, 1148.0, 722.0, 465.0, 326.0, 219.0, 125.0, 83.0, 60.0, 36.0, 21.0, 21.0, 15.0, 12.0, 10.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1435546875, -1.107086181640625, -1.07061767578125, -1.034149169921875, -0.9976806640625, -0.961212158203125, -0.92474365234375, -0.888275146484375, -0.851806640625, -0.815338134765625, -0.77886962890625, -0.742401123046875, -0.7059326171875, -0.669464111328125, -0.63299560546875, -0.596527099609375, -0.56005859375, -0.523590087890625, -0.48712158203125, -0.450653076171875, -0.4141845703125, -0.377716064453125, -0.34124755859375, -0.304779052734375, -0.268310546875, -0.231842041015625, -0.19537353515625, -0.158905029296875, -0.1224365234375, -0.085968017578125, -0.04949951171875, -0.013031005859375, 0.0234375, 0.059906005859375, 0.09637451171875, 0.132843017578125, 0.1693115234375, 0.205780029296875, 0.24224853515625, 0.278717041015625, 0.315185546875, 0.351654052734375, 0.38812255859375, 0.424591064453125, 0.4610595703125, 0.497528076171875, 0.53399658203125, 0.570465087890625, 0.60693359375, 0.643402099609375, 0.67987060546875, 0.716339111328125, 0.7528076171875, 0.789276123046875, 0.82574462890625, 0.862213134765625, 0.898681640625, 0.935150146484375, 0.97161865234375, 1.008087158203125, 1.0445556640625, 1.081024169921875, 1.11749267578125, 1.153961181640625, 1.1904296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 7.0, 5.0, 9.0, 11.0, 7.0, 12.0, 15.0, 23.0, 24.0, 22.0, 37.0, 38.0, 35.0, 58.0, 67.0, 58.0, 55.0, 50.0, 50.0, 53.0, 47.0, 44.0, 39.0, 37.0, 19.0, 19.0, 19.0, 18.0, 13.0, 11.0, 13.0, 11.0, 10.0, 6.0, 8.0, 7.0, 6.0, 0.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005254745483398438, -0.0005093887448310852, -0.0004933029413223267, -0.0004772171378135681, -0.00046113133430480957, -0.000445045530796051, -0.0004289597272872925, -0.00041287392377853394, -0.0003967881202697754, -0.00038070231676101685, -0.0003646165132522583, -0.00034853070974349976, -0.0003324449062347412, -0.00031635910272598267, -0.0003002732992172241, -0.0002841874957084656, -0.00026810169219970703, -0.0002520158886909485, -0.00023593008518218994, -0.0002198442816734314, -0.00020375847816467285, -0.0001876726746559143, -0.00017158687114715576, -0.00015550106763839722, -0.00013941526412963867, -0.00012332946062088013, -0.00010724365711212158, -9.115785360336304e-05, -7.507205009460449e-05, -5.898624658584595e-05, -4.29004430770874e-05, -2.6814639568328857e-05, -1.0728836059570312e-05, 5.356967449188232e-06, 2.1442770957946777e-05, 3.752857446670532e-05, 5.361437797546387e-05, 6.970018148422241e-05, 8.578598499298096e-05, 0.0001018717885017395, 0.00011795759201049805, 0.0001340433955192566, 0.00015012919902801514, 0.00016621500253677368, 0.00018230080604553223, 0.00019838660955429077, 0.00021447241306304932, 0.00023055821657180786, 0.0002466440200805664, 0.00026272982358932495, 0.0002788156270980835, 0.00029490143060684204, 0.0003109872341156006, 0.00032707303762435913, 0.0003431588411331177, 0.0003592446446418762, 0.00037533044815063477, 0.0003914162516593933, 0.00040750205516815186, 0.0004235878586769104, 0.00043967366218566895, 0.0004557594656944275, 0.00047184526920318604, 0.0004879310727119446, 0.0005040168762207031]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 3.0, 7.0, 6.0, 8.0, 9.0, 6.0, 12.0, 20.0, 22.0, 24.0, 23.0, 36.0, 51.0, 58.0, 67.0, 121.0, 180.0, 432.0, 1523.0, 582451.0, 461018.0, 1471.0, 405.0, 176.0, 116.0, 57.0, 53.0, 38.0, 31.0, 25.0, 18.0, 18.0, 12.0, 8.0, 9.0, 6.0, 7.0, 6.0, 4.0, 0.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01116943359375, -0.010770320892333984, -0.010371208190917969, -0.009972095489501953, -0.009572982788085938, -0.009173870086669922, -0.008774757385253906, -0.00837564468383789, -0.007976531982421875, -0.007577419281005859, -0.007178306579589844, -0.006779193878173828, -0.0063800811767578125, -0.005980968475341797, -0.005581855773925781, -0.005182743072509766, -0.00478363037109375, -0.004384517669677734, -0.003985404968261719, -0.003586292266845703, -0.0031871795654296875, -0.002788066864013672, -0.0023889541625976562, -0.0019898414611816406, -0.001590728759765625, -0.0011916160583496094, -0.0007925033569335938, -0.0003933906555175781, 5.7220458984375e-06, 0.0004048347473144531, 0.0008039474487304688, 0.0012030601501464844, 0.0016021728515625, 0.0020012855529785156, 0.0024003982543945312, 0.002799510955810547, 0.0031986236572265625, 0.003597736358642578, 0.003996849060058594, 0.004395961761474609, 0.004795074462890625, 0.005194187164306641, 0.005593299865722656, 0.005992412567138672, 0.0063915252685546875, 0.006790637969970703, 0.007189750671386719, 0.007588863372802734, 0.00798797607421875, 0.008387088775634766, 0.008786201477050781, 0.009185314178466797, 0.009584426879882812, 0.009983539581298828, 0.010382652282714844, 0.01078176498413086, 0.011180877685546875, 0.01157999038696289, 0.011979103088378906, 0.012378215789794922, 0.012777328491210938, 0.013176441192626953, 0.013575553894042969, 0.013974666595458984, 0.014373779296875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 12.0, 26.0, 161.0, 399.0, 314.0, 89.0, 16.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0024153057020157576, -0.0023727656807750463, -0.002330225659534335, -0.002287685638293624, -0.0022451456170529127, -0.002202605362981558, -0.0021600653417408466, -0.0021175253205001354, -0.002074985299259424, -0.002032445278018713, -0.001989905256778002, -0.0019473651191219687, -0.0019048250978812575, -0.0018622850766405463, -0.0018197450553998351, -0.001777204917743802, -0.0017346648965030909, -0.0016921248752623796, -0.0016495848540216684, -0.0016070447163656354, -0.0015645046951249242, -0.001521964673884213, -0.0014794246526435018, -0.0014368845149874687, -0.0013943446101620793, -0.0013518045889213681, -0.001309264567680657, -0.0012667244300246239, -0.0012241844087839127, -0.0011816443875432014, -0.0011391043663024902, -0.001096564345061779, -0.001054024207405746, -0.0010114841861650348, -0.0009689441067166626, -0.0009264040854759514, -0.0008838640060275793, -0.0008413239847868681, -0.0007987839635461569, -0.0007562438840977848, -0.0007137038046494126, -0.0006711637834087014, -0.0006286237039603293, -0.0005860836827196181, -0.000543543603271246, -0.0005010035820305347, -0.0004584635316859931, -0.0004159234813414514, -0.0003733834601007402, -0.0003308434097561985, -0.00028830335941165686, -0.00024576333817094564, -0.00020322327327448875, -0.00016068322292994708, -0.00011814318713732064, -7.560313679277897e-05, -3.30630864482373e-05, 9.476960258325562e-06, 5.2017006964888424e-05, 9.455705003347248e-05, 0.00013709710037801415, 0.00017963715072255582, 0.00022217718651518226, 0.0002647172368597239, 0.0003072572872042656]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 8.0, 4.0, 9.0, 5.0, 7.0, 13.0, 15.0, 13.0, 16.0, 18.0, 28.0, 36.0, 44.0, 45.0, 41.0, 50.0, 48.0, 43.0, 43.0, 41.0, 46.0, 49.0, 49.0, 48.0, 40.0, 27.0, 35.0, 30.0, 24.0, 32.0, 18.0, 16.0, 17.0, 15.0, 9.0, 11.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036776065826416016, -0.0003566090017557144, -0.0003454573452472687, -0.00033430568873882294, -0.0003231540322303772, -0.00031200237572193146, -0.0003008507192134857, -0.00028969906270504, -0.00027854740619659424, -0.0002673957496881485, -0.00025624409317970276, -0.000245092436671257, -0.00023394078016281128, -0.00022278912365436554, -0.0002116374671459198, -0.00020048581063747406, -0.00018933415412902832, -0.00017818249762058258, -0.00016703084111213684, -0.0001558791846036911, -0.00014472752809524536, -0.00013357587158679962, -0.00012242421507835388, -0.00011127255856990814, -0.0001001209020614624, -8.896924555301666e-05, -7.781758904457092e-05, -6.666593253612518e-05, -5.551427602767944e-05, -4.4362619519233704e-05, -3.3210963010787964e-05, -2.2059306502342224e-05, -1.0907649993896484e-05, 2.4400651454925537e-07, 1.1395663022994995e-05, 2.2547319531440735e-05, 3.3698976039886475e-05, 4.4850632548332214e-05, 5.6002289056777954e-05, 6.71539455652237e-05, 7.830560207366943e-05, 8.945725858211517e-05, 0.00010060891509056091, 0.00011176057159900665, 0.0001229122281074524, 0.00013406388461589813, 0.00014521554112434387, 0.0001563671976327896, 0.00016751885414123535, 0.0001786705106496811, 0.00018982216715812683, 0.00020097382366657257, 0.0002121254801750183, 0.00022327713668346405, 0.0002344287931919098, 0.00024558044970035553, 0.00025673210620880127, 0.000267883762717247, 0.00027903541922569275, 0.0002901870757341385, 0.00030133873224258423, 0.00031249038875102997, 0.0003236420452594757, 0.00033479370176792145, 0.0003459453582763672]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 0.0, 8.0, 4.0, 5.0, 9.0, 7.0, 6.0, 21.0, 16.0, 17.0, 14.0, 29.0, 32.0, 13.0, 34.0, 31.0, 26.0, 35.0, 40.0, 38.0, 38.0, 46.0, 36.0, 43.0, 34.0, 42.0, 39.0, 41.0, 29.0, 31.0, 21.0, 27.0, 26.0, 15.0, 22.0, 18.0, 13.0, 24.0, 11.0, 12.0, 8.0, 4.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.13812255859375, -4.0028076171875, -3.86749267578125, -3.732177734375, -3.59686279296875, -3.4615478515625, -3.32623291015625, -3.19091796875, -3.05560302734375, -2.9202880859375, -2.78497314453125, -2.649658203125, -2.51434326171875, -2.3790283203125, -2.24371337890625, -2.1083984375, -1.97308349609375, -1.8377685546875, -1.70245361328125, -1.567138671875, -1.43182373046875, -1.2965087890625, -1.16119384765625, -1.02587890625, -0.89056396484375, -0.7552490234375, -0.61993408203125, -0.484619140625, -0.34930419921875, -0.2139892578125, -0.07867431640625, 0.056640625, 0.19195556640625, 0.3272705078125, 0.46258544921875, 0.597900390625, 0.73321533203125, 0.8685302734375, 1.00384521484375, 1.13916015625, 1.27447509765625, 1.4097900390625, 1.54510498046875, 1.680419921875, 1.81573486328125, 1.9510498046875, 2.08636474609375, 2.2216796875, 2.35699462890625, 2.4923095703125, 2.62762451171875, 2.762939453125, 2.89825439453125, 3.0335693359375, 3.16888427734375, 3.30419921875, 3.43951416015625, 3.5748291015625, 3.71014404296875, 3.845458984375, 3.98077392578125, 4.1160888671875, 4.25140380859375, 4.38671875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 10.0, 9.0, 11.0, 10.0, 12.0, 20.0, 18.0, 26.0, 50.0, 52.0, 118.0, 192.0, 353.0, 660.0, 1270.0, 2552.0, 4955.0, 9991.0, 20287.0, 44634.0, 108413.0, 275024.0, 334703.0, 139969.0, 55966.0, 24545.0, 12240.0, 6169.0, 2960.0, 1540.0, 797.0, 411.0, 203.0, 123.0, 73.0, 44.0, 21.0, 27.0, 17.0, 21.0, 11.0, 10.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.87530517578125, -3.7467041015625, -3.61810302734375, -3.489501953125, -3.36090087890625, -3.2322998046875, -3.10369873046875, -2.97509765625, -2.84649658203125, -2.7178955078125, -2.58929443359375, -2.460693359375, -2.33209228515625, -2.2034912109375, -2.07489013671875, -1.9462890625, -1.81768798828125, -1.6890869140625, -1.56048583984375, -1.431884765625, -1.30328369140625, -1.1746826171875, -1.04608154296875, -0.91748046875, -0.78887939453125, -0.6602783203125, -0.53167724609375, -0.403076171875, -0.27447509765625, -0.1458740234375, -0.01727294921875, 0.111328125, 0.23992919921875, 0.3685302734375, 0.49713134765625, 0.625732421875, 0.75433349609375, 0.8829345703125, 1.01153564453125, 1.14013671875, 1.26873779296875, 1.3973388671875, 1.52593994140625, 1.654541015625, 1.78314208984375, 1.9117431640625, 2.04034423828125, 2.1689453125, 2.29754638671875, 2.4261474609375, 2.55474853515625, 2.683349609375, 2.81195068359375, 2.9405517578125, 3.06915283203125, 3.19775390625, 3.32635498046875, 3.4549560546875, 3.58355712890625, 3.712158203125, 3.84075927734375, 3.9693603515625, 4.09796142578125, 4.2265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 14.0, 17.0, 17.0, 17.0, 32.0, 31.0, 35.0, 40.0, 39.0, 47.0, 67.0, 101.0, 175.0, 1529.0, 344.0, 108.0, 63.0, 61.0, 45.0, 43.0, 39.0, 32.0, 22.0, 24.0, 16.0, 17.0, 13.0, 8.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.76904296875, -19.1474609375, -18.52587890625, -17.904296875, -17.28271484375, -16.6611328125, -16.03955078125, -15.41796875, -14.79638671875, -14.1748046875, -13.55322265625, -12.931640625, -12.31005859375, -11.6884765625, -11.06689453125, -10.4453125, -9.82373046875, -9.2021484375, -8.58056640625, -7.958984375, -7.33740234375, -6.7158203125, -6.09423828125, -5.47265625, -4.85107421875, -4.2294921875, -3.60791015625, -2.986328125, -2.36474609375, -1.7431640625, -1.12158203125, -0.5, 0.12158203125, 0.7431640625, 1.36474609375, 1.986328125, 2.60791015625, 3.2294921875, 3.85107421875, 4.47265625, 5.09423828125, 5.7158203125, 6.33740234375, 6.958984375, 7.58056640625, 8.2021484375, 8.82373046875, 9.4453125, 10.06689453125, 10.6884765625, 11.31005859375, 11.931640625, 12.55322265625, 13.1748046875, 13.79638671875, 14.41796875, 15.03955078125, 15.6611328125, 16.28271484375, 16.904296875, 17.52587890625, 18.1474609375, 18.76904296875, 19.390625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 7.0, 12.0, 19.0, 24.0, 27.0, 37.0, 54.0, 53.0, 104.0, 143.0, 248.0, 400.0, 940.0, 67395.0, 3071819.0, 2850.0, 592.0, 327.0, 213.0, 131.0, 78.0, 54.0, 34.0, 36.0, 29.0, 17.0, 13.0, 11.0, 7.0, 5.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.9375, -60.01611328125, -58.0947265625, -56.17333984375, -54.251953125, -52.33056640625, -50.4091796875, -48.48779296875, -46.56640625, -44.64501953125, -42.7236328125, -40.80224609375, -38.880859375, -36.95947265625, -35.0380859375, -33.11669921875, -31.1953125, -29.27392578125, -27.3525390625, -25.43115234375, -23.509765625, -21.58837890625, -19.6669921875, -17.74560546875, -15.82421875, -13.90283203125, -11.9814453125, -10.06005859375, -8.138671875, -6.21728515625, -4.2958984375, -2.37451171875, -0.453125, 1.46826171875, 3.3896484375, 5.31103515625, 7.232421875, 9.15380859375, 11.0751953125, 12.99658203125, 14.91796875, 16.83935546875, 18.7607421875, 20.68212890625, 22.603515625, 24.52490234375, 26.4462890625, 28.36767578125, 30.2890625, 32.21044921875, 34.1318359375, 36.05322265625, 37.974609375, 39.89599609375, 41.8173828125, 43.73876953125, 45.66015625, 47.58154296875, 49.5029296875, 51.42431640625, 53.345703125, 55.26708984375, 57.1884765625, 59.10986328125, 61.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 14.0, 411.0, 564.0, 27.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-211.0338134765625, -207.33335876464844, -203.6328887939453, -199.93243408203125, -196.2319793701172, -192.53152465820312, -188.8310546875, -185.13059997558594, -181.43014526367188, -177.7296905517578, -174.0292205810547, -170.32876586914062, -166.62831115722656, -162.9278564453125, -159.22738647460938, -155.5269317626953, -151.8264617919922, -148.12600708007812, -144.425537109375, -140.72508239746094, -137.02462768554688, -133.32415771484375, -129.6237030029297, -125.92324829101562, -122.22279357910156, -118.52233123779297, -114.8218765258789, -111.12141418457031, -107.42095947265625, -103.72049713134766, -100.02003479003906, -96.319580078125, -92.61911010742188, -88.91864776611328, -85.21819305419922, -81.51773071289062, -77.81727600097656, -74.11681365966797, -70.41635131835938, -66.71589660644531, -63.01544189453125, -59.31498336791992, -55.614524841308594, -51.9140625, -48.21360397338867, -44.513145446777344, -40.812686920166016, -37.11222839355469, -33.411766052246094, -29.711307525634766, -26.010847091674805, -22.310388565063477, -18.609928131103516, -14.909469604492188, -11.20901107788086, -7.508550643920898, -3.8080921173095703, -0.10763287544250488, 3.5928263664245605, 7.293285369873047, 10.993744850158691, 14.694204330444336, 18.394662857055664, 22.095123291015625, 25.795581817626953]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 2.0, 9.0, 1.0, 12.0, 13.0, 12.0, 7.0, 22.0, 22.0, 19.0, 23.0, 28.0, 30.0, 25.0, 34.0, 36.0, 29.0, 50.0, 58.0, 42.0, 38.0, 47.0, 47.0, 50.0, 48.0, 31.0, 29.0, 27.0, 23.0, 24.0, 20.0, 28.0, 17.0, 13.0, 21.0, 8.0, 14.0, 7.0, 11.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.97172546386719, -39.65695571899414, -38.342185974121094, -37.02741622924805, -35.712646484375, -34.39787673950195, -33.083106994628906, -31.768339157104492, -30.453569412231445, -29.1387996673584, -27.82402992248535, -26.509260177612305, -25.19449234008789, -23.879722595214844, -22.564952850341797, -21.25018310546875, -19.935413360595703, -18.620643615722656, -17.30587387084961, -15.991105079650879, -14.676335334777832, -13.361565589904785, -12.046796798706055, -10.732027053833008, -9.417257308959961, -8.102487564086914, -6.787718296051025, -5.472949028015137, -4.15817928314209, -2.843409538269043, -1.5286402702331543, -0.21387100219726562, 1.1008987426757812, 2.415668249130249, 3.730437755584717, 5.0452070236206055, 6.359976768493652, 7.674746513366699, 8.98951530456543, 10.304285049438477, 11.619054794311523, 12.93382453918457, 14.248594284057617, 15.563363075256348, 16.878131866455078, 18.192901611328125, 19.507671356201172, 20.82244110107422, 22.137210845947266, 23.451980590820312, 24.76675033569336, 26.081520080566406, 27.396289825439453, 28.7110595703125, 30.025827407836914, 31.34059715270996, 32.655364990234375, 33.97013473510742, 35.28490447998047, 36.599674224853516, 37.91444396972656, 39.22921371459961, 40.543983459472656, 41.85874938964844, 43.17352294921875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 6.0, 1.0, 9.0, 6.0, 6.0, 4.0, 10.0, 18.0, 11.0, 23.0, 18.0, 20.0, 17.0, 24.0, 31.0, 25.0, 27.0, 32.0, 39.0, 37.0, 42.0, 31.0, 41.0, 42.0, 45.0, 40.0, 37.0, 39.0, 28.0, 28.0, 26.0, 31.0, 21.0, 16.0, 23.0, 23.0, 14.0, 18.0, 13.0, 21.0, 8.0, 7.0, 11.0, 9.0, 4.0, 3.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.73046875, -4.5848388671875, -4.439208984375, -4.2935791015625, -4.14794921875, -4.0023193359375, -3.856689453125, -3.7110595703125, -3.5654296875, -3.4197998046875, -3.274169921875, -3.1285400390625, -2.98291015625, -2.8372802734375, -2.691650390625, -2.5460205078125, -2.400390625, -2.2547607421875, -2.109130859375, -1.9635009765625, -1.81787109375, -1.6722412109375, -1.526611328125, -1.3809814453125, -1.2353515625, -1.0897216796875, -0.944091796875, -0.7984619140625, -0.65283203125, -0.5072021484375, -0.361572265625, -0.2159423828125, -0.0703125, 0.0753173828125, 0.220947265625, 0.3665771484375, 0.51220703125, 0.6578369140625, 0.803466796875, 0.9490966796875, 1.0947265625, 1.2403564453125, 1.385986328125, 1.5316162109375, 1.67724609375, 1.8228759765625, 1.968505859375, 2.1141357421875, 2.259765625, 2.4053955078125, 2.551025390625, 2.6966552734375, 2.84228515625, 2.9879150390625, 3.133544921875, 3.2791748046875, 3.4248046875, 3.5704345703125, 3.716064453125, 3.8616943359375, 4.00732421875, 4.1529541015625, 4.298583984375, 4.4442138671875, 4.58984375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 7.0, 7.0, 11.0, 10.0, 8.0, 16.0, 13.0, 18.0, 26.0, 36.0, 54.0, 54.0, 67.0, 100.0, 130.0, 220.0, 474.0, 1466.0, 8941.0, 306519.0, 3096792.0, 756071.0, 19471.0, 2190.0, 662.0, 288.0, 152.0, 77.0, 77.0, 64.0, 51.0, 43.0, 25.0, 25.0, 24.0, 20.0, 11.0, 10.0, 9.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-16.359375, -15.886962890625, -15.41455078125, -14.942138671875, -14.4697265625, -13.997314453125, -13.52490234375, -13.052490234375, -12.580078125, -12.107666015625, -11.63525390625, -11.162841796875, -10.6904296875, -10.218017578125, -9.74560546875, -9.273193359375, -8.80078125, -8.328369140625, -7.85595703125, -7.383544921875, -6.9111328125, -6.438720703125, -5.96630859375, -5.493896484375, -5.021484375, -4.549072265625, -4.07666015625, -3.604248046875, -3.1318359375, -2.659423828125, -2.18701171875, -1.714599609375, -1.2421875, -0.769775390625, -0.29736328125, 0.175048828125, 0.6474609375, 1.119873046875, 1.59228515625, 2.064697265625, 2.537109375, 3.009521484375, 3.48193359375, 3.954345703125, 4.4267578125, 4.899169921875, 5.37158203125, 5.843994140625, 6.31640625, 6.788818359375, 7.26123046875, 7.733642578125, 8.2060546875, 8.678466796875, 9.15087890625, 9.623291015625, 10.095703125, 10.568115234375, 11.04052734375, 11.512939453125, 11.9853515625, 12.457763671875, 12.93017578125, 13.402587890625, 13.875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 12.0, 21.0, 36.0, 51.0, 58.0, 81.0, 149.0, 193.0, 289.0, 449.0, 603.0, 624.0, 488.0, 353.0, 243.0, 125.0, 98.0, 70.0, 33.0, 24.0, 23.0, 21.0, 9.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.9769287109375, -13.555419921875, -13.1339111328125, -12.71240234375, -12.2908935546875, -11.869384765625, -11.4478759765625, -11.0263671875, -10.6048583984375, -10.183349609375, -9.7618408203125, -9.34033203125, -8.9188232421875, -8.497314453125, -8.0758056640625, -7.654296875, -7.2327880859375, -6.811279296875, -6.3897705078125, -5.96826171875, -5.5467529296875, -5.125244140625, -4.7037353515625, -4.2822265625, -3.8607177734375, -3.439208984375, -3.0177001953125, -2.59619140625, -2.1746826171875, -1.753173828125, -1.3316650390625, -0.91015625, -0.4886474609375, -0.067138671875, 0.3543701171875, 0.77587890625, 1.1973876953125, 1.618896484375, 2.0404052734375, 2.4619140625, 2.8834228515625, 3.304931640625, 3.7264404296875, 4.14794921875, 4.5694580078125, 4.990966796875, 5.4124755859375, 5.833984375, 6.2554931640625, 6.677001953125, 7.0985107421875, 7.52001953125, 7.9415283203125, 8.363037109375, 8.7845458984375, 9.2060546875, 9.6275634765625, 10.049072265625, 10.4705810546875, 10.89208984375, 11.3135986328125, 11.735107421875, 12.1566162109375, 12.578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 12.0, 21.0, 21.0, 34.0, 46.0, 84.0, 124.0, 165.0, 325.0, 477.0, 1199.0, 681665.0, 3506683.0, 1905.0, 545.0, 317.0, 237.0, 137.0, 106.0, 70.0, 38.0, 33.0, 12.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.5, -56.556640625, -54.61328125, -52.669921875, -50.7265625, -48.783203125, -46.83984375, -44.896484375, -42.953125, -41.009765625, -39.06640625, -37.123046875, -35.1796875, -33.236328125, -31.29296875, -29.349609375, -27.40625, -25.462890625, -23.51953125, -21.576171875, -19.6328125, -17.689453125, -15.74609375, -13.802734375, -11.859375, -9.916015625, -7.97265625, -6.029296875, -4.0859375, -2.142578125, -0.19921875, 1.744140625, 3.6875, 5.630859375, 7.57421875, 9.517578125, 11.4609375, 13.404296875, 15.34765625, 17.291015625, 19.234375, 21.177734375, 23.12109375, 25.064453125, 27.0078125, 28.951171875, 30.89453125, 32.837890625, 34.78125, 36.724609375, 38.66796875, 40.611328125, 42.5546875, 44.498046875, 46.44140625, 48.384765625, 50.328125, 52.271484375, 54.21484375, 56.158203125, 58.1015625, 60.044921875, 61.98828125, 63.931640625, 65.875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 29.0, 184.0, 480.0, 268.0, 53.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.27511596679688, -171.4671173095703, -166.65911865234375, -161.85110473632812, -157.04310607910156, -152.235107421875, -147.42709350585938, -142.6190948486328, -137.81109619140625, -133.0030975341797, -128.19509887695312, -123.3870849609375, -118.57908630371094, -113.77108764648438, -108.96308135986328, -104.15507507324219, -99.34707641601562, -94.53907775878906, -89.73107147216797, -84.92306518554688, -80.11506652832031, -75.30706787109375, -70.49906158447266, -65.69105529785156, -60.883056640625, -56.07505416870117, -51.267051696777344, -46.459049224853516, -41.65104675292969, -36.84304428100586, -32.03504180908203, -27.227039337158203, -22.419036865234375, -17.611034393310547, -12.803031921386719, -7.995029449462891, -3.1870269775390625, 1.6209754943847656, 6.428977966308594, 11.236980438232422, 16.04498291015625, 20.852985382080078, 25.660987854003906, 30.468990325927734, 35.27699279785156, 40.08499526977539, 44.89299774169922, 49.70100021362305, 54.509002685546875, 59.3170051574707, 64.12500762939453, 68.93301391601562, 73.74101257324219, 78.54901123046875, 83.35701751708984, 88.16502380371094, 92.9730224609375, 97.78102111816406, 102.58902740478516, 107.39703369140625, 112.20503234863281, 117.01303100585938, 121.82103729248047, 126.62904357910156, 131.43704223632812]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 11.0, 13.0, 13.0, 13.0, 17.0, 15.0, 24.0, 24.0, 21.0, 18.0, 28.0, 42.0, 39.0, 38.0, 43.0, 32.0, 40.0, 39.0, 48.0, 41.0, 34.0, 50.0, 43.0, 39.0, 20.0, 22.0, 21.0, 22.0, 27.0, 26.0, 14.0, 15.0, 19.0, 13.0, 9.0, 3.0, 15.0, 5.0, 3.0, 6.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.30865478515625, -28.362224578857422, -27.415794372558594, -26.469364166259766, -25.52293586730957, -24.576505661010742, -23.630075454711914, -22.683645248413086, -21.73721694946289, -20.790786743164062, -19.844356536865234, -18.897926330566406, -17.95149803161621, -17.005067825317383, -16.058637619018555, -15.112207412719727, -14.165777206420898, -13.21934700012207, -12.272917747497559, -11.32648754119873, -10.380058288574219, -9.43362808227539, -8.487197875976562, -7.540768146514893, -6.594338417053223, -5.647908687591553, -4.701478958129883, -3.7550487518310547, -2.8086190223693848, -1.8621892929077148, -0.9157590866088867, 0.030670642852783203, 0.9770984649658203, 1.9235283136367798, 2.8699581623077393, 3.8163881301879883, 4.762817859649658, 5.709247589111328, 6.655677795410156, 7.602107524871826, 8.548537254333496, 9.494967460632324, 10.441396713256836, 11.387826919555664, 12.334257125854492, 13.280686378479004, 14.227116584777832, 15.173545837402344, 16.119976043701172, 17.06640625, 18.012836456298828, 18.959266662597656, 19.90569496154785, 20.85212516784668, 21.798555374145508, 22.744985580444336, 23.69141387939453, 24.63784408569336, 25.584274291992188, 26.530704498291016, 27.47713279724121, 28.42356300354004, 29.369993209838867, 30.316423416137695, 31.262853622436523]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 10.0, 8.0, 12.0, 11.0, 15.0, 14.0, 8.0, 20.0, 25.0, 18.0, 23.0, 34.0, 33.0, 45.0, 34.0, 37.0, 48.0, 45.0, 44.0, 37.0, 50.0, 42.0, 40.0, 38.0, 34.0, 29.0, 26.0, 23.0, 30.0, 27.0, 22.0, 14.0, 17.0, 15.0, 8.0, 16.0, 11.0, 3.0, 7.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.65191650390625, -4.4991455078125, -4.34637451171875, -4.193603515625, -4.04083251953125, -3.8880615234375, -3.73529052734375, -3.58251953125, -3.42974853515625, -3.2769775390625, -3.12420654296875, -2.971435546875, -2.81866455078125, -2.6658935546875, -2.51312255859375, -2.3603515625, -2.20758056640625, -2.0548095703125, -1.90203857421875, -1.749267578125, -1.59649658203125, -1.4437255859375, -1.29095458984375, -1.13818359375, -0.98541259765625, -0.8326416015625, -0.67987060546875, -0.527099609375, -0.37432861328125, -0.2215576171875, -0.06878662109375, 0.083984375, 0.23675537109375, 0.3895263671875, 0.54229736328125, 0.695068359375, 0.84783935546875, 1.0006103515625, 1.15338134765625, 1.30615234375, 1.45892333984375, 1.6116943359375, 1.76446533203125, 1.917236328125, 2.07000732421875, 2.2227783203125, 2.37554931640625, 2.5283203125, 2.68109130859375, 2.8338623046875, 2.98663330078125, 3.139404296875, 3.29217529296875, 3.4449462890625, 3.59771728515625, 3.75048828125, 3.90325927734375, 4.0560302734375, 4.20880126953125, 4.361572265625, 4.51434326171875, 4.6671142578125, 4.81988525390625, 4.97265625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 13.0, 10.0, 28.0, 26.0, 45.0, 58.0, 91.0, 136.0, 197.0, 293.0, 411.0, 585.0, 861.0, 1189.0, 1926.0, 2695.0, 3892.0, 5897.0, 8567.0, 12585.0, 19038.0, 28899.0, 45479.0, 76641.0, 149381.0, 330459.0, 149140.0, 76622.0, 46023.0, 29030.0, 18845.0, 12611.0, 8791.0, 5801.0, 3905.0, 2580.0, 1881.0, 1250.0, 830.0, 604.0, 404.0, 281.0, 183.0, 120.0, 92.0, 57.0, 34.0, 28.0, 12.0, 14.0, 8.0, 7.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0498046875, -1.0175018310546875, -0.985198974609375, -0.9528961181640625, -0.92059326171875, -0.8882904052734375, -0.855987548828125, -0.8236846923828125, -0.7913818359375, -0.7590789794921875, -0.726776123046875, -0.6944732666015625, -0.66217041015625, -0.6298675537109375, -0.597564697265625, -0.5652618408203125, -0.532958984375, -0.5006561279296875, -0.468353271484375, -0.4360504150390625, -0.40374755859375, -0.3714447021484375, -0.339141845703125, -0.3068389892578125, -0.2745361328125, -0.2422332763671875, -0.209930419921875, -0.1776275634765625, -0.14532470703125, -0.1130218505859375, -0.080718994140625, -0.0484161376953125, -0.01611328125, 0.0161895751953125, 0.048492431640625, 0.0807952880859375, 0.11309814453125, 0.1454010009765625, 0.177703857421875, 0.2100067138671875, 0.2423095703125, 0.2746124267578125, 0.306915283203125, 0.3392181396484375, 0.37152099609375, 0.4038238525390625, 0.436126708984375, 0.4684295654296875, 0.500732421875, 0.5330352783203125, 0.565338134765625, 0.5976409912109375, 0.62994384765625, 0.6622467041015625, 0.694549560546875, 0.7268524169921875, 0.7591552734375, 0.7914581298828125, 0.823760986328125, 0.8560638427734375, 0.88836669921875, 0.9206695556640625, 0.952972412109375, 0.9852752685546875, 1.017578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 9.0, 15.0, 14.0, 18.0, 15.0, 16.0, 34.0, 24.0, 32.0, 31.0, 32.0, 22.0, 47.0, 25.0, 33.0, 38.0, 44.0, 1054.0, 33.0, 51.0, 40.0, 31.0, 38.0, 34.0, 36.0, 23.0, 32.0, 30.0, 21.0, 24.0, 19.0, 16.0, 20.0, 12.0, 8.0, 11.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03515625, -2.94207763671875, -2.8489990234375, -2.75592041015625, -2.662841796875, -2.56976318359375, -2.4766845703125, -2.38360595703125, -2.29052734375, -2.19744873046875, -2.1043701171875, -2.01129150390625, -1.918212890625, -1.82513427734375, -1.7320556640625, -1.63897705078125, -1.5458984375, -1.45281982421875, -1.3597412109375, -1.26666259765625, -1.173583984375, -1.08050537109375, -0.9874267578125, -0.89434814453125, -0.80126953125, -0.70819091796875, -0.6151123046875, -0.52203369140625, -0.428955078125, -0.33587646484375, -0.2427978515625, -0.14971923828125, -0.056640625, 0.03643798828125, 0.1295166015625, 0.22259521484375, 0.315673828125, 0.40875244140625, 0.5018310546875, 0.59490966796875, 0.68798828125, 0.78106689453125, 0.8741455078125, 0.96722412109375, 1.060302734375, 1.15338134765625, 1.2464599609375, 1.33953857421875, 1.4326171875, 1.52569580078125, 1.6187744140625, 1.71185302734375, 1.804931640625, 1.89801025390625, 1.9910888671875, 2.08416748046875, 2.17724609375, 2.27032470703125, 2.3634033203125, 2.45648193359375, 2.549560546875, 2.64263916015625, 2.7357177734375, 2.82879638671875, 2.921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 1.0, 11.0, 8.0, 16.0, 28.0, 30.0, 71.0, 100.0, 147.0, 226.0, 341.0, 569.0, 876.0, 1391.0, 2254.0, 3658.0, 6073.0, 10034.0, 16960.0, 29203.0, 50523.0, 89955.0, 190686.0, 1396222.0, 130625.0, 70013.0, 39556.0, 23064.0, 13701.0, 7990.0, 4979.0, 2904.0, 1817.0, 1129.0, 718.0, 427.0, 275.0, 185.0, 113.0, 86.0, 55.0, 34.0, 30.0, 16.0, 12.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1962890625, -1.158050537109375, -1.11981201171875, -1.081573486328125, -1.0433349609375, -1.005096435546875, -0.96685791015625, -0.928619384765625, -0.890380859375, -0.852142333984375, -0.81390380859375, -0.775665283203125, -0.7374267578125, -0.699188232421875, -0.66094970703125, -0.622711181640625, -0.58447265625, -0.546234130859375, -0.50799560546875, -0.469757080078125, -0.4315185546875, -0.393280029296875, -0.35504150390625, -0.316802978515625, -0.278564453125, -0.240325927734375, -0.20208740234375, -0.163848876953125, -0.1256103515625, -0.087371826171875, -0.04913330078125, -0.010894775390625, 0.02734375, 0.065582275390625, 0.10382080078125, 0.142059326171875, 0.1802978515625, 0.218536376953125, 0.25677490234375, 0.295013427734375, 0.333251953125, 0.371490478515625, 0.40972900390625, 0.447967529296875, 0.4862060546875, 0.524444580078125, 0.56268310546875, 0.600921630859375, 0.63916015625, 0.677398681640625, 0.71563720703125, 0.753875732421875, 0.7921142578125, 0.830352783203125, 0.86859130859375, 0.906829833984375, 0.945068359375, 0.983306884765625, 1.02154541015625, 1.059783935546875, 1.0980224609375, 1.136260986328125, 1.17449951171875, 1.212738037109375, 1.2509765625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 1.0, 5.0, 6.0, 9.0, 8.0, 13.0, 18.0, 20.0, 31.0, 26.0, 43.0, 74.0, 96.0, 126.0, 121.0, 105.0, 70.0, 48.0, 40.0, 27.0, 25.0, 19.0, 11.0, 12.0, 8.0, 5.0, 5.0, 4.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010460317134857178, -0.001014411449432373, -0.0009827911853790283, -0.0009511709213256836, -0.0009195506572723389, -0.0008879303932189941, -0.0008563101291656494, -0.0008246898651123047, -0.00079306960105896, -0.0007614493370056152, -0.0007298290729522705, -0.0006982088088989258, -0.0006665885448455811, -0.0006349682807922363, -0.0006033480167388916, -0.0005717277526855469, -0.0005401074886322021, -0.0005084872245788574, -0.0004768669605255127, -0.00044524669647216797, -0.00041362643241882324, -0.0003820061683654785, -0.0003503859043121338, -0.00031876564025878906, -0.00028714537620544434, -0.0002555251121520996, -0.00022390484809875488, -0.00019228458404541016, -0.00016066431999206543, -0.0001290440559387207, -9.742379188537598e-05, -6.580352783203125e-05, -3.4183263778686523e-05, -2.562999725341797e-06, 2.905726432800293e-05, 6.0677528381347656e-05, 9.229779243469238e-05, 0.0001239180564880371, 0.00015553832054138184, 0.00018715858459472656, 0.0002187788486480713, 0.000250399112701416, 0.00028201937675476074, 0.00031363964080810547, 0.0003452599048614502, 0.0003768801689147949, 0.00040850043296813965, 0.0004401206970214844, 0.0004717409610748291, 0.0005033612251281738, 0.0005349814891815186, 0.0005666017532348633, 0.000598222017288208, 0.0006298422813415527, 0.0006614625453948975, 0.0006930828094482422, 0.0007247030735015869, 0.0007563233375549316, 0.0007879436016082764, 0.0008195638656616211, 0.0008511841297149658, 0.0008828043937683105, 0.0009144246578216553, 0.000946044921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 7.0, 16.0, 19.0, 19.0, 22.0, 27.0, 46.0, 77.0, 112.0, 168.0, 394.0, 1831.0, 1027074.0, 17498.0, 567.0, 230.0, 144.0, 79.0, 45.0, 37.0, 26.0, 22.0, 12.0, 9.0, 10.0, 6.0, 8.0, 9.0, 2.0, 1.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0209197998046875, -0.020259857177734375, -0.01959991455078125, -0.018939971923828125, -0.018280029296875, -0.017620086669921875, -0.01696014404296875, -0.016300201416015625, -0.0156402587890625, -0.014980316162109375, -0.01432037353515625, -0.013660430908203125, -0.01300048828125, -0.012340545654296875, -0.01168060302734375, -0.011020660400390625, -0.0103607177734375, -0.009700775146484375, -0.00904083251953125, -0.008380889892578125, -0.007720947265625, -0.007061004638671875, -0.00640106201171875, -0.005741119384765625, -0.0050811767578125, -0.004421234130859375, -0.00376129150390625, -0.003101348876953125, -0.00244140625, -0.001781463623046875, -0.00112152099609375, -0.000461578369140625, 0.0001983642578125, 0.000858306884765625, 0.00151824951171875, 0.002178192138671875, 0.002838134765625, 0.003498077392578125, 0.00415802001953125, 0.004817962646484375, 0.0054779052734375, 0.006137847900390625, 0.00679779052734375, 0.007457733154296875, 0.00811767578125, 0.008777618408203125, 0.00943756103515625, 0.010097503662109375, 0.0107574462890625, 0.011417388916015625, 0.01207733154296875, 0.012737274169921875, 0.013397216796875, 0.014057159423828125, 0.01471710205078125, 0.015377044677734375, 0.0160369873046875, 0.016696929931640625, 0.01735687255859375, 0.018016815185546875, 0.0186767578125, 0.019336700439453125, 0.01999664306640625, 0.020656585693359375, 0.0213165283203125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 17.0, 19.0, 36.0, 35.0, 56.0, 76.0, 99.0, 146.0, 150.0, 114.0, 85.0, 54.0, 31.0, 36.0, 19.0, 14.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005531213246285915, -0.0005389315774664283, -0.000524741830304265, -0.0005105520831421018, -0.0004963623359799385, -0.00048217258881777525, -0.000467982841655612, -0.00045379309449344873, -0.0004396033473312855, -0.0004254136001691222, -0.00041122385300695896, -0.0003970341058447957, -0.00038284435868263245, -0.0003686546115204692, -0.00035446486435830593, -0.0003402751171961427, -0.0003260853700339794, -0.00031189562287181616, -0.0002977058757096529, -0.00028351612854748964, -0.0002693263813853264, -0.00025513663422316313, -0.00024094688706099987, -0.0002267571398988366, -0.0002125673636328429, -0.00019837761647067964, -0.00018418786930851638, -0.00016999812214635313, -0.00015580837498418987, -0.0001416186278220266, -0.00012742888065986335, -0.00011323912622174248, -9.904938633553684e-05, -8.485963917337358e-05, -7.066989201121032e-05, -5.648014121106826e-05, -4.2290394048905e-05, -2.8100643248762935e-05, -1.3910896086599678e-05, 2.788510755635798e-07, 1.4468598237726837e-05, 2.8658345399890095e-05, 4.284809256205335e-05, 5.703784336219542e-05, 7.122759416233748e-05, 8.541734132450074e-05, 9.9607088486664e-05, 0.00011379683564882725, 0.0001279865828109905, 0.00014217632997315377, 0.00015636607713531703, 0.00017055582429748029, 0.00018474557145964354, 0.00019893533317372203, 0.00021312508033588529, 0.00022731482749804854, 0.0002415045746602118, 0.00025569432182237506, 0.0002698840689845383, 0.0002840738161467016, 0.00029826356330886483, 0.0003124533104710281, 0.00032664305763319135, 0.0003408328047953546, 0.00035502255195751786]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 9.0, 7.0, 3.0, 5.0, 10.0, 16.0, 16.0, 14.0, 15.0, 16.0, 19.0, 17.0, 24.0, 25.0, 31.0, 23.0, 29.0, 39.0, 29.0, 38.0, 47.0, 44.0, 30.0, 44.0, 41.0, 30.0, 39.0, 35.0, 36.0, 41.0, 31.0, 35.0, 24.0, 25.0, 16.0, 15.0, 21.0, 12.0, 11.0, 7.0, 9.0, 7.0, 8.0, 2.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003560185432434082, -0.00034403055906295776, -0.0003320425748825073, -0.0003200545907020569, -0.00030806660652160645, -0.000296078622341156, -0.00028409063816070557, -0.0002721026539802551, -0.0002601146697998047, -0.00024812668561935425, -0.0002361387014389038, -0.00022415071725845337, -0.00021216273307800293, -0.0002001747488975525, -0.00018818676471710205, -0.0001761987805366516, -0.00016421079635620117, -0.00015222281217575073, -0.0001402348279953003, -0.00012824684381484985, -0.00011625885963439941, -0.00010427087545394897, -9.228289127349854e-05, -8.02949070930481e-05, -6.830692291259766e-05, -5.631893873214722e-05, -4.433095455169678e-05, -3.234297037124634e-05, -2.03549861907959e-05, -8.367002010345459e-06, 3.6209821701049805e-06, 1.560896635055542e-05, 2.759695053100586e-05, 3.95849347114563e-05, 5.157291889190674e-05, 6.356090307235718e-05, 7.554888725280762e-05, 8.753687143325806e-05, 9.95248556137085e-05, 0.00011151283979415894, 0.00012350082397460938, 0.00013548880815505981, 0.00014747679233551025, 0.0001594647765159607, 0.00017145276069641113, 0.00018344074487686157, 0.000195428729057312, 0.00020741671323776245, 0.0002194046974182129, 0.00023139268159866333, 0.00024338066577911377, 0.0002553686499595642, 0.00026735663414001465, 0.0002793446183204651, 0.00029133260250091553, 0.00030332058668136597, 0.0003153085708618164, 0.00032729655504226685, 0.0003392845392227173, 0.0003512725234031677, 0.00036326050758361816, 0.0003752484917640686, 0.00038723647594451904, 0.0003992244601249695, 0.0004112124443054199]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 10.0, 8.0, 12.0, 11.0, 15.0, 14.0, 8.0, 20.0, 25.0, 18.0, 23.0, 34.0, 33.0, 45.0, 34.0, 37.0, 48.0, 45.0, 44.0, 37.0, 50.0, 42.0, 40.0, 38.0, 34.0, 29.0, 26.0, 23.0, 30.0, 27.0, 22.0, 14.0, 17.0, 15.0, 8.0, 16.0, 11.0, 3.0, 7.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.65191650390625, -4.4991455078125, -4.34637451171875, -4.193603515625, -4.04083251953125, -3.8880615234375, -3.73529052734375, -3.58251953125, -3.42974853515625, -3.2769775390625, -3.12420654296875, -2.971435546875, -2.81866455078125, -2.6658935546875, -2.51312255859375, -2.3603515625, -2.20758056640625, -2.0548095703125, -1.90203857421875, -1.749267578125, -1.59649658203125, -1.4437255859375, -1.29095458984375, -1.13818359375, -0.98541259765625, -0.8326416015625, -0.67987060546875, -0.527099609375, -0.37432861328125, -0.2215576171875, -0.06878662109375, 0.083984375, 0.23675537109375, 0.3895263671875, 0.54229736328125, 0.695068359375, 0.84783935546875, 1.0006103515625, 1.15338134765625, 1.30615234375, 1.45892333984375, 1.6116943359375, 1.76446533203125, 1.917236328125, 2.07000732421875, 2.2227783203125, 2.37554931640625, 2.5283203125, 2.68109130859375, 2.8338623046875, 2.98663330078125, 3.139404296875, 3.29217529296875, 3.4449462890625, 3.59771728515625, 3.75048828125, 3.90325927734375, 4.0560302734375, 4.20880126953125, 4.361572265625, 4.51434326171875, 4.6671142578125, 4.81988525390625, 4.97265625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 10.0, 13.0, 22.0, 30.0, 27.0, 37.0, 40.0, 57.0, 74.0, 102.0, 140.0, 205.0, 397.0, 909.0, 2095.0, 5471.0, 14438.0, 39633.0, 106753.0, 284194.0, 368092.0, 141546.0, 52319.0, 19559.0, 7141.0, 2733.0, 1144.0, 478.0, 253.0, 178.0, 82.0, 80.0, 58.0, 58.0, 35.0, 33.0, 27.0, 15.0, 20.0, 14.0, 9.0, 5.0, 7.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.9490966796875, -4.784912109375, -4.6207275390625, -4.45654296875, -4.2923583984375, -4.128173828125, -3.9639892578125, -3.7998046875, -3.6356201171875, -3.471435546875, -3.3072509765625, -3.14306640625, -2.9788818359375, -2.814697265625, -2.6505126953125, -2.486328125, -2.3221435546875, -2.157958984375, -1.9937744140625, -1.82958984375, -1.6654052734375, -1.501220703125, -1.3370361328125, -1.1728515625, -1.0086669921875, -0.844482421875, -0.6802978515625, -0.51611328125, -0.3519287109375, -0.187744140625, -0.0235595703125, 0.140625, 0.3048095703125, 0.468994140625, 0.6331787109375, 0.79736328125, 0.9615478515625, 1.125732421875, 1.2899169921875, 1.4541015625, 1.6182861328125, 1.782470703125, 1.9466552734375, 2.11083984375, 2.2750244140625, 2.439208984375, 2.6033935546875, 2.767578125, 2.9317626953125, 3.095947265625, 3.2601318359375, 3.42431640625, 3.5885009765625, 3.752685546875, 3.9168701171875, 4.0810546875, 4.2452392578125, 4.409423828125, 4.5736083984375, 4.73779296875, 4.9019775390625, 5.066162109375, 5.2303466796875, 5.39453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 10.0, 18.0, 19.0, 23.0, 20.0, 23.0, 27.0, 26.0, 33.0, 31.0, 39.0, 36.0, 47.0, 90.0, 149.0, 1531.0, 341.0, 117.0, 73.0, 45.0, 39.0, 50.0, 44.0, 26.0, 39.0, 27.0, 15.0, 17.0, 17.0, 16.0, 10.0, 7.0, 6.0, 2.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.171875, -14.662353515625, -14.15283203125, -13.643310546875, -13.1337890625, -12.624267578125, -12.11474609375, -11.605224609375, -11.095703125, -10.586181640625, -10.07666015625, -9.567138671875, -9.0576171875, -8.548095703125, -8.03857421875, -7.529052734375, -7.01953125, -6.510009765625, -6.00048828125, -5.490966796875, -4.9814453125, -4.471923828125, -3.96240234375, -3.452880859375, -2.943359375, -2.433837890625, -1.92431640625, -1.414794921875, -0.9052734375, -0.395751953125, 0.11376953125, 0.623291015625, 1.1328125, 1.642333984375, 2.15185546875, 2.661376953125, 3.1708984375, 3.680419921875, 4.18994140625, 4.699462890625, 5.208984375, 5.718505859375, 6.22802734375, 6.737548828125, 7.2470703125, 7.756591796875, 8.26611328125, 8.775634765625, 9.28515625, 9.794677734375, 10.30419921875, 10.813720703125, 11.3232421875, 11.832763671875, 12.34228515625, 12.851806640625, 13.361328125, 13.870849609375, 14.38037109375, 14.889892578125, 15.3994140625, 15.908935546875, 16.41845703125, 16.927978515625, 17.4375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 10.0, 8.0, 13.0, 17.0, 34.0, 34.0, 63.0, 80.0, 146.0, 263.0, 664.0, 2211.0, 3052158.0, 87672.0, 1258.0, 428.0, 228.0, 134.0, 101.0, 49.0, 35.0, 20.0, 20.0, 11.0, 9.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.4375, -76.048828125, -73.66015625, -71.271484375, -68.8828125, -66.494140625, -64.10546875, -61.716796875, -59.328125, -56.939453125, -54.55078125, -52.162109375, -49.7734375, -47.384765625, -44.99609375, -42.607421875, -40.21875, -37.830078125, -35.44140625, -33.052734375, -30.6640625, -28.275390625, -25.88671875, -23.498046875, -21.109375, -18.720703125, -16.33203125, -13.943359375, -11.5546875, -9.166015625, -6.77734375, -4.388671875, -2.0, 0.388671875, 2.77734375, 5.166015625, 7.5546875, 9.943359375, 12.33203125, 14.720703125, 17.109375, 19.498046875, 21.88671875, 24.275390625, 26.6640625, 29.052734375, 31.44140625, 33.830078125, 36.21875, 38.607421875, 40.99609375, 43.384765625, 45.7734375, 48.162109375, 50.55078125, 52.939453125, 55.328125, 57.716796875, 60.10546875, 62.494140625, 64.8828125, 67.271484375, 69.66015625, 72.048828125, 74.4375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 12.0, 43.0, 177.0, 315.0, 282.0, 141.0, 35.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.007919311523438, -26.525442123413086, -25.042964935302734, -23.560487747192383, -22.07801055908203, -20.59553337097168, -19.113056182861328, -17.63058090209961, -16.148101806640625, -14.665624618530273, -13.183147430419922, -11.70067024230957, -10.218193054199219, -8.735715866088867, -7.253239631652832, -5.7707624435424805, -4.288286209106445, -2.8058090209960938, -1.3233320713043213, 0.15914487838745117, 1.6416220664978027, 3.1240992546081543, 4.606575965881348, 6.089053153991699, 7.571530342102051, 9.054007530212402, 10.536484718322754, 12.018960952758789, 13.50143814086914, 14.983915328979492, 16.466392517089844, 17.948869705200195, 19.431346893310547, 20.9138240814209, 22.39630126953125, 23.8787784576416, 25.361255645751953, 26.843732833862305, 28.326210021972656, 29.808685302734375, 31.29116439819336, 32.77363967895508, 34.25611877441406, 35.73859405517578, 37.221073150634766, 38.703548431396484, 40.18602752685547, 41.66850280761719, 43.150978088378906, 44.633453369140625, 46.11593246459961, 47.59840774536133, 49.08088684082031, 50.56336212158203, 52.045841217041016, 53.528316497802734, 55.01079559326172, 56.49327087402344, 57.97574996948242, 59.45822525024414, 60.940704345703125, 62.423179626464844, 63.90565872192383, 65.38813781738281, 66.87061309814453]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 6.0, 14.0, 12.0, 16.0, 16.0, 17.0, 22.0, 29.0, 23.0, 19.0, 31.0, 36.0, 26.0, 40.0, 42.0, 41.0, 39.0, 45.0, 46.0, 44.0, 35.0, 41.0, 40.0, 36.0, 20.0, 31.0, 29.0, 33.0, 17.0, 24.0, 29.0, 13.0, 4.0, 12.0, 15.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.497459411621094, -36.32136917114258, -35.14528274536133, -33.96919250488281, -32.79310607910156, -31.617015838623047, -30.44092559814453, -29.26483726501465, -28.088748931884766, -26.912660598754883, -25.736572265625, -24.560482025146484, -23.3843936920166, -22.20830535888672, -21.032215118408203, -19.85612678527832, -18.680038452148438, -17.503950119018555, -16.327861785888672, -15.151771545410156, -13.975683212280273, -12.79959487915039, -11.623505592346191, -10.447416305541992, -9.27132797241211, -8.095239639282227, -6.919150352478027, -5.743061542510986, -4.566972732543945, -3.3908839225769043, -2.2147951126098633, -1.038705825805664, 0.13738250732421875, 1.3134713172912598, 2.489560127258301, 3.665648937225342, 4.841737747192383, 6.017826557159424, 7.193915367126465, 8.370004653930664, 9.546092987060547, 10.72218132019043, 11.898270606994629, 13.074359893798828, 14.250448226928711, 15.426536560058594, 16.60262680053711, 17.778715133666992, 18.954803466796875, 20.130891799926758, 21.30698013305664, 22.483070373535156, 23.65915870666504, 24.835247039794922, 26.011337280273438, 27.18742561340332, 28.363513946533203, 29.539602279663086, 30.71569061279297, 31.891780853271484, 33.06787109375, 34.24395751953125, 35.420047760009766, 36.59613800048828, 37.77222442626953]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 6.0, 10.0, 10.0, 12.0, 14.0, 11.0, 17.0, 18.0, 23.0, 29.0, 34.0, 22.0, 37.0, 29.0, 32.0, 34.0, 42.0, 43.0, 40.0, 41.0, 39.0, 27.0, 38.0, 39.0, 29.0, 32.0, 27.0, 23.0, 24.0, 28.0, 19.0, 25.0, 25.0, 14.0, 19.0, 11.0, 10.0, 6.0, 8.0, 7.0, 1.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.953125, -4.79815673828125, -4.6431884765625, -4.48822021484375, -4.333251953125, -4.17828369140625, -4.0233154296875, -3.86834716796875, -3.71337890625, -3.55841064453125, -3.4034423828125, -3.24847412109375, -3.093505859375, -2.93853759765625, -2.7835693359375, -2.62860107421875, -2.4736328125, -2.31866455078125, -2.1636962890625, -2.00872802734375, -1.853759765625, -1.69879150390625, -1.5438232421875, -1.38885498046875, -1.23388671875, -1.07891845703125, -0.9239501953125, -0.76898193359375, -0.614013671875, -0.45904541015625, -0.3040771484375, -0.14910888671875, 0.005859375, 0.16082763671875, 0.3157958984375, 0.47076416015625, 0.625732421875, 0.78070068359375, 0.9356689453125, 1.09063720703125, 1.24560546875, 1.40057373046875, 1.5555419921875, 1.71051025390625, 1.865478515625, 2.02044677734375, 2.1754150390625, 2.33038330078125, 2.4853515625, 2.64031982421875, 2.7952880859375, 2.95025634765625, 3.105224609375, 3.26019287109375, 3.4151611328125, 3.57012939453125, 3.72509765625, 3.88006591796875, 4.0350341796875, 4.19000244140625, 4.344970703125, 4.49993896484375, 4.6549072265625, 4.80987548828125, 4.96484375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 4.0, 7.0, 14.0, 13.0, 14.0, 21.0, 18.0, 42.0, 31.0, 34.0, 58.0, 72.0, 62.0, 96.0, 120.0, 148.0, 248.0, 647.0, 3751.0, 81023.0, 2138497.0, 1905398.0, 58982.0, 3386.0, 625.0, 218.0, 130.0, 119.0, 80.0, 57.0, 56.0, 41.0, 48.0, 41.0, 30.0, 22.0, 25.0, 21.0, 19.0, 4.0, 8.0, 5.0, 6.0, 10.0, 7.0, 1.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0], "bins": [-16.125, -15.6358642578125, -15.146728515625, -14.6575927734375, -14.16845703125, -13.6793212890625, -13.190185546875, -12.7010498046875, -12.2119140625, -11.7227783203125, -11.233642578125, -10.7445068359375, -10.25537109375, -9.7662353515625, -9.277099609375, -8.7879638671875, -8.298828125, -7.8096923828125, -7.320556640625, -6.8314208984375, -6.34228515625, -5.8531494140625, -5.364013671875, -4.8748779296875, -4.3857421875, -3.8966064453125, -3.407470703125, -2.9183349609375, -2.42919921875, -1.9400634765625, -1.450927734375, -0.9617919921875, -0.47265625, 0.0164794921875, 0.505615234375, 0.9947509765625, 1.48388671875, 1.9730224609375, 2.462158203125, 2.9512939453125, 3.4404296875, 3.9295654296875, 4.418701171875, 4.9078369140625, 5.39697265625, 5.8861083984375, 6.375244140625, 6.8643798828125, 7.353515625, 7.8426513671875, 8.331787109375, 8.8209228515625, 9.31005859375, 9.7991943359375, 10.288330078125, 10.7774658203125, 11.2666015625, 11.7557373046875, 12.244873046875, 12.7340087890625, 13.22314453125, 13.7122802734375, 14.201416015625, 14.6905517578125, 15.1796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 11.0, 8.0, 18.0, 21.0, 34.0, 51.0, 48.0, 70.0, 103.0, 165.0, 220.0, 313.0, 406.0, 490.0, 536.0, 415.0, 314.0, 219.0, 175.0, 126.0, 69.0, 61.0, 40.0, 40.0, 26.0, 16.0, 20.0, 9.0, 5.0, 8.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0], "bins": [-13.6796875, -13.3472900390625, -13.014892578125, -12.6824951171875, -12.35009765625, -12.0177001953125, -11.685302734375, -11.3529052734375, -11.0205078125, -10.6881103515625, -10.355712890625, -10.0233154296875, -9.69091796875, -9.3585205078125, -9.026123046875, -8.6937255859375, -8.361328125, -8.0289306640625, -7.696533203125, -7.3641357421875, -7.03173828125, -6.6993408203125, -6.366943359375, -6.0345458984375, -5.7021484375, -5.3697509765625, -5.037353515625, -4.7049560546875, -4.37255859375, -4.0401611328125, -3.707763671875, -3.3753662109375, -3.04296875, -2.7105712890625, -2.378173828125, -2.0457763671875, -1.71337890625, -1.3809814453125, -1.048583984375, -0.7161865234375, -0.3837890625, -0.0513916015625, 0.281005859375, 0.6134033203125, 0.94580078125, 1.2781982421875, 1.610595703125, 1.9429931640625, 2.275390625, 2.6077880859375, 2.940185546875, 3.2725830078125, 3.60498046875, 3.9373779296875, 4.269775390625, 4.6021728515625, 4.9345703125, 5.2669677734375, 5.599365234375, 5.9317626953125, 6.26416015625, 6.5965576171875, 6.928955078125, 7.2613525390625, 7.59375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 9.0, 1.0, 12.0, 12.0, 14.0, 19.0, 15.0, 49.0, 58.0, 73.0, 106.0, 154.0, 219.0, 349.0, 469.0, 1420.0, 970654.0, 3216737.0, 2201.0, 537.0, 351.0, 262.0, 168.0, 124.0, 73.0, 60.0, 34.0, 37.0, 18.0, 14.0, 8.0, 12.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.875, -42.052734375, -40.23046875, -38.408203125, -36.5859375, -34.763671875, -32.94140625, -31.119140625, -29.296875, -27.474609375, -25.65234375, -23.830078125, -22.0078125, -20.185546875, -18.36328125, -16.541015625, -14.71875, -12.896484375, -11.07421875, -9.251953125, -7.4296875, -5.607421875, -3.78515625, -1.962890625, -0.140625, 1.681640625, 3.50390625, 5.326171875, 7.1484375, 8.970703125, 10.79296875, 12.615234375, 14.4375, 16.259765625, 18.08203125, 19.904296875, 21.7265625, 23.548828125, 25.37109375, 27.193359375, 29.015625, 30.837890625, 32.66015625, 34.482421875, 36.3046875, 38.126953125, 39.94921875, 41.771484375, 43.59375, 45.416015625, 47.23828125, 49.060546875, 50.8828125, 52.705078125, 54.52734375, 56.349609375, 58.171875, 59.994140625, 61.81640625, 63.638671875, 65.4609375, 67.283203125, 69.10546875, 70.927734375, 72.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 5.0, 37.0, 73.0, 142.0, 174.0, 195.0, 149.0, 102.0, 72.0, 28.0, 18.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.84767532348633, -57.087432861328125, -55.32719039916992, -53.56694793701172, -51.80670928955078, -50.04646682739258, -48.286224365234375, -46.52598190307617, -44.76573944091797, -43.005496978759766, -41.24525451660156, -39.485015869140625, -37.72477340698242, -35.96453094482422, -34.204288482666016, -32.44404602050781, -30.683805465698242, -28.92356300354004, -27.16332244873047, -25.403079986572266, -23.642837524414062, -21.88259506225586, -20.12235450744629, -18.362112045288086, -16.601871490478516, -14.841629981994629, -13.081387519836426, -11.321146011352539, -9.560903549194336, -7.800662040710449, -6.0404205322265625, -4.280178070068359, -2.5199356079101562, -0.7596937417984009, 1.0005481243133545, 2.7607898712158203, 4.521031856536865, 6.28127384185791, 8.041515350341797, 9.8017578125, 11.561999320983887, 13.322240829467773, 15.082483291625977, 16.842723846435547, 18.60296630859375, 20.363208770751953, 22.123451232910156, 23.88369369506836, 25.64393424987793, 27.404176712036133, 29.164417266845703, 30.924659729003906, 32.68490219116211, 34.44514465332031, 36.20538330078125, 37.96562957763672, 39.725868225097656, 41.48611068725586, 43.24635314941406, 45.006591796875, 46.7668342590332, 48.527076721191406, 50.28731918334961, 52.04756164550781, 53.807804107666016]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 3.0, 6.0, 8.0, 5.0, 6.0, 14.0, 14.0, 19.0, 23.0, 18.0, 19.0, 35.0, 22.0, 43.0, 29.0, 49.0, 38.0, 38.0, 45.0, 39.0, 43.0, 43.0, 44.0, 49.0, 40.0, 32.0, 26.0, 24.0, 35.0, 28.0, 27.0, 14.0, 22.0, 19.0, 15.0, 16.0, 8.0, 7.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.35517883300781, -31.319854736328125, -30.284530639648438, -29.24920654296875, -28.213882446289062, -27.178558349609375, -26.143234252929688, -25.10791015625, -24.072586059570312, -23.037261962890625, -22.001937866210938, -20.96661376953125, -19.931289672851562, -18.895965576171875, -17.860641479492188, -16.8253173828125, -15.78999137878418, -14.754667282104492, -13.719343185424805, -12.684019088745117, -11.64869499206543, -10.613370895385742, -9.578045845031738, -8.54272174835205, -7.507397651672363, -6.472073554992676, -5.436749458312988, -4.401424884796143, -3.366100788116455, -2.3307766914367676, -1.2954521179199219, -0.2601280212402344, 0.7751960754394531, 1.8105202913284302, 2.8458445072174072, 3.881168842315674, 4.916492938995361, 5.951817035675049, 6.9871416091918945, 8.022465705871582, 9.05778980255127, 10.093113899230957, 11.128437995910645, 12.163763046264648, 13.199087142944336, 14.234411239624023, 15.269735336303711, 16.3050594329834, 17.340383529663086, 18.375707626342773, 19.41103172302246, 20.44635581970215, 21.481679916381836, 22.517004013061523, 23.552330017089844, 24.58765411376953, 25.62297821044922, 26.658302307128906, 27.693626403808594, 28.72895050048828, 29.76427459716797, 30.799598693847656, 31.834922790527344, 32.87024688720703, 33.90557098388672]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 16.0, 15.0, 15.0, 17.0, 20.0, 23.0, 32.0, 31.0, 33.0, 29.0, 48.0, 47.0, 39.0, 55.0, 35.0, 64.0, 44.0, 41.0, 44.0, 34.0, 32.0, 22.0, 38.0, 29.0, 21.0, 19.0, 19.0, 23.0, 13.0, 17.0, 20.0, 9.0, 7.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.71435546875, -5.5263671875, -5.33837890625, -5.150390625, -4.96240234375, -4.7744140625, -4.58642578125, -4.3984375, -4.21044921875, -4.0224609375, -3.83447265625, -3.646484375, -3.45849609375, -3.2705078125, -3.08251953125, -2.89453125, -2.70654296875, -2.5185546875, -2.33056640625, -2.142578125, -1.95458984375, -1.7666015625, -1.57861328125, -1.390625, -1.20263671875, -1.0146484375, -0.82666015625, -0.638671875, -0.45068359375, -0.2626953125, -0.07470703125, 0.11328125, 0.30126953125, 0.4892578125, 0.67724609375, 0.865234375, 1.05322265625, 1.2412109375, 1.42919921875, 1.6171875, 1.80517578125, 1.9931640625, 2.18115234375, 2.369140625, 2.55712890625, 2.7451171875, 2.93310546875, 3.12109375, 3.30908203125, 3.4970703125, 3.68505859375, 3.873046875, 4.06103515625, 4.2490234375, 4.43701171875, 4.625, 4.81298828125, 5.0009765625, 5.18896484375, 5.376953125, 5.56494140625, 5.7529296875, 5.94091796875, 6.12890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 16.0, 21.0, 30.0, 38.0, 75.0, 89.0, 148.0, 207.0, 333.0, 476.0, 735.0, 1115.0, 1641.0, 2467.0, 3497.0, 5220.0, 7608.0, 11087.0, 16476.0, 24441.0, 37919.0, 61873.0, 109091.0, 269082.0, 225652.0, 101573.0, 58652.0, 36025.0, 23784.0, 15793.0, 10618.0, 7294.0, 5023.0, 3407.0, 2305.0, 1556.0, 1032.0, 722.0, 487.0, 312.0, 199.0, 140.0, 97.0, 65.0, 45.0, 24.0, 19.0, 20.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.1767578125, -1.139923095703125, -1.10308837890625, -1.066253662109375, -1.0294189453125, -0.992584228515625, -0.95574951171875, -0.918914794921875, -0.882080078125, -0.845245361328125, -0.80841064453125, -0.771575927734375, -0.7347412109375, -0.697906494140625, -0.66107177734375, -0.624237060546875, -0.58740234375, -0.550567626953125, -0.51373291015625, -0.476898193359375, -0.4400634765625, -0.403228759765625, -0.36639404296875, -0.329559326171875, -0.292724609375, -0.255889892578125, -0.21905517578125, -0.182220458984375, -0.1453857421875, -0.108551025390625, -0.07171630859375, -0.034881591796875, 0.001953125, 0.038787841796875, 0.07562255859375, 0.112457275390625, 0.1492919921875, 0.186126708984375, 0.22296142578125, 0.259796142578125, 0.296630859375, 0.333465576171875, 0.37030029296875, 0.407135009765625, 0.4439697265625, 0.480804443359375, 0.51763916015625, 0.554473876953125, 0.59130859375, 0.628143310546875, 0.66497802734375, 0.701812744140625, 0.7386474609375, 0.775482177734375, 0.81231689453125, 0.849151611328125, 0.885986328125, 0.922821044921875, 0.95965576171875, 0.996490478515625, 1.0333251953125, 1.070159912109375, 1.10699462890625, 1.143829345703125, 1.1806640625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 11.0, 11.0, 6.0, 15.0, 12.0, 19.0, 20.0, 19.0, 24.0, 23.0, 32.0, 36.0, 24.0, 36.0, 27.0, 28.0, 21.0, 36.0, 44.0, 1061.0, 31.0, 39.0, 45.0, 30.0, 38.0, 26.0, 37.0, 29.0, 22.0, 18.0, 27.0, 26.0, 16.0, 16.0, 16.0, 12.0, 8.0, 9.0, 11.0, 8.0, 8.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-3.189453125, -3.0904541015625, -2.991455078125, -2.8924560546875, -2.79345703125, -2.6944580078125, -2.595458984375, -2.4964599609375, -2.3974609375, -2.2984619140625, -2.199462890625, -2.1004638671875, -2.00146484375, -1.9024658203125, -1.803466796875, -1.7044677734375, -1.60546875, -1.5064697265625, -1.407470703125, -1.3084716796875, -1.20947265625, -1.1104736328125, -1.011474609375, -0.9124755859375, -0.8134765625, -0.7144775390625, -0.615478515625, -0.5164794921875, -0.41748046875, -0.3184814453125, -0.219482421875, -0.1204833984375, -0.021484375, 0.0775146484375, 0.176513671875, 0.2755126953125, 0.37451171875, 0.4735107421875, 0.572509765625, 0.6715087890625, 0.7705078125, 0.8695068359375, 0.968505859375, 1.0675048828125, 1.16650390625, 1.2655029296875, 1.364501953125, 1.4635009765625, 1.5625, 1.6614990234375, 1.760498046875, 1.8594970703125, 1.95849609375, 2.0574951171875, 2.156494140625, 2.2554931640625, 2.3544921875, 2.4534912109375, 2.552490234375, 2.6514892578125, 2.75048828125, 2.8494873046875, 2.948486328125, 3.0474853515625, 3.146484375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 12.0, 13.0, 18.0, 32.0, 40.0, 52.0, 66.0, 100.0, 145.0, 225.0, 329.0, 490.0, 710.0, 1110.0, 1573.0, 2559.0, 3764.0, 5677.0, 8988.0, 14009.0, 22290.0, 37018.0, 62319.0, 108298.0, 1323308.0, 244511.0, 104416.0, 59297.0, 35363.0, 21661.0, 13663.0, 8726.0, 5518.0, 3579.0, 2458.0, 1590.0, 1019.0, 707.0, 475.0, 335.0, 220.0, 137.0, 94.0, 72.0, 49.0, 20.0, 32.0, 12.0, 13.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.28125, -1.2411651611328125, -1.201080322265625, -1.1609954833984375, -1.12091064453125, -1.0808258056640625, -1.040740966796875, -1.0006561279296875, -0.9605712890625, -0.9204864501953125, -0.880401611328125, -0.8403167724609375, -0.80023193359375, -0.7601470947265625, -0.720062255859375, -0.6799774169921875, -0.639892578125, -0.5998077392578125, -0.559722900390625, -0.5196380615234375, -0.47955322265625, -0.4394683837890625, -0.399383544921875, -0.3592987060546875, -0.3192138671875, -0.2791290283203125, -0.239044189453125, -0.1989593505859375, -0.15887451171875, -0.1187896728515625, -0.078704833984375, -0.0386199951171875, 0.00146484375, 0.0415496826171875, 0.081634521484375, 0.1217193603515625, 0.16180419921875, 0.2018890380859375, 0.241973876953125, 0.2820587158203125, 0.3221435546875, 0.3622283935546875, 0.402313232421875, 0.4423980712890625, 0.48248291015625, 0.5225677490234375, 0.562652587890625, 0.6027374267578125, 0.642822265625, 0.6829071044921875, 0.722991943359375, 0.7630767822265625, 0.80316162109375, 0.8432464599609375, 0.883331298828125, 0.9234161376953125, 0.9635009765625, 1.0035858154296875, 1.043670654296875, 1.0837554931640625, 1.12384033203125, 1.1639251708984375, 1.204010009765625, 1.2440948486328125, 1.2841796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 11.0, 4.0, 5.0, 10.0, 7.0, 14.0, 10.0, 23.0, 13.0, 30.0, 24.0, 31.0, 32.0, 36.0, 53.0, 72.0, 74.0, 73.0, 75.0, 65.0, 60.0, 51.0, 29.0, 21.0, 36.0, 18.0, 22.0, 21.0, 6.0, 5.0, 15.0, 9.0, 7.0, 11.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.000698089599609375, -0.0006785765290260315, -0.000659063458442688, -0.0006395503878593445, -0.000620037317276001, -0.0006005242466926575, -0.000581011176109314, -0.0005614981055259705, -0.000541985034942627, -0.0005224719643592834, -0.0005029588937759399, -0.00048344582319259644, -0.00046393275260925293, -0.0004444196820259094, -0.0004249066114425659, -0.0004053935408592224, -0.0003858804702758789, -0.0003663673996925354, -0.0003468543291091919, -0.0003273412585258484, -0.0003078281879425049, -0.0002883151173591614, -0.00026880204677581787, -0.00024928897619247437, -0.00022977590560913086, -0.00021026283502578735, -0.00019074976444244385, -0.00017123669385910034, -0.00015172362327575684, -0.00013221055269241333, -0.00011269748210906982, -9.318441152572632e-05, -7.367134094238281e-05, -5.415827035903931e-05, -3.46451997756958e-05, -1.5132129192352295e-05, 4.380941390991211e-06, 2.3894011974334717e-05, 4.340708255767822e-05, 6.292015314102173e-05, 8.243322372436523e-05, 0.00010194629430770874, 0.00012145936489105225, 0.00014097243547439575, 0.00016048550605773926, 0.00017999857664108276, 0.00019951164722442627, 0.00021902471780776978, 0.00023853778839111328, 0.0002580508589744568, 0.0002775639295578003, 0.0002970770001411438, 0.0003165900707244873, 0.0003361031413078308, 0.0003556162118911743, 0.0003751292824745178, 0.00039464235305786133, 0.00041415542364120483, 0.00043366849422454834, 0.00045318156480789185, 0.00047269463539123535, 0.0004922077059745789, 0.0005117207765579224, 0.0005312338471412659, 0.0005507469177246094]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 7.0, 10.0, 4.0, 14.0, 6.0, 17.0, 12.0, 9.0, 18.0, 32.0, 29.0, 38.0, 43.0, 71.0, 88.0, 119.0, 210.0, 351.0, 1068.0, 50831.0, 988123.0, 5881.0, 604.0, 287.0, 188.0, 114.0, 88.0, 54.0, 56.0, 33.0, 27.0, 31.0, 18.0, 16.0, 16.0, 7.0, 10.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01131439208984375, -0.010900020599365234, -0.010485649108886719, -0.010071277618408203, -0.009656906127929688, -0.009242534637451172, -0.008828163146972656, -0.00841379165649414, -0.007999420166015625, -0.007585048675537109, -0.007170677185058594, -0.006756305694580078, -0.0063419342041015625, -0.005927562713623047, -0.005513191223144531, -0.005098819732666016, -0.0046844482421875, -0.004270076751708984, -0.0038557052612304688, -0.003441333770751953, -0.0030269622802734375, -0.002612590789794922, -0.0021982192993164062, -0.0017838478088378906, -0.001369476318359375, -0.0009551048278808594, -0.0005407333374023438, -0.00012636184692382812, 0.0002880096435546875, 0.0007023811340332031, 0.0011167526245117188, 0.0015311241149902344, 0.00194549560546875, 0.0023598670959472656, 0.0027742385864257812, 0.003188610076904297, 0.0036029815673828125, 0.004017353057861328, 0.004431724548339844, 0.004846096038818359, 0.005260467529296875, 0.005674839019775391, 0.006089210510253906, 0.006503582000732422, 0.0069179534912109375, 0.007332324981689453, 0.007746696472167969, 0.008161067962646484, 0.008575439453125, 0.008989810943603516, 0.009404182434082031, 0.009818553924560547, 0.010232925415039062, 0.010647296905517578, 0.011061668395996094, 0.01147603988647461, 0.011890411376953125, 0.01230478286743164, 0.012719154357910156, 0.013133525848388672, 0.013547897338867188, 0.013962268829345703, 0.014376640319824219, 0.014791011810302734, 0.01520538330078125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 13.0, 59.0, 255.0, 403.0, 209.0, 58.0, 13.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000501918257214129, -0.0004538766806945205, -0.000405835104174912, -0.00035779355675913393, -0.00030975198023952544, -0.00026171040371991694, -0.0002136688563041389, -0.0001656272797845304, -0.0001175857032649219, -6.954413402127102e-05, -2.1502564777620137e-05, 2.6538997190073133e-05, 7.458057370968163e-05, 0.00012262215022929013, 0.00017066369764506817, 0.00021870527416467667, 0.00026674685068428516, 0.00031478842720389366, 0.00036283000372350216, 0.0004108715511392802, 0.0004589131276588887, 0.0005069547332823277, 0.0005549962515942752, 0.0006030378281138837, 0.0006510794046334922, 0.0006991209811531007, 0.0007471625576727092, 0.0007952040759846568, 0.0008432456525042653, 0.0008912872290238738, 0.0009393288055434823, 0.0009873703820630908, 0.0010354118421673775, 0.001083453418686986, 0.0011314949952065945, 0.001179536571726203, 0.0012275781482458115, 0.00127561972476542, 0.0013236613012850285, 0.001371702877804637, 0.0014197444543242455, 0.001467786030843854, 0.0015158276073634624, 0.001563869183883071, 0.0016119107604026794, 0.001659952336922288, 0.0017079939134418964, 0.001756035489961505, 0.0018040769500657916, 0.0018521185265854, 0.0019001601031050086, 0.001948201679624617, 0.0019962431397289038, 0.0020442847162485123, 0.0020923262927681208, 0.0021403678692877293, 0.0021884094458073378, 0.0022364510223269463, 0.0022844925988465548, 0.0023325341753661633, 0.0023805757518857718, 0.0024286173284053802, 0.0024766589049249887, 0.0025247004814445972, 0.0025727420579642057]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 12.0, 11.0, 19.0, 15.0, 20.0, 17.0, 28.0, 21.0, 23.0, 32.0, 33.0, 47.0, 48.0, 40.0, 34.0, 47.0, 44.0, 37.0, 43.0, 42.0, 42.0, 46.0, 40.0, 44.0, 34.0, 25.0, 25.0, 22.0, 16.0, 15.0, 14.0, 8.0, 13.0, 8.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003611445426940918, -0.00034975167363882065, -0.0003383588045835495, -0.00032696593552827835, -0.0003155730664730072, -0.00030418019741773605, -0.0002927873283624649, -0.00028139445930719376, -0.0002700015902519226, -0.00025860872119665146, -0.0002472158521413803, -0.00023582298308610916, -0.000224430114030838, -0.00021303724497556686, -0.00020164437592029572, -0.00019025150686502457, -0.00017885863780975342, -0.00016746576875448227, -0.00015607289969921112, -0.00014468003064393997, -0.00013328716158866882, -0.00012189429253339767, -0.00011050142347812653, -9.910855442285538e-05, -8.771568536758423e-05, -7.632281631231308e-05, -6.492994725704193e-05, -5.353707820177078e-05, -4.2144209146499634e-05, -3.0751340091228485e-05, -1.9358471035957336e-05, -7.965601980686188e-06, 3.427267074584961e-06, 1.482013612985611e-05, 2.6213005185127258e-05, 3.760587424039841e-05, 4.8998743295669556e-05, 6.0391612350940704e-05, 7.178448140621185e-05, 8.3177350461483e-05, 9.457021951675415e-05, 0.0001059630885720253, 0.00011735595762729645, 0.0001287488266825676, 0.00014014169573783875, 0.0001515345647931099, 0.00016292743384838104, 0.0001743203029036522, 0.00018571317195892334, 0.0001971060410141945, 0.00020849891006946564, 0.00021989177912473679, 0.00023128464818000793, 0.00024267751723527908, 0.00025407038629055023, 0.0002654632553458214, 0.00027685612440109253, 0.0002882489934563637, 0.0002996418625116348, 0.000311034731566906, 0.0003224276006221771, 0.00033382046967744827, 0.0003452133387327194, 0.00035660620778799057, 0.0003679990768432617]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 16.0, 15.0, 15.0, 17.0, 20.0, 23.0, 32.0, 31.0, 33.0, 29.0, 48.0, 47.0, 39.0, 55.0, 35.0, 64.0, 44.0, 41.0, 44.0, 34.0, 32.0, 22.0, 38.0, 29.0, 21.0, 19.0, 19.0, 23.0, 13.0, 17.0, 20.0, 9.0, 7.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.71435546875, -5.5263671875, -5.33837890625, -5.150390625, -4.96240234375, -4.7744140625, -4.58642578125, -4.3984375, -4.21044921875, -4.0224609375, -3.83447265625, -3.646484375, -3.45849609375, -3.2705078125, -3.08251953125, -2.89453125, -2.70654296875, -2.5185546875, -2.33056640625, -2.142578125, -1.95458984375, -1.7666015625, -1.57861328125, -1.390625, -1.20263671875, -1.0146484375, -0.82666015625, -0.638671875, -0.45068359375, -0.2626953125, -0.07470703125, 0.11328125, 0.30126953125, 0.4892578125, 0.67724609375, 0.865234375, 1.05322265625, 1.2412109375, 1.42919921875, 1.6171875, 1.80517578125, 1.9931640625, 2.18115234375, 2.369140625, 2.55712890625, 2.7451171875, 2.93310546875, 3.12109375, 3.30908203125, 3.4970703125, 3.68505859375, 3.873046875, 4.06103515625, 4.2490234375, 4.43701171875, 4.625, 4.81298828125, 5.0009765625, 5.18896484375, 5.376953125, 5.56494140625, 5.7529296875, 5.94091796875, 6.12890625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 14.0, 14.0, 15.0, 23.0, 30.0, 37.0, 49.0, 71.0, 93.0, 149.0, 190.0, 335.0, 560.0, 1276.0, 6148.0, 54057.0, 604802.0, 341368.0, 32927.0, 3951.0, 1046.0, 470.0, 292.0, 154.0, 116.0, 87.0, 63.0, 45.0, 33.0, 29.0, 23.0, 19.0, 15.0, 9.0, 10.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.234375, -11.8507080078125, -11.467041015625, -11.0833740234375, -10.69970703125, -10.3160400390625, -9.932373046875, -9.5487060546875, -9.1650390625, -8.7813720703125, -8.397705078125, -8.0140380859375, -7.63037109375, -7.2467041015625, -6.863037109375, -6.4793701171875, -6.095703125, -5.7120361328125, -5.328369140625, -4.9447021484375, -4.56103515625, -4.1773681640625, -3.793701171875, -3.4100341796875, -3.0263671875, -2.6427001953125, -2.259033203125, -1.8753662109375, -1.49169921875, -1.1080322265625, -0.724365234375, -0.3406982421875, 0.04296875, 0.4266357421875, 0.810302734375, 1.1939697265625, 1.57763671875, 1.9613037109375, 2.344970703125, 2.7286376953125, 3.1123046875, 3.4959716796875, 3.879638671875, 4.2633056640625, 4.64697265625, 5.0306396484375, 5.414306640625, 5.7979736328125, 6.181640625, 6.5653076171875, 6.948974609375, 7.3326416015625, 7.71630859375, 8.0999755859375, 8.483642578125, 8.8673095703125, 9.2509765625, 9.6346435546875, 10.018310546875, 10.4019775390625, 10.78564453125, 11.1693115234375, 11.552978515625, 11.9366455078125, 12.3203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 9.0, 2.0, 6.0, 13.0, 8.0, 10.0, 12.0, 7.0, 15.0, 23.0, 24.0, 35.0, 28.0, 27.0, 39.0, 38.0, 65.0, 82.0, 129.0, 270.0, 1522.0, 198.0, 87.0, 63.0, 47.0, 39.0, 29.0, 32.0, 28.0, 25.0, 24.0, 18.0, 21.0, 18.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.896484375, -16.27734375, -15.658203125, -15.0390625, -14.419921875, -13.80078125, -13.181640625, -12.5625, -11.943359375, -11.32421875, -10.705078125, -10.0859375, -9.466796875, -8.84765625, -8.228515625, -7.609375, -6.990234375, -6.37109375, -5.751953125, -5.1328125, -4.513671875, -3.89453125, -3.275390625, -2.65625, -2.037109375, -1.41796875, -0.798828125, -0.1796875, 0.439453125, 1.05859375, 1.677734375, 2.296875, 2.916015625, 3.53515625, 4.154296875, 4.7734375, 5.392578125, 6.01171875, 6.630859375, 7.25, 7.869140625, 8.48828125, 9.107421875, 9.7265625, 10.345703125, 10.96484375, 11.583984375, 12.203125, 12.822265625, 13.44140625, 14.060546875, 14.6796875, 15.298828125, 15.91796875, 16.537109375, 17.15625, 17.775390625, 18.39453125, 19.013671875, 19.6328125, 20.251953125, 20.87109375, 21.490234375, 22.109375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 7.0, 13.0, 8.0, 14.0, 18.0, 26.0, 28.0, 36.0, 40.0, 48.0, 55.0, 60.0, 102.0, 161.0, 314.0, 702.0, 2784.0, 2777525.0, 360385.0, 1916.0, 549.0, 259.0, 165.0, 89.0, 74.0, 62.0, 57.0, 38.0, 30.0, 24.0, 14.0, 12.0, 23.0, 14.0, 14.0, 4.0, 5.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.8125, -62.90087890625, -60.9892578125, -59.07763671875, -57.166015625, -55.25439453125, -53.3427734375, -51.43115234375, -49.51953125, -47.60791015625, -45.6962890625, -43.78466796875, -41.873046875, -39.96142578125, -38.0498046875, -36.13818359375, -34.2265625, -32.31494140625, -30.4033203125, -28.49169921875, -26.580078125, -24.66845703125, -22.7568359375, -20.84521484375, -18.93359375, -17.02197265625, -15.1103515625, -13.19873046875, -11.287109375, -9.37548828125, -7.4638671875, -5.55224609375, -3.640625, -1.72900390625, 0.1826171875, 2.09423828125, 4.005859375, 5.91748046875, 7.8291015625, 9.74072265625, 11.65234375, 13.56396484375, 15.4755859375, 17.38720703125, 19.298828125, 21.21044921875, 23.1220703125, 25.03369140625, 26.9453125, 28.85693359375, 30.7685546875, 32.68017578125, 34.591796875, 36.50341796875, 38.4150390625, 40.32666015625, 42.23828125, 44.14990234375, 46.0615234375, 47.97314453125, 49.884765625, 51.79638671875, 53.7080078125, 55.61962890625, 57.53125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 10.0, 62.0, 220.0, 342.0, 266.0, 88.0, 21.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.037247657775879, -7.4186272621154785, -5.800006866455078, -4.181386947631836, -2.5627665519714355, -0.9441461563110352, 0.674473762512207, 2.2930946350097656, 3.911714553833008, 5.530334949493408, 7.148955345153809, 8.76757526397705, 10.38619613647461, 12.004816055297852, 13.623435974121094, 15.242056846618652, 16.860675811767578, 18.47929573059082, 20.097915649414062, 21.716537475585938, 23.33515739440918, 24.953777313232422, 26.572397232055664, 28.191017150878906, 29.80963897705078, 31.428258895874023, 33.046878814697266, 34.66550064086914, 36.28411865234375, 37.902740478515625, 39.5213623046875, 41.13998031616211, 42.758602142333984, 44.37722396850586, 45.99584197998047, 47.614463806152344, 49.23308181762695, 50.85170364379883, 52.47032165527344, 54.08894348144531, 55.70756530761719, 57.32618713378906, 58.94480514526367, 60.56342697143555, 62.182044982910156, 63.80066680908203, 65.4192886352539, 67.03791046142578, 68.65652465820312, 70.275146484375, 71.89376831054688, 73.51238250732422, 75.1310043334961, 76.74962615966797, 78.36824798583984, 79.98686981201172, 81.6054916381836, 83.22411346435547, 84.84273529052734, 86.46134948730469, 88.07997131347656, 89.69859313964844, 91.31721496582031, 92.93583679199219, 94.55445098876953]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 11.0, 16.0, 19.0, 11.0, 21.0, 14.0, 23.0, 35.0, 30.0, 27.0, 38.0, 46.0, 48.0, 46.0, 55.0, 43.0, 53.0, 39.0, 50.0, 46.0, 31.0, 45.0, 24.0, 38.0, 28.0, 24.0, 17.0, 22.0, 19.0, 15.0, 15.0, 16.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4478988647461, -62.54887390136719, -60.649845123291016, -58.75082015991211, -56.85179138183594, -54.95276641845703, -53.053741455078125, -51.15471267700195, -49.25568389892578, -47.356658935546875, -45.4576301574707, -43.5586051940918, -41.659576416015625, -39.76055145263672, -37.86152648925781, -35.96249771118164, -34.063472747802734, -32.16444778442383, -30.265419006347656, -28.36639404296875, -26.467365264892578, -24.568340301513672, -22.669313430786133, -20.770286560058594, -18.871259689331055, -16.972232818603516, -15.073205947875977, -13.174180030822754, -11.275153160095215, -9.376126289367676, -7.477100372314453, -5.578073501586914, -3.6790504455566406, -1.7800238132476807, 0.1190028190612793, 2.01802921295166, 3.917056083679199, 5.816082954406738, 7.715108871459961, 9.6141357421875, 11.513162612915039, 13.412189483642578, 15.311216354370117, 17.210243225097656, 19.109268188476562, 21.008296966552734, 22.90732192993164, 24.80634880065918, 26.70537567138672, 28.604402542114258, 30.503429412841797, 32.4024543762207, 34.301483154296875, 36.20050811767578, 38.09953308105469, 39.99856185913086, 41.89759063720703, 43.79661560058594, 45.69564437866211, 47.594669342041016, 49.49369812011719, 51.392723083496094, 53.291748046875, 55.19077682495117, 57.08980178833008]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 11.0, 10.0, 12.0, 11.0, 12.0, 5.0, 9.0, 23.0, 28.0, 20.0, 30.0, 34.0, 33.0, 34.0, 34.0, 33.0, 35.0, 29.0, 35.0, 47.0, 38.0, 41.0, 43.0, 38.0, 38.0, 29.0, 39.0, 25.0, 22.0, 30.0, 22.0, 20.0, 17.0, 13.0, 18.0, 17.0, 20.0, 6.0, 2.0, 10.0, 8.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.76953125, -5.57916259765625, -5.3887939453125, -5.19842529296875, -5.008056640625, -4.81768798828125, -4.6273193359375, -4.43695068359375, -4.24658203125, -4.05621337890625, -3.8658447265625, -3.67547607421875, -3.485107421875, -3.29473876953125, -3.1043701171875, -2.91400146484375, -2.7236328125, -2.53326416015625, -2.3428955078125, -2.15252685546875, -1.962158203125, -1.77178955078125, -1.5814208984375, -1.39105224609375, -1.20068359375, -1.01031494140625, -0.8199462890625, -0.62957763671875, -0.439208984375, -0.24884033203125, -0.0584716796875, 0.13189697265625, 0.322265625, 0.51263427734375, 0.7030029296875, 0.89337158203125, 1.083740234375, 1.27410888671875, 1.4644775390625, 1.65484619140625, 1.84521484375, 2.03558349609375, 2.2259521484375, 2.41632080078125, 2.606689453125, 2.79705810546875, 2.9874267578125, 3.17779541015625, 3.3681640625, 3.55853271484375, 3.7489013671875, 3.93927001953125, 4.129638671875, 4.32000732421875, 4.5103759765625, 4.70074462890625, 4.89111328125, 5.08148193359375, 5.2718505859375, 5.46221923828125, 5.652587890625, 5.84295654296875, 6.0333251953125, 6.22369384765625, 6.4140625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 8.0, 12.0, 10.0, 10.0, 24.0, 19.0, 28.0, 47.0, 39.0, 68.0, 100.0, 151.0, 233.0, 434.0, 856.0, 2191.0, 7648.0, 43566.0, 290943.0, 1193392.0, 1765672.0, 737662.0, 125201.0, 18413.0, 4368.0, 1468.0, 670.0, 386.0, 221.0, 107.0, 86.0, 62.0, 37.0, 21.0, 25.0, 23.0, 22.0, 9.0, 9.0, 8.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9765625, -6.711181640625, -6.44580078125, -6.180419921875, -5.9150390625, -5.649658203125, -5.38427734375, -5.118896484375, -4.853515625, -4.588134765625, -4.32275390625, -4.057373046875, -3.7919921875, -3.526611328125, -3.26123046875, -2.995849609375, -2.73046875, -2.465087890625, -2.19970703125, -1.934326171875, -1.6689453125, -1.403564453125, -1.13818359375, -0.872802734375, -0.607421875, -0.342041015625, -0.07666015625, 0.188720703125, 0.4541015625, 0.719482421875, 0.98486328125, 1.250244140625, 1.515625, 1.781005859375, 2.04638671875, 2.311767578125, 2.5771484375, 2.842529296875, 3.10791015625, 3.373291015625, 3.638671875, 3.904052734375, 4.16943359375, 4.434814453125, 4.7001953125, 4.965576171875, 5.23095703125, 5.496337890625, 5.76171875, 6.027099609375, 6.29248046875, 6.557861328125, 6.8232421875, 7.088623046875, 7.35400390625, 7.619384765625, 7.884765625, 8.150146484375, 8.41552734375, 8.680908203125, 8.9462890625, 9.211669921875, 9.47705078125, 9.742431640625, 10.0078125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 4.0, 24.0, 24.0, 48.0, 44.0, 85.0, 117.0, 189.0, 326.0, 463.0, 646.0, 562.0, 499.0, 345.0, 248.0, 152.0, 76.0, 72.0, 49.0, 31.0, 23.0, 13.0, 12.0, 5.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.25, -20.769775390625, -20.28955078125, -19.809326171875, -19.3291015625, -18.848876953125, -18.36865234375, -17.888427734375, -17.408203125, -16.927978515625, -16.44775390625, -15.967529296875, -15.4873046875, -15.007080078125, -14.52685546875, -14.046630859375, -13.56640625, -13.086181640625, -12.60595703125, -12.125732421875, -11.6455078125, -11.165283203125, -10.68505859375, -10.204833984375, -9.724609375, -9.244384765625, -8.76416015625, -8.283935546875, -7.8037109375, -7.323486328125, -6.84326171875, -6.363037109375, -5.8828125, -5.402587890625, -4.92236328125, -4.442138671875, -3.9619140625, -3.481689453125, -3.00146484375, -2.521240234375, -2.041015625, -1.560791015625, -1.08056640625, -0.600341796875, -0.1201171875, 0.360107421875, 0.84033203125, 1.320556640625, 1.80078125, 2.281005859375, 2.76123046875, 3.241455078125, 3.7216796875, 4.201904296875, 4.68212890625, 5.162353515625, 5.642578125, 6.122802734375, 6.60302734375, 7.083251953125, 7.5634765625, 8.043701171875, 8.52392578125, 9.004150390625, 9.484375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 11.0, 16.0, 19.0, 35.0, 58.0, 82.0, 120.0, 202.0, 352.0, 656.0, 1519.0, 11633.0, 4079440.0, 96082.0, 2192.0, 789.0, 424.0, 250.0, 149.0, 91.0, 60.0, 43.0, 20.0, 21.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -35.38134765625, -33.6689453125, -31.95654296875, -30.244140625, -28.53173828125, -26.8193359375, -25.10693359375, -23.39453125, -21.68212890625, -19.9697265625, -18.25732421875, -16.544921875, -14.83251953125, -13.1201171875, -11.40771484375, -9.6953125, -7.98291015625, -6.2705078125, -4.55810546875, -2.845703125, -1.13330078125, 0.5791015625, 2.29150390625, 4.00390625, 5.71630859375, 7.4287109375, 9.14111328125, 10.853515625, 12.56591796875, 14.2783203125, 15.99072265625, 17.703125, 19.41552734375, 21.1279296875, 22.84033203125, 24.552734375, 26.26513671875, 27.9775390625, 29.68994140625, 31.40234375, 33.11474609375, 34.8271484375, 36.53955078125, 38.251953125, 39.96435546875, 41.6767578125, 43.38916015625, 45.1015625, 46.81396484375, 48.5263671875, 50.23876953125, 51.951171875, 53.66357421875, 55.3759765625, 57.08837890625, 58.80078125, 60.51318359375, 62.2255859375, 63.93798828125, 65.650390625, 67.36279296875, 69.0751953125, 70.78759765625, 72.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 149.0, 457.0, 336.0, 56.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.36093139648438, -139.35037231445312, -134.33981323242188, -129.3292694091797, -124.31871032714844, -119.30815124511719, -114.29759216308594, -109.28703308105469, -104.27648162841797, -99.26592254638672, -94.25537109375, -89.24481201171875, -84.2342529296875, -79.22370147705078, -74.21314239501953, -69.20259094238281, -64.19203186035156, -59.18147659301758, -54.170921325683594, -49.160362243652344, -44.14980697631836, -39.139251708984375, -34.128692626953125, -29.11813735961914, -24.107582092285156, -19.097026824951172, -14.086469650268555, -9.075913429260254, -4.065357208251953, 0.9451980590820312, 5.955755233764648, 10.966312408447266, 15.976882934570312, 20.987438201904297, 25.997995376586914, 31.00855255126953, 36.019107818603516, 41.0296630859375, 46.04022216796875, 51.050777435302734, 56.06133270263672, 61.0718879699707, 66.08244323730469, 71.09300231933594, 76.10356140136719, 81.1141128540039, 86.12467193603516, 91.13522338867188, 96.14578247070312, 101.15634155273438, 106.1668930053711, 111.17745208740234, 116.18800354003906, 121.19856262207031, 126.20912170410156, 131.2196807861328, 136.230224609375, 141.24078369140625, 146.2513427734375, 151.2618865966797, 156.27244567871094, 161.2830047607422, 166.29356384277344, 171.3041229248047, 176.31468200683594]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 3.0, 7.0, 13.0, 15.0, 10.0, 9.0, 19.0, 26.0, 30.0, 24.0, 23.0, 32.0, 33.0, 37.0, 40.0, 40.0, 53.0, 41.0, 45.0, 44.0, 44.0, 44.0, 42.0, 20.0, 36.0, 35.0, 46.0, 29.0, 30.0, 27.0, 13.0, 16.0, 19.0, 15.0, 9.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.76203155517578, -36.543174743652344, -35.324317932128906, -34.10546112060547, -32.88660430908203, -31.667747497558594, -30.44889259338379, -29.23003578186035, -28.011178970336914, -26.792322158813477, -25.57346534729004, -24.3546085357666, -23.135753631591797, -21.91689682006836, -20.698040008544922, -19.479183197021484, -18.260326385498047, -17.04146957397461, -15.822612762451172, -14.60375690460205, -13.384900093078613, -12.166043281555176, -10.947187423706055, -9.728330612182617, -8.50947380065918, -7.290616989135742, -6.071760654449463, -4.852904319763184, -3.634047508239746, -2.4151906967163086, -1.1963343620300293, 0.02252197265625, 1.2413749694824219, 2.4602315425872803, 3.6790881156921387, 4.897944450378418, 6.1168012619018555, 7.335658073425293, 8.554513931274414, 9.773370742797852, 10.992227554321289, 12.211084365844727, 13.429941177368164, 14.648797035217285, 15.867653846740723, 17.086509704589844, 18.30536651611328, 19.52422332763672, 20.743080139160156, 21.961936950683594, 23.18079376220703, 24.39965057373047, 25.618507385253906, 26.837364196777344, 28.05621910095215, 29.275075912475586, 30.493932723999023, 31.71278953552246, 32.931644439697266, 34.1505012512207, 35.36935806274414, 36.58821487426758, 37.807071685791016, 39.02592849731445, 40.24478530883789]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 8.0, 4.0, 15.0, 11.0, 15.0, 15.0, 16.0, 19.0, 26.0, 16.0, 18.0, 20.0, 29.0, 21.0, 35.0, 37.0, 43.0, 33.0, 34.0, 39.0, 53.0, 45.0, 40.0, 35.0, 35.0, 37.0, 29.0, 24.0, 27.0, 33.0, 32.0, 19.0, 12.0, 28.0, 17.0, 11.0, 9.0, 9.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.578125, -5.39715576171875, -5.2161865234375, -5.03521728515625, -4.854248046875, -4.67327880859375, -4.4923095703125, -4.31134033203125, -4.13037109375, -3.94940185546875, -3.7684326171875, -3.58746337890625, -3.406494140625, -3.22552490234375, -3.0445556640625, -2.86358642578125, -2.6826171875, -2.50164794921875, -2.3206787109375, -2.13970947265625, -1.958740234375, -1.77777099609375, -1.5968017578125, -1.41583251953125, -1.23486328125, -1.05389404296875, -0.8729248046875, -0.69195556640625, -0.510986328125, -0.33001708984375, -0.1490478515625, 0.03192138671875, 0.212890625, 0.39385986328125, 0.5748291015625, 0.75579833984375, 0.936767578125, 1.11773681640625, 1.2987060546875, 1.47967529296875, 1.66064453125, 1.84161376953125, 2.0225830078125, 2.20355224609375, 2.384521484375, 2.56549072265625, 2.7464599609375, 2.92742919921875, 3.1083984375, 3.28936767578125, 3.4703369140625, 3.65130615234375, 3.832275390625, 4.01324462890625, 4.1942138671875, 4.37518310546875, 4.55615234375, 4.73712158203125, 4.9180908203125, 5.09906005859375, 5.280029296875, 5.46099853515625, 5.6419677734375, 5.82293701171875, 6.00390625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 13.0, 29.0, 16.0, 37.0, 58.0, 74.0, 92.0, 161.0, 229.0, 300.0, 445.0, 673.0, 919.0, 1337.0, 1934.0, 2783.0, 4116.0, 5930.0, 8892.0, 13028.0, 19653.0, 29339.0, 46020.0, 74705.0, 135151.0, 323480.0, 152338.0, 81367.0, 49280.0, 31702.0, 20843.0, 13931.0, 9405.0, 6275.0, 4357.0, 2930.0, 2029.0, 1412.0, 1018.0, 684.0, 482.0, 339.0, 226.0, 175.0, 100.0, 81.0, 64.0, 32.0, 26.0, 19.0, 14.0, 5.0, 5.0, 3.0, 1.0, 3.0], "bins": [-1.3291015625, -1.289520263671875, -1.24993896484375, -1.210357666015625, -1.1707763671875, -1.131195068359375, -1.09161376953125, -1.052032470703125, -1.012451171875, -0.972869873046875, -0.93328857421875, -0.893707275390625, -0.8541259765625, -0.814544677734375, -0.77496337890625, -0.735382080078125, -0.69580078125, -0.656219482421875, -0.61663818359375, -0.577056884765625, -0.5374755859375, -0.497894287109375, -0.45831298828125, -0.418731689453125, -0.379150390625, -0.339569091796875, -0.29998779296875, -0.260406494140625, -0.2208251953125, -0.181243896484375, -0.14166259765625, -0.102081298828125, -0.0625, -0.022918701171875, 0.01666259765625, 0.056243896484375, 0.0958251953125, 0.135406494140625, 0.17498779296875, 0.214569091796875, 0.254150390625, 0.293731689453125, 0.33331298828125, 0.372894287109375, 0.4124755859375, 0.452056884765625, 0.49163818359375, 0.531219482421875, 0.57080078125, 0.610382080078125, 0.64996337890625, 0.689544677734375, 0.7291259765625, 0.768707275390625, 0.80828857421875, 0.847869873046875, 0.887451171875, 0.927032470703125, 0.96661376953125, 1.006195068359375, 1.0457763671875, 1.085357666015625, 1.12493896484375, 1.164520263671875, 1.2041015625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 10.0, 11.0, 6.0, 14.0, 14.0, 20.0, 17.0, 21.0, 26.0, 33.0, 26.0, 28.0, 43.0, 36.0, 30.0, 36.0, 57.0, 38.0, 1069.0, 37.0, 39.0, 44.0, 39.0, 35.0, 34.0, 34.0, 21.0, 29.0, 25.0, 25.0, 19.0, 8.0, 15.0, 7.0, 12.0, 5.0, 12.0, 9.0, 3.0, 3.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.75, -3.632598876953125, -3.51519775390625, -3.397796630859375, -3.2803955078125, -3.162994384765625, -3.04559326171875, -2.928192138671875, -2.810791015625, -2.693389892578125, -2.57598876953125, -2.458587646484375, -2.3411865234375, -2.223785400390625, -2.10638427734375, -1.988983154296875, -1.87158203125, -1.754180908203125, -1.63677978515625, -1.519378662109375, -1.4019775390625, -1.284576416015625, -1.16717529296875, -1.049774169921875, -0.932373046875, -0.814971923828125, -0.69757080078125, -0.580169677734375, -0.4627685546875, -0.345367431640625, -0.22796630859375, -0.110565185546875, 0.0068359375, 0.124237060546875, 0.24163818359375, 0.359039306640625, 0.4764404296875, 0.593841552734375, 0.71124267578125, 0.828643798828125, 0.946044921875, 1.063446044921875, 1.18084716796875, 1.298248291015625, 1.4156494140625, 1.533050537109375, 1.65045166015625, 1.767852783203125, 1.88525390625, 2.002655029296875, 2.12005615234375, 2.237457275390625, 2.3548583984375, 2.472259521484375, 2.58966064453125, 2.707061767578125, 2.824462890625, 2.941864013671875, 3.05926513671875, 3.176666259765625, 3.2940673828125, 3.411468505859375, 3.52886962890625, 3.646270751953125, 3.763671875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 12.0, 22.0, 20.0, 31.0, 52.0, 77.0, 90.0, 129.0, 214.0, 324.0, 417.0, 676.0, 1057.0, 1600.0, 2537.0, 4005.0, 6535.0, 10416.0, 17568.0, 29839.0, 52014.0, 96998.0, 240289.0, 1376395.0, 112916.0, 59324.0, 33109.0, 19245.0, 11361.0, 7068.0, 4468.0, 2887.0, 1883.0, 1238.0, 771.0, 517.0, 352.0, 237.0, 154.0, 77.0, 67.0, 47.0, 30.0, 11.0, 18.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.496795654296875, -1.44866943359375, -1.400543212890625, -1.3524169921875, -1.304290771484375, -1.25616455078125, -1.208038330078125, -1.159912109375, -1.111785888671875, -1.06365966796875, -1.015533447265625, -0.9674072265625, -0.919281005859375, -0.87115478515625, -0.823028564453125, -0.77490234375, -0.726776123046875, -0.67864990234375, -0.630523681640625, -0.5823974609375, -0.534271240234375, -0.48614501953125, -0.438018798828125, -0.389892578125, -0.341766357421875, -0.29364013671875, -0.245513916015625, -0.1973876953125, -0.149261474609375, -0.10113525390625, -0.053009033203125, -0.0048828125, 0.043243408203125, 0.09136962890625, 0.139495849609375, 0.1876220703125, 0.235748291015625, 0.28387451171875, 0.332000732421875, 0.380126953125, 0.428253173828125, 0.47637939453125, 0.524505615234375, 0.5726318359375, 0.620758056640625, 0.66888427734375, 0.717010498046875, 0.76513671875, 0.813262939453125, 0.86138916015625, 0.909515380859375, 0.9576416015625, 1.005767822265625, 1.05389404296875, 1.102020263671875, 1.150146484375, 1.198272705078125, 1.24639892578125, 1.294525146484375, 1.3426513671875, 1.390777587890625, 1.43890380859375, 1.487030029296875, 1.53515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 9.0, 6.0, 9.0, 11.0, 20.0, 29.0, 41.0, 82.0, 123.0, 175.0, 178.0, 108.0, 68.0, 38.0, 25.0, 19.0, 10.0, 9.0, 9.0, 0.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011463165283203125, -0.0011051595211029053, -0.001064002513885498, -0.0010228455066680908, -0.0009816884994506836, -0.0009405314922332764, -0.0008993744850158691, -0.0008582174777984619, -0.0008170604705810547, -0.0007759034633636475, -0.0007347464561462402, -0.000693589448928833, -0.0006524324417114258, -0.0006112754344940186, -0.0005701184272766113, -0.0005289614200592041, -0.0004878044128417969, -0.00044664740562438965, -0.0004054903984069824, -0.0003643333911895752, -0.00032317638397216797, -0.00028201937675476074, -0.00024086236953735352, -0.0001997053623199463, -0.00015854835510253906, -0.00011739134788513184, -7.623434066772461e-05, -3.507733345031738e-05, 6.079673767089844e-06, 4.723668098449707e-05, 8.83936882019043e-05, 0.00012955069541931152, 0.00017070770263671875, 0.00021186470985412598, 0.0002530217170715332, 0.00029417872428894043, 0.00033533573150634766, 0.0003764927387237549, 0.0004176497459411621, 0.00045880675315856934, 0.0004999637603759766, 0.0005411207675933838, 0.000582277774810791, 0.0006234347820281982, 0.0006645917892456055, 0.0007057487964630127, 0.0007469058036804199, 0.0007880628108978271, 0.0008292198181152344, 0.0008703768253326416, 0.0009115338325500488, 0.0009526908397674561, 0.0009938478469848633, 0.0010350048542022705, 0.0010761618614196777, 0.001117318868637085, 0.0011584758758544922, 0.0011996328830718994, 0.0012407898902893066, 0.0012819468975067139, 0.001323103904724121, 0.0013642609119415283, 0.0014054179191589355, 0.0014465749263763428, 0.00148773193359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 13.0, 11.0, 13.0, 23.0, 31.0, 60.0, 70.0, 132.0, 268.0, 715.0, 39494.0, 1005556.0, 1308.0, 353.0, 178.0, 103.0, 58.0, 31.0, 29.0, 13.0, 20.0, 10.0, 12.0, 5.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.027862548828125, -0.027092695236206055, -0.02632284164428711, -0.025552988052368164, -0.02478313446044922, -0.024013280868530273, -0.023243427276611328, -0.022473573684692383, -0.021703720092773438, -0.020933866500854492, -0.020164012908935547, -0.0193941593170166, -0.018624305725097656, -0.01785445213317871, -0.017084598541259766, -0.01631474494934082, -0.015544891357421875, -0.01477503776550293, -0.014005184173583984, -0.013235330581665039, -0.012465476989746094, -0.011695623397827148, -0.010925769805908203, -0.010155916213989258, -0.009386062622070312, -0.008616209030151367, -0.007846355438232422, -0.0070765018463134766, -0.006306648254394531, -0.005536794662475586, -0.004766941070556641, -0.003997087478637695, -0.00322723388671875, -0.0024573802947998047, -0.0016875267028808594, -0.0009176731109619141, -0.00014781951904296875, 0.0006220340728759766, 0.0013918876647949219, 0.002161741256713867, 0.0029315948486328125, 0.003701448440551758, 0.004471302032470703, 0.0052411556243896484, 0.006011009216308594, 0.006780862808227539, 0.007550716400146484, 0.00832056999206543, 0.009090423583984375, 0.00986027717590332, 0.010630130767822266, 0.011399984359741211, 0.012169837951660156, 0.012939691543579102, 0.013709545135498047, 0.014479398727416992, 0.015249252319335938, 0.016019105911254883, 0.016788959503173828, 0.017558813095092773, 0.01832866668701172, 0.019098520278930664, 0.01986837387084961, 0.020638227462768555, 0.0214080810546875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 499.0, 498.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006397530902177095, -0.0062641846016049385, -0.006130837835371494, -0.005997491534799337, -0.0058641452342271805, -0.005730798467993736, -0.005597452167421579, -0.005464105401188135, -0.005330759100615978, -0.005197412800043821, -0.005064066033810377, -0.00493071973323822, -0.004797372967004776, -0.004664026666432619, -0.004530680365860462, -0.004397333599627018, -0.004263987299054861, -0.004130640998482704, -0.00399729423224926, -0.003863947931677103, -0.0037306013982743025, -0.003597254864871502, -0.003463908564299345, -0.0033305620308965445, -0.003197215497493744, -0.0030638689640909433, -0.0029305224306881428, -0.002797176130115986, -0.0026638295967131853, -0.0025304830633103848, -0.002397136762738228, -0.0022637902293354273, -0.002130444161593914, -0.0019970976281911135, -0.0018637512112036347, -0.001730404794216156, -0.0015970582608133554, -0.0014637117274105549, -0.0013303653104230762, -0.0011970188934355974, -0.0010636723600327969, -0.0009303258848376572, -0.0007969794096425176, -0.0006636329344473779, -0.0005302864592522383, -0.0003969399840570986, -0.000263593508861959, -0.00013024703366681933, 3.0994415283203125e-06, 0.00013644591672345996, 0.0002697923919185996, 0.00040313886711373925, 0.0005364853423088789, 0.0006698318175040185, 0.0008031782926991582, 0.0009365247678942978, 0.0010698712430894375, 0.001203217776492238, 0.0013365641934797168, 0.0014699106104671955, 0.001603257143869996, 0.0017366036772727966, 0.0018699500942602754, 0.002003296511247754, 0.0021366430446505547]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 14.0, 13.0, 15.0, 10.0, 23.0, 18.0, 26.0, 27.0, 25.0, 34.0, 36.0, 48.0, 38.0, 45.0, 42.0, 50.0, 56.0, 44.0, 55.0, 43.0, 38.0, 44.0, 36.0, 37.0, 30.0, 23.0, 24.0, 19.0, 16.0, 11.0, 7.0, 11.0, 4.0, 5.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004138350486755371, -0.0003994675353169441, -0.00038510002195835114, -0.00037073250859975815, -0.00035636499524116516, -0.0003419974818825722, -0.0003276299685239792, -0.0003132624551653862, -0.0002988949418067932, -0.0002845274284482002, -0.00027015991508960724, -0.00025579240173101425, -0.00024142488837242126, -0.00022705737501382828, -0.0002126898616552353, -0.0001983223482966423, -0.00018395483493804932, -0.00016958732157945633, -0.00015521980822086334, -0.00014085229486227036, -0.00012648478150367737, -0.00011211726814508438, -9.77497547864914e-05, -8.338224142789841e-05, -6.901472806930542e-05, -5.464721471071243e-05, -4.0279701352119446e-05, -2.591218799352646e-05, -1.1544674634933472e-05, 2.8228387236595154e-06, 1.7190352082252502e-05, 3.155786544084549e-05, 4.5925378799438477e-05, 6.0292892158031464e-05, 7.466040551662445e-05, 8.902791887521744e-05, 0.00010339543223381042, 0.00011776294559240341, 0.0001321304589509964, 0.00014649797230958939, 0.00016086548566818237, 0.00017523299902677536, 0.00018960051238536835, 0.00020396802574396133, 0.00021833553910255432, 0.0002327030524611473, 0.0002470705658197403, 0.0002614380791783333, 0.00027580559253692627, 0.00029017310589551926, 0.00030454061925411224, 0.00031890813261270523, 0.0003332756459712982, 0.0003476431593298912, 0.0003620106726884842, 0.0003763781860470772, 0.00039074569940567017, 0.00040511321276426315, 0.00041948072612285614, 0.00043384823948144913, 0.0004482157528400421, 0.0004625832661986351, 0.0004769507795572281, 0.0004913182929158211, 0.0005056858062744141]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 8.0, 4.0, 15.0, 11.0, 15.0, 15.0, 16.0, 19.0, 26.0, 16.0, 18.0, 20.0, 29.0, 21.0, 35.0, 37.0, 43.0, 33.0, 34.0, 40.0, 52.0, 45.0, 40.0, 35.0, 35.0, 37.0, 29.0, 24.0, 27.0, 33.0, 32.0, 19.0, 12.0, 28.0, 17.0, 11.0, 9.0, 9.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.578125, -5.39715576171875, -5.2161865234375, -5.03521728515625, -4.854248046875, -4.67327880859375, -4.4923095703125, -4.31134033203125, -4.13037109375, -3.94940185546875, -3.7684326171875, -3.58746337890625, -3.406494140625, -3.22552490234375, -3.0445556640625, -2.86358642578125, -2.6826171875, -2.50164794921875, -2.3206787109375, -2.13970947265625, -1.958740234375, -1.77777099609375, -1.5968017578125, -1.41583251953125, -1.23486328125, -1.05389404296875, -0.8729248046875, -0.69195556640625, -0.510986328125, -0.33001708984375, -0.1490478515625, 0.03192138671875, 0.212890625, 0.39385986328125, 0.5748291015625, 0.75579833984375, 0.936767578125, 1.11773681640625, 1.2987060546875, 1.47967529296875, 1.66064453125, 1.84161376953125, 2.0225830078125, 2.20355224609375, 2.384521484375, 2.56549072265625, 2.7464599609375, 2.92742919921875, 3.1083984375, 3.28936767578125, 3.4703369140625, 3.65130615234375, 3.832275390625, 4.01324462890625, 4.1942138671875, 4.37518310546875, 4.55615234375, 4.73712158203125, 4.9180908203125, 5.09906005859375, 5.280029296875, 5.46099853515625, 5.6419677734375, 5.82293701171875, 6.00390625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 13.0, 5.0, 9.0, 13.0, 17.0, 23.0, 29.0, 38.0, 48.0, 76.0, 141.0, 236.0, 516.0, 1048.0, 2379.0, 5749.0, 13634.0, 33254.0, 87751.0, 252025.0, 379933.0, 170369.0, 60243.0, 23612.0, 9850.0, 4155.0, 1701.0, 765.0, 372.0, 192.0, 98.0, 68.0, 52.0, 27.0, 19.0, 14.0, 15.0, 17.0, 10.0, 5.0, 3.0, 9.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-6.03515625, -5.8424072265625, -5.649658203125, -5.4569091796875, -5.26416015625, -5.0714111328125, -4.878662109375, -4.6859130859375, -4.4931640625, -4.3004150390625, -4.107666015625, -3.9149169921875, -3.72216796875, -3.5294189453125, -3.336669921875, -3.1439208984375, -2.951171875, -2.7584228515625, -2.565673828125, -2.3729248046875, -2.18017578125, -1.9874267578125, -1.794677734375, -1.6019287109375, -1.4091796875, -1.2164306640625, -1.023681640625, -0.8309326171875, -0.63818359375, -0.4454345703125, -0.252685546875, -0.0599365234375, 0.1328125, 0.3255615234375, 0.518310546875, 0.7110595703125, 0.90380859375, 1.0965576171875, 1.289306640625, 1.4820556640625, 1.6748046875, 1.8675537109375, 2.060302734375, 2.2530517578125, 2.44580078125, 2.6385498046875, 2.831298828125, 3.0240478515625, 3.216796875, 3.4095458984375, 3.602294921875, 3.7950439453125, 3.98779296875, 4.1805419921875, 4.373291015625, 4.5660400390625, 4.7587890625, 4.9515380859375, 5.144287109375, 5.3370361328125, 5.52978515625, 5.7225341796875, 5.915283203125, 6.1080322265625, 6.30078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 10.0, 6.0, 9.0, 12.0, 13.0, 19.0, 26.0, 22.0, 32.0, 26.0, 36.0, 30.0, 43.0, 33.0, 58.0, 85.0, 199.0, 1449.0, 347.0, 108.0, 79.0, 42.0, 37.0, 42.0, 44.0, 28.0, 31.0, 34.0, 21.0, 13.0, 18.0, 13.0, 11.0, 10.0, 10.0, 13.0, 6.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0], "bins": [-22.875, -22.217041015625, -21.55908203125, -20.901123046875, -20.2431640625, -19.585205078125, -18.92724609375, -18.269287109375, -17.611328125, -16.953369140625, -16.29541015625, -15.637451171875, -14.9794921875, -14.321533203125, -13.66357421875, -13.005615234375, -12.34765625, -11.689697265625, -11.03173828125, -10.373779296875, -9.7158203125, -9.057861328125, -8.39990234375, -7.741943359375, -7.083984375, -6.426025390625, -5.76806640625, -5.110107421875, -4.4521484375, -3.794189453125, -3.13623046875, -2.478271484375, -1.8203125, -1.162353515625, -0.50439453125, 0.153564453125, 0.8115234375, 1.469482421875, 2.12744140625, 2.785400390625, 3.443359375, 4.101318359375, 4.75927734375, 5.417236328125, 6.0751953125, 6.733154296875, 7.39111328125, 8.049072265625, 8.70703125, 9.364990234375, 10.02294921875, 10.680908203125, 11.3388671875, 11.996826171875, 12.65478515625, 13.312744140625, 13.970703125, 14.628662109375, 15.28662109375, 15.944580078125, 16.6025390625, 17.260498046875, 17.91845703125, 18.576416015625, 19.234375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 5.0, 20.0, 14.0, 14.0, 14.0, 26.0, 36.0, 55.0, 55.0, 77.0, 149.0, 244.0, 376.0, 811.0, 4082.0, 2929729.0, 206590.0, 1877.0, 629.0, 334.0, 185.0, 97.0, 74.0, 50.0, 50.0, 24.0, 16.0, 14.0, 13.0, 6.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-58.125, -56.35498046875, -54.5849609375, -52.81494140625, -51.044921875, -49.27490234375, -47.5048828125, -45.73486328125, -43.96484375, -42.19482421875, -40.4248046875, -38.65478515625, -36.884765625, -35.11474609375, -33.3447265625, -31.57470703125, -29.8046875, -28.03466796875, -26.2646484375, -24.49462890625, -22.724609375, -20.95458984375, -19.1845703125, -17.41455078125, -15.64453125, -13.87451171875, -12.1044921875, -10.33447265625, -8.564453125, -6.79443359375, -5.0244140625, -3.25439453125, -1.484375, 0.28564453125, 2.0556640625, 3.82568359375, 5.595703125, 7.36572265625, 9.1357421875, 10.90576171875, 12.67578125, 14.44580078125, 16.2158203125, 17.98583984375, 19.755859375, 21.52587890625, 23.2958984375, 25.06591796875, 26.8359375, 28.60595703125, 30.3759765625, 32.14599609375, 33.916015625, 35.68603515625, 37.4560546875, 39.22607421875, 40.99609375, 42.76611328125, 44.5361328125, 46.30615234375, 48.076171875, 49.84619140625, 51.6162109375, 53.38623046875, 55.15625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 117.0, 766.0, 129.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.33853149414062, -105.20160675048828, -100.0646743774414, -94.92774963378906, -89.79081726074219, -84.65389251708984, -79.5169677734375, -74.38003540039062, -69.24311065673828, -64.10618591308594, -58.96925354003906, -53.83232879638672, -48.69540023803711, -43.5584716796875, -38.421546936035156, -33.28461837768555, -28.147689819335938, -23.010761260986328, -17.87383460998535, -12.736907005310059, -7.599979400634766, -2.4630508422851562, 2.6738758087158203, 7.810802459716797, 12.947731018066406, 18.084659576416016, 23.221586227416992, 28.35851287841797, 33.49544143676758, 38.63236999511719, 43.76929473876953, 48.90622329711914, 54.04316711425781, 59.18009567260742, 64.31702423095703, 69.45394897460938, 74.59088134765625, 79.7278060913086, 84.86473083496094, 90.00166320800781, 95.13858795166016, 100.2755126953125, 105.41244506835938, 110.54936981201172, 115.68629455566406, 120.82322692871094, 125.96015167236328, 131.09707641601562, 136.2340087890625, 141.37094116210938, 146.5078582763672, 151.64479064941406, 156.78172302246094, 161.91864013671875, 167.05557250976562, 172.1925048828125, 177.32943725585938, 182.46636962890625, 187.60328674316406, 192.74021911621094, 197.8771514892578, 203.01406860351562, 208.1510009765625, 213.28793334960938, 218.4248504638672]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 3.0, 7.0, 10.0, 13.0, 15.0, 15.0, 23.0, 27.0, 24.0, 18.0, 35.0, 21.0, 37.0, 35.0, 37.0, 37.0, 39.0, 49.0, 46.0, 41.0, 37.0, 24.0, 40.0, 38.0, 38.0, 37.0, 22.0, 29.0, 32.0, 32.0, 23.0, 17.0, 15.0, 17.0, 9.0, 11.0, 7.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.971168518066406, -55.327877044677734, -53.68458938598633, -52.041297912597656, -50.398006439208984, -48.75471878051758, -47.111427307128906, -45.4681396484375, -43.82484817504883, -42.181556701660156, -40.53826904296875, -38.89497756958008, -37.251686096191406, -35.6083984375, -33.96510696411133, -32.321815490722656, -30.678525924682617, -29.035236358642578, -27.391944885253906, -25.748655319213867, -24.105365753173828, -22.462074279785156, -20.818784713745117, -19.175495147705078, -17.532203674316406, -15.88891315460205, -14.245623588562012, -12.602333068847656, -10.959043502807617, -9.315752983093262, -7.672462463378906, -6.029172897338867, -4.385883331298828, -2.742593288421631, -1.0993030071258545, 0.5439872741699219, 2.187277317047119, 3.8305673599243164, 5.473857879638672, 7.117147445678711, 8.760437965393066, 10.403728485107422, 12.047018051147461, 13.690308570861816, 15.333599090576172, 16.97688865661621, 18.62017822265625, 20.263469696044922, 21.90675926208496, 23.550048828125, 25.193340301513672, 26.83662986755371, 28.47991943359375, 30.123210906982422, 31.76650047302246, 33.4097900390625, 35.05308151245117, 36.696372985839844, 38.33966064453125, 39.98295211791992, 41.626243591308594, 43.26953125, 44.91282272338867, 46.556114196777344, 48.19940185546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 7.0, 6.0, 3.0, 8.0, 15.0, 13.0, 19.0, 19.0, 13.0, 13.0, 26.0, 20.0, 40.0, 30.0, 26.0, 36.0, 34.0, 39.0, 38.0, 48.0, 45.0, 43.0, 36.0, 34.0, 51.0, 27.0, 22.0, 33.0, 24.0, 32.0, 27.0, 18.0, 16.0, 19.0, 21.0, 13.0, 16.0, 11.0, 12.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.80078125, -5.60845947265625, -5.4161376953125, -5.22381591796875, -5.031494140625, -4.83917236328125, -4.6468505859375, -4.45452880859375, -4.26220703125, -4.06988525390625, -3.8775634765625, -3.68524169921875, -3.492919921875, -3.30059814453125, -3.1082763671875, -2.91595458984375, -2.7236328125, -2.53131103515625, -2.3389892578125, -2.14666748046875, -1.954345703125, -1.76202392578125, -1.5697021484375, -1.37738037109375, -1.18505859375, -0.99273681640625, -0.8004150390625, -0.60809326171875, -0.415771484375, -0.22344970703125, -0.0311279296875, 0.16119384765625, 0.353515625, 0.54583740234375, 0.7381591796875, 0.93048095703125, 1.122802734375, 1.31512451171875, 1.5074462890625, 1.69976806640625, 1.89208984375, 2.08441162109375, 2.2767333984375, 2.46905517578125, 2.661376953125, 2.85369873046875, 3.0460205078125, 3.23834228515625, 3.4306640625, 3.62298583984375, 3.8153076171875, 4.00762939453125, 4.199951171875, 4.39227294921875, 4.5845947265625, 4.77691650390625, 4.96923828125, 5.16156005859375, 5.3538818359375, 5.54620361328125, 5.738525390625, 5.93084716796875, 6.1231689453125, 6.31549072265625, 6.5078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 14.0, 13.0, 8.0, 15.0, 22.0, 23.0, 32.0, 41.0, 50.0, 54.0, 71.0, 101.0, 155.0, 281.0, 914.0, 9774.0, 843542.0, 3222740.0, 112466.0, 2638.0, 531.0, 191.0, 114.0, 89.0, 68.0, 49.0, 46.0, 29.0, 28.0, 24.0, 16.0, 24.0, 16.0, 15.0, 9.0, 10.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.65625, -18.01904296875, -17.3818359375, -16.74462890625, -16.107421875, -15.47021484375, -14.8330078125, -14.19580078125, -13.55859375, -12.92138671875, -12.2841796875, -11.64697265625, -11.009765625, -10.37255859375, -9.7353515625, -9.09814453125, -8.4609375, -7.82373046875, -7.1865234375, -6.54931640625, -5.912109375, -5.27490234375, -4.6376953125, -4.00048828125, -3.36328125, -2.72607421875, -2.0888671875, -1.45166015625, -0.814453125, -0.17724609375, 0.4599609375, 1.09716796875, 1.734375, 2.37158203125, 3.0087890625, 3.64599609375, 4.283203125, 4.92041015625, 5.5576171875, 6.19482421875, 6.83203125, 7.46923828125, 8.1064453125, 8.74365234375, 9.380859375, 10.01806640625, 10.6552734375, 11.29248046875, 11.9296875, 12.56689453125, 13.2041015625, 13.84130859375, 14.478515625, 15.11572265625, 15.7529296875, 16.39013671875, 17.02734375, 17.66455078125, 18.3017578125, 18.93896484375, 19.576171875, 20.21337890625, 20.8505859375, 21.48779296875, 22.125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 11.0, 9.0, 16.0, 25.0, 26.0, 36.0, 51.0, 47.0, 69.0, 127.0, 131.0, 236.0, 314.0, 411.0, 429.0, 496.0, 403.0, 287.0, 253.0, 181.0, 121.0, 92.0, 72.0, 45.0, 49.0, 29.0, 20.0, 13.0, 12.0, 11.0, 5.0, 5.0, 5.0, 6.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.0489501953125, -8.738525390625, -8.4281005859375, -8.11767578125, -7.8072509765625, -7.496826171875, -7.1864013671875, -6.8759765625, -6.5655517578125, -6.255126953125, -5.9447021484375, -5.63427734375, -5.3238525390625, -5.013427734375, -4.7030029296875, -4.392578125, -4.0821533203125, -3.771728515625, -3.4613037109375, -3.15087890625, -2.8404541015625, -2.530029296875, -2.2196044921875, -1.9091796875, -1.5987548828125, -1.288330078125, -0.9779052734375, -0.66748046875, -0.3570556640625, -0.046630859375, 0.2637939453125, 0.57421875, 0.8846435546875, 1.195068359375, 1.5054931640625, 1.81591796875, 2.1263427734375, 2.436767578125, 2.7471923828125, 3.0576171875, 3.3680419921875, 3.678466796875, 3.9888916015625, 4.29931640625, 4.6097412109375, 4.920166015625, 5.2305908203125, 5.541015625, 5.8514404296875, 6.161865234375, 6.4722900390625, 6.78271484375, 7.0931396484375, 7.403564453125, 7.7139892578125, 8.0244140625, 8.3348388671875, 8.645263671875, 8.9556884765625, 9.26611328125, 9.5765380859375, 9.886962890625, 10.1973876953125, 10.5078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 2.0, 11.0, 13.0, 10.0, 11.0, 17.0, 24.0, 29.0, 44.0, 58.0, 67.0, 71.0, 108.0, 170.0, 196.0, 287.0, 428.0, 807.0, 5192.0, 457244.0, 3694055.0, 31836.0, 1741.0, 589.0, 376.0, 231.0, 159.0, 122.0, 101.0, 64.0, 63.0, 45.0, 24.0, 25.0, 13.0, 11.0, 10.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.2587890625, -30.111328125, -28.9638671875, -27.81640625, -26.6689453125, -25.521484375, -24.3740234375, -23.2265625, -22.0791015625, -20.931640625, -19.7841796875, -18.63671875, -17.4892578125, -16.341796875, -15.1943359375, -14.046875, -12.8994140625, -11.751953125, -10.6044921875, -9.45703125, -8.3095703125, -7.162109375, -6.0146484375, -4.8671875, -3.7197265625, -2.572265625, -1.4248046875, -0.27734375, 0.8701171875, 2.017578125, 3.1650390625, 4.3125, 5.4599609375, 6.607421875, 7.7548828125, 8.90234375, 10.0498046875, 11.197265625, 12.3447265625, 13.4921875, 14.6396484375, 15.787109375, 16.9345703125, 18.08203125, 19.2294921875, 20.376953125, 21.5244140625, 22.671875, 23.8193359375, 24.966796875, 26.1142578125, 27.26171875, 28.4091796875, 29.556640625, 30.7041015625, 31.8515625, 32.9990234375, 34.146484375, 35.2939453125, 36.44140625, 37.5888671875, 38.736328125, 39.8837890625, 41.03125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 31.0, 369.0, 529.0, 78.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.16609954833984, -107.54523468017578, -101.92436981201172, -96.30350494384766, -90.6826400756836, -85.06177520751953, -79.44091033935547, -73.8200454711914, -68.19918060302734, -62.57831573486328, -56.95745086669922, -51.336585998535156, -45.715721130371094, -40.09485626220703, -34.47399139404297, -28.853126525878906, -23.232261657714844, -17.61139678955078, -11.990531921386719, -6.369667053222656, -0.7488021850585938, 4.872062683105469, 10.492927551269531, 16.113792419433594, 21.734657287597656, 27.35552215576172, 32.97638702392578, 38.597251892089844, 44.218116760253906, 49.83898162841797, 55.45984649658203, 61.080711364746094, 66.70156860351562, 72.32243347167969, 77.94329833984375, 83.56416320800781, 89.18502807617188, 94.80589294433594, 100.4267578125, 106.04762268066406, 111.66848754882812, 117.28935241699219, 122.91021728515625, 128.5310821533203, 134.15194702148438, 139.77281188964844, 145.3936767578125, 151.01454162597656, 156.63540649414062, 162.2562713623047, 167.87713623046875, 173.4980010986328, 179.11886596679688, 184.73973083496094, 190.360595703125, 195.98146057128906, 201.60232543945312, 207.2231903076172, 212.84405517578125, 218.4649200439453, 224.08578491210938, 229.70664978027344, 235.3275146484375, 240.94837951660156, 246.56924438476562]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 10.0, 9.0, 12.0, 19.0, 14.0, 20.0, 16.0, 23.0, 31.0, 37.0, 36.0, 29.0, 34.0, 39.0, 49.0, 46.0, 38.0, 38.0, 40.0, 35.0, 36.0, 43.0, 38.0, 28.0, 40.0, 31.0, 26.0, 25.0, 15.0, 22.0, 17.0, 8.0, 19.0, 11.0, 13.0, 6.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.00153732299805, -33.92715072631836, -32.85276412963867, -31.778379440307617, -30.703994750976562, -29.629608154296875, -28.555221557617188, -27.480836868286133, -26.406452178955078, -25.33206558227539, -24.257680892944336, -23.18329429626465, -22.108909606933594, -21.034523010253906, -19.96013641357422, -18.885751724243164, -17.811365127563477, -16.73697853088379, -15.662593841552734, -14.588207244873047, -13.513822555541992, -12.439435958862305, -11.365050315856934, -10.290664672851562, -9.216279029846191, -8.14189338684082, -7.067507743835449, -5.99312162399292, -4.918735980987549, -3.8443503379821777, -2.7699642181396484, -1.6955785751342773, -0.6211929321289062, 0.4531928300857544, 1.527578592300415, 2.6019644737243652, 3.6763501167297363, 4.750735759735107, 5.825121879577637, 6.899507522583008, 7.973893165588379, 9.04827880859375, 10.122664451599121, 11.197050094604492, 12.27143669128418, 13.345821380615234, 14.420207977294922, 15.494593620300293, 16.568979263305664, 17.64336585998535, 18.717750549316406, 19.792137145996094, 20.86652183532715, 21.940908432006836, 23.01529312133789, 24.089679718017578, 25.164066314697266, 26.238452911376953, 27.312837600708008, 28.387224197387695, 29.46160888671875, 30.535995483398438, 31.610382080078125, 32.68476867675781, 33.759151458740234]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 2.0, 10.0, 14.0, 12.0, 17.0, 22.0, 20.0, 33.0, 34.0, 28.0, 40.0, 38.0, 39.0, 51.0, 44.0, 40.0, 37.0, 60.0, 50.0, 37.0, 45.0, 37.0, 29.0, 23.0, 26.0, 19.0, 31.0, 34.0, 21.0, 18.0, 16.0, 14.0, 9.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.17108154296875, -5.9593505859375, -5.74761962890625, -5.535888671875, -5.32415771484375, -5.1124267578125, -4.90069580078125, -4.68896484375, -4.47723388671875, -4.2655029296875, -4.05377197265625, -3.842041015625, -3.63031005859375, -3.4185791015625, -3.20684814453125, -2.9951171875, -2.78338623046875, -2.5716552734375, -2.35992431640625, -2.148193359375, -1.93646240234375, -1.7247314453125, -1.51300048828125, -1.30126953125, -1.08953857421875, -0.8778076171875, -0.66607666015625, -0.454345703125, -0.24261474609375, -0.0308837890625, 0.18084716796875, 0.392578125, 0.60430908203125, 0.8160400390625, 1.02777099609375, 1.239501953125, 1.45123291015625, 1.6629638671875, 1.87469482421875, 2.08642578125, 2.29815673828125, 2.5098876953125, 2.72161865234375, 2.933349609375, 3.14508056640625, 3.3568115234375, 3.56854248046875, 3.7802734375, 3.99200439453125, 4.2037353515625, 4.41546630859375, 4.627197265625, 4.83892822265625, 5.0506591796875, 5.26239013671875, 5.47412109375, 5.68585205078125, 5.8975830078125, 6.10931396484375, 6.321044921875, 6.53277587890625, 6.7445068359375, 6.95623779296875, 7.16796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 9.0, 13.0, 19.0, 26.0, 51.0, 60.0, 104.0, 129.0, 218.0, 303.0, 462.0, 718.0, 1083.0, 1666.0, 2720.0, 4324.0, 7208.0, 11811.0, 19812.0, 34442.0, 62058.0, 124254.0, 358041.0, 210063.0, 91710.0, 48806.0, 27459.0, 15899.0, 9690.0, 5877.0, 3459.0, 2161.0, 1370.0, 859.0, 570.0, 349.0, 253.0, 174.0, 111.0, 79.0, 47.0, 31.0, 24.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.770233154296875, -1.71624755859375, -1.662261962890625, -1.6082763671875, -1.554290771484375, -1.50030517578125, -1.446319580078125, -1.392333984375, -1.338348388671875, -1.28436279296875, -1.230377197265625, -1.1763916015625, -1.122406005859375, -1.06842041015625, -1.014434814453125, -0.96044921875, -0.906463623046875, -0.85247802734375, -0.798492431640625, -0.7445068359375, -0.690521240234375, -0.63653564453125, -0.582550048828125, -0.528564453125, -0.474578857421875, -0.42059326171875, -0.366607666015625, -0.3126220703125, -0.258636474609375, -0.20465087890625, -0.150665283203125, -0.0966796875, -0.042694091796875, 0.01129150390625, 0.065277099609375, 0.1192626953125, 0.173248291015625, 0.22723388671875, 0.281219482421875, 0.335205078125, 0.389190673828125, 0.44317626953125, 0.497161865234375, 0.5511474609375, 0.605133056640625, 0.65911865234375, 0.713104248046875, 0.76708984375, 0.821075439453125, 0.87506103515625, 0.929046630859375, 0.9830322265625, 1.037017822265625, 1.09100341796875, 1.144989013671875, 1.198974609375, 1.252960205078125, 1.30694580078125, 1.360931396484375, 1.4149169921875, 1.468902587890625, 1.52288818359375, 1.576873779296875, 1.630859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 12.0, 14.0, 11.0, 7.0, 10.0, 13.0, 19.0, 13.0, 27.0, 27.0, 25.0, 19.0, 27.0, 28.0, 38.0, 31.0, 44.0, 26.0, 35.0, 32.0, 1054.0, 46.0, 28.0, 36.0, 33.0, 39.0, 33.0, 39.0, 25.0, 32.0, 30.0, 24.0, 20.0, 21.0, 16.0, 10.0, 10.0, 17.0, 9.0, 9.0, 6.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.37890625, -3.26141357421875, -3.1439208984375, -3.02642822265625, -2.908935546875, -2.79144287109375, -2.6739501953125, -2.55645751953125, -2.43896484375, -2.32147216796875, -2.2039794921875, -2.08648681640625, -1.968994140625, -1.85150146484375, -1.7340087890625, -1.61651611328125, -1.4990234375, -1.38153076171875, -1.2640380859375, -1.14654541015625, -1.029052734375, -0.91156005859375, -0.7940673828125, -0.67657470703125, -0.55908203125, -0.44158935546875, -0.3240966796875, -0.20660400390625, -0.089111328125, 0.02838134765625, 0.1458740234375, 0.26336669921875, 0.380859375, 0.49835205078125, 0.6158447265625, 0.73333740234375, 0.850830078125, 0.96832275390625, 1.0858154296875, 1.20330810546875, 1.32080078125, 1.43829345703125, 1.5557861328125, 1.67327880859375, 1.790771484375, 1.90826416015625, 2.0257568359375, 2.14324951171875, 2.2607421875, 2.37823486328125, 2.4957275390625, 2.61322021484375, 2.730712890625, 2.84820556640625, 2.9656982421875, 3.08319091796875, 3.20068359375, 3.31817626953125, 3.4356689453125, 3.55316162109375, 3.670654296875, 3.78814697265625, 3.9056396484375, 4.02313232421875, 4.140625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 1.0, 2.0, 9.0, 20.0, 17.0, 35.0, 23.0, 51.0, 86.0, 118.0, 165.0, 211.0, 378.0, 550.0, 807.0, 1251.0, 1996.0, 3203.0, 4611.0, 7874.0, 12194.0, 19773.0, 32625.0, 55758.0, 97788.0, 203540.0, 1363515.0, 121136.0, 67252.0, 39491.0, 23420.0, 14257.0, 8992.0, 5616.0, 3602.0, 2371.0, 1503.0, 973.0, 633.0, 479.0, 263.0, 172.0, 130.0, 86.0, 41.0, 42.0, 27.0, 22.0, 10.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0], "bins": [-1.6669921875, -1.619598388671875, -1.57220458984375, -1.524810791015625, -1.4774169921875, -1.430023193359375, -1.38262939453125, -1.335235595703125, -1.287841796875, -1.240447998046875, -1.19305419921875, -1.145660400390625, -1.0982666015625, -1.050872802734375, -1.00347900390625, -0.956085205078125, -0.90869140625, -0.861297607421875, -0.81390380859375, -0.766510009765625, -0.7191162109375, -0.671722412109375, -0.62432861328125, -0.576934814453125, -0.529541015625, -0.482147216796875, -0.43475341796875, -0.387359619140625, -0.3399658203125, -0.292572021484375, -0.24517822265625, -0.197784423828125, -0.150390625, -0.102996826171875, -0.05560302734375, -0.008209228515625, 0.0391845703125, 0.086578369140625, 0.13397216796875, 0.181365966796875, 0.228759765625, 0.276153564453125, 0.32354736328125, 0.370941162109375, 0.4183349609375, 0.465728759765625, 0.51312255859375, 0.560516357421875, 0.60791015625, 0.655303955078125, 0.70269775390625, 0.750091552734375, 0.7974853515625, 0.844879150390625, 0.89227294921875, 0.939666748046875, 0.987060546875, 1.034454345703125, 1.08184814453125, 1.129241943359375, 1.1766357421875, 1.224029541015625, 1.27142333984375, 1.318817138671875, 1.3662109375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 3.0, 8.0, 6.0, 5.0, 8.0, 12.0, 15.0, 16.0, 16.0, 11.0, 22.0, 21.0, 26.0, 28.0, 29.0, 39.0, 33.0, 55.0, 68.0, 74.0, 72.0, 55.0, 51.0, 50.0, 39.0, 36.0, 31.0, 31.0, 19.0, 17.0, 16.0, 14.0, 12.0, 8.0, 8.0, 9.0, 7.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0008640289306640625, -0.0008352398872375488, -0.0008064508438110352, -0.0007776618003845215, -0.0007488727569580078, -0.0007200837135314941, -0.0006912946701049805, -0.0006625056266784668, -0.0006337165832519531, -0.0006049275398254395, -0.0005761384963989258, -0.0005473494529724121, -0.0005185604095458984, -0.0004897713661193848, -0.0004609823226928711, -0.0004321932792663574, -0.00040340423583984375, -0.0003746151924133301, -0.0003458261489868164, -0.00031703710556030273, -0.00028824806213378906, -0.0002594590187072754, -0.00023066997528076172, -0.00020188093185424805, -0.00017309188842773438, -0.0001443028450012207, -0.00011551380157470703, -8.672475814819336e-05, -5.793571472167969e-05, -2.9146671295166016e-05, -3.5762786865234375e-07, 2.8431415557861328e-05, 5.7220458984375e-05, 8.600950241088867e-05, 0.00011479854583740234, 0.00014358758926391602, 0.0001723766326904297, 0.00020116567611694336, 0.00022995471954345703, 0.0002587437629699707, 0.0002875328063964844, 0.00031632184982299805, 0.0003451108932495117, 0.0003738999366760254, 0.00040268898010253906, 0.00043147802352905273, 0.0004602670669555664, 0.0004890561103820801, 0.0005178451538085938, 0.0005466341972351074, 0.0005754232406616211, 0.0006042122840881348, 0.0006330013275146484, 0.0006617903709411621, 0.0006905794143676758, 0.0007193684577941895, 0.0007481575012207031, 0.0007769465446472168, 0.0008057355880737305, 0.0008345246315002441, 0.0008633136749267578, 0.0008921027183532715, 0.0009208917617797852, 0.0009496808052062988, 0.0009784698486328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 9.0, 5.0, 6.0, 14.0, 11.0, 19.0, 18.0, 29.0, 34.0, 35.0, 49.0, 68.0, 97.0, 125.0, 213.0, 380.0, 723.0, 7014.0, 1028818.0, 8966.0, 734.0, 373.0, 229.0, 130.0, 88.0, 66.0, 41.0, 42.0, 40.0, 27.0, 27.0, 24.0, 18.0, 16.0, 8.0, 7.0, 15.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0214080810546875, -0.020787954330444336, -0.020167827606201172, -0.019547700881958008, -0.018927574157714844, -0.01830744743347168, -0.017687320709228516, -0.01706719398498535, -0.016447067260742188, -0.015826940536499023, -0.01520681381225586, -0.014586687088012695, -0.013966560363769531, -0.013346433639526367, -0.012726306915283203, -0.012106180191040039, -0.011486053466796875, -0.010865926742553711, -0.010245800018310547, -0.009625673294067383, -0.009005546569824219, -0.008385419845581055, -0.007765293121337891, -0.0071451663970947266, -0.0065250396728515625, -0.0059049129486083984, -0.005284786224365234, -0.00466465950012207, -0.004044532775878906, -0.003424406051635742, -0.002804279327392578, -0.002184152603149414, -0.00156402587890625, -0.0009438991546630859, -0.0003237724304199219, 0.0002963542938232422, 0.0009164810180664062, 0.0015366077423095703, 0.0021567344665527344, 0.0027768611907958984, 0.0033969879150390625, 0.0040171146392822266, 0.004637241363525391, 0.005257368087768555, 0.005877494812011719, 0.006497621536254883, 0.007117748260498047, 0.007737874984741211, 0.008358001708984375, 0.008978128433227539, 0.009598255157470703, 0.010218381881713867, 0.010838508605957031, 0.011458635330200195, 0.01207876205444336, 0.012698888778686523, 0.013319015502929688, 0.013939142227172852, 0.014559268951416016, 0.01517939567565918, 0.015799522399902344, 0.016419649124145508, 0.017039775848388672, 0.017659902572631836, 0.018280029296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 24.0, 444.0, 523.0, 23.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001531265559606254, -0.0014137448742985725, -0.0012962243054062128, -0.0011787036200985312, -0.0010611829347908497, -0.0009436622494831681, -0.0008261416223831475, -0.0007086209952831268, -0.0005911003099754453, -0.00047357965377159417, -0.00035605899756774306, -0.00023853834136389196, -0.00012101768516004086, -3.496999852359295e-06, 0.00011402362724766135, 0.000231544254347682, 0.00034906493965536356, 0.00046658559585921466, 0.0005841062520630658, 0.0007016268791630864, 0.000819147564470768, 0.0009366682497784495, 0.001054188935086131, 0.0011717095039784908, 0.0012892301892861724, 0.001406750874593854, 0.0015242714434862137, 0.0016417921287938952, 0.0017593128141015768, 0.0018768334994092584, 0.00199435418471694, 0.0021118747536092997, 0.0022293953225016594, 0.002346915891394019, 0.0024644366931170225, 0.0025819572620093822, 0.0026994780637323856, 0.0028169986326247454, 0.002934519201517105, 0.0030520400032401085, 0.0031695605721324682, 0.003287081141024828, 0.0034046019427478313, 0.003522122511640191, 0.003639643080532551, 0.003757163882255554, 0.003874684451147914, 0.003992205020040274, 0.004109725821763277, 0.0042272466234862804, 0.0043447669595479965, 0.004462287761271, 0.004579808562994003, 0.004697329364717007, 0.004814849700778723, 0.004932370502501726, 0.005049890838563442, 0.005167411640286446, 0.005284931976348162, 0.005402452778071165, 0.0055199735797941685, 0.0056374939158558846, 0.005755014717578888, 0.005872535519301891, 0.005990056321024895]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 5.0, 10.0, 5.0, 8.0, 6.0, 11.0, 10.0, 10.0, 14.0, 17.0, 22.0, 26.0, 22.0, 21.0, 35.0, 27.0, 34.0, 36.0, 29.0, 42.0, 44.0, 43.0, 41.0, 45.0, 49.0, 26.0, 48.0, 37.0, 38.0, 29.0, 25.0, 30.0, 19.0, 21.0, 20.0, 22.0, 12.0, 12.0, 9.0, 10.0, 7.0, 8.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 5.0, 3.0], "bins": [-0.0005950927734375, -0.000578789971768856, -0.0005624871701002121, -0.0005461843684315681, -0.0005298815667629242, -0.0005135787650942802, -0.0004972759634256363, -0.00048097316175699234, -0.0004646703600883484, -0.00044836755841970444, -0.0004320647567510605, -0.00041576195508241653, -0.0003994591534137726, -0.00038315635174512863, -0.0003668535500764847, -0.00035055074840784073, -0.0003342479467391968, -0.0003179451450705528, -0.0003016423434019089, -0.0002853395417332649, -0.00026903674006462097, -0.000252733938395977, -0.00023643113672733307, -0.00022012833505868912, -0.00020382553339004517, -0.00018752273172140121, -0.00017121993005275726, -0.0001549171283841133, -0.00013861432671546936, -0.0001223115250468254, -0.00010600872337818146, -8.97059217095375e-05, -7.340312004089355e-05, -5.71003183722496e-05, -4.079751670360565e-05, -2.44947150349617e-05, -8.191913366317749e-06, 8.110888302326202e-06, 2.4413689970970154e-05, 4.0716491639614105e-05, 5.701929330825806e-05, 7.332209497690201e-05, 8.962489664554596e-05, 0.00010592769831418991, 0.00012223049998283386, 0.00013853330165147781, 0.00015483610332012177, 0.00017113890498876572, 0.00018744170665740967, 0.00020374450832605362, 0.00022004730999469757, 0.00023635011166334152, 0.0002526529133319855, 0.0002689557150006294, 0.0002852585166692734, 0.00030156131833791733, 0.0003178641200065613, 0.00033416692167520523, 0.0003504697233438492, 0.00036677252501249313, 0.0003830753266811371, 0.00039937812834978104, 0.000415680930018425, 0.00043198373168706894, 0.0004482865333557129]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 2.0, 10.0, 14.0, 12.0, 17.0, 22.0, 20.0, 33.0, 34.0, 28.0, 40.0, 38.0, 39.0, 51.0, 44.0, 40.0, 37.0, 60.0, 50.0, 37.0, 45.0, 37.0, 29.0, 23.0, 26.0, 19.0, 31.0, 34.0, 21.0, 18.0, 16.0, 14.0, 9.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.17108154296875, -5.9593505859375, -5.74761962890625, -5.535888671875, -5.32415771484375, -5.1124267578125, -4.90069580078125, -4.68896484375, -4.47723388671875, -4.2655029296875, -4.05377197265625, -3.842041015625, -3.63031005859375, -3.4185791015625, -3.20684814453125, -2.9951171875, -2.78338623046875, -2.5716552734375, -2.35992431640625, -2.148193359375, -1.93646240234375, -1.7247314453125, -1.51300048828125, -1.30126953125, -1.08953857421875, -0.8778076171875, -0.66607666015625, -0.454345703125, -0.24261474609375, -0.0308837890625, 0.18084716796875, 0.392578125, 0.60430908203125, 0.8160400390625, 1.02777099609375, 1.239501953125, 1.45123291015625, 1.6629638671875, 1.87469482421875, 2.08642578125, 2.29815673828125, 2.5098876953125, 2.72161865234375, 2.933349609375, 3.14508056640625, 3.3568115234375, 3.56854248046875, 3.7802734375, 3.99200439453125, 4.2037353515625, 4.41546630859375, 4.627197265625, 4.83892822265625, 5.0506591796875, 5.26239013671875, 5.47412109375, 5.68585205078125, 5.8975830078125, 6.10931396484375, 6.321044921875, 6.53277587890625, 6.7445068359375, 6.95623779296875, 7.16796875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 12.0, 14.0, 17.0, 25.0, 27.0, 42.0, 67.0, 98.0, 111.0, 175.0, 234.0, 410.0, 800.0, 2271.0, 10916.0, 69620.0, 528707.0, 376957.0, 46629.0, 7834.0, 1683.0, 696.0, 381.0, 209.0, 165.0, 114.0, 78.0, 62.0, 44.0, 32.0, 29.0, 20.0, 18.0, 15.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.4609375, -11.07763671875, -10.6943359375, -10.31103515625, -9.927734375, -9.54443359375, -9.1611328125, -8.77783203125, -8.39453125, -8.01123046875, -7.6279296875, -7.24462890625, -6.861328125, -6.47802734375, -6.0947265625, -5.71142578125, -5.328125, -4.94482421875, -4.5615234375, -4.17822265625, -3.794921875, -3.41162109375, -3.0283203125, -2.64501953125, -2.26171875, -1.87841796875, -1.4951171875, -1.11181640625, -0.728515625, -0.34521484375, 0.0380859375, 0.42138671875, 0.8046875, 1.18798828125, 1.5712890625, 1.95458984375, 2.337890625, 2.72119140625, 3.1044921875, 3.48779296875, 3.87109375, 4.25439453125, 4.6376953125, 5.02099609375, 5.404296875, 5.78759765625, 6.1708984375, 6.55419921875, 6.9375, 7.32080078125, 7.7041015625, 8.08740234375, 8.470703125, 8.85400390625, 9.2373046875, 9.62060546875, 10.00390625, 10.38720703125, 10.7705078125, 11.15380859375, 11.537109375, 11.92041015625, 12.3037109375, 12.68701171875, 13.0703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 7.0, 8.0, 20.0, 12.0, 13.0, 24.0, 18.0, 29.0, 31.0, 33.0, 41.0, 41.0, 42.0, 56.0, 67.0, 117.0, 251.0, 1464.0, 209.0, 77.0, 72.0, 50.0, 47.0, 44.0, 34.0, 26.0, 32.0, 23.0, 29.0, 19.0, 13.0, 13.0, 12.0, 8.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.65625, -20.01953125, -19.3828125, -18.74609375, -18.109375, -17.47265625, -16.8359375, -16.19921875, -15.5625, -14.92578125, -14.2890625, -13.65234375, -13.015625, -12.37890625, -11.7421875, -11.10546875, -10.46875, -9.83203125, -9.1953125, -8.55859375, -7.921875, -7.28515625, -6.6484375, -6.01171875, -5.375, -4.73828125, -4.1015625, -3.46484375, -2.828125, -2.19140625, -1.5546875, -0.91796875, -0.28125, 0.35546875, 0.9921875, 1.62890625, 2.265625, 2.90234375, 3.5390625, 4.17578125, 4.8125, 5.44921875, 6.0859375, 6.72265625, 7.359375, 7.99609375, 8.6328125, 9.26953125, 9.90625, 10.54296875, 11.1796875, 11.81640625, 12.453125, 13.08984375, 13.7265625, 14.36328125, 15.0, 15.63671875, 16.2734375, 16.91015625, 17.546875, 18.18359375, 18.8203125, 19.45703125, 20.09375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 13.0, 10.0, 25.0, 28.0, 53.0, 70.0, 92.0, 189.0, 329.0, 1022.0, 24863.0, 3114130.0, 3589.0, 592.0, 268.0, 137.0, 105.0, 66.0, 40.0, 22.0, 20.0, 9.0, 12.0, 6.0, 9.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.2802734375, -63.435546875, -60.5908203125, -57.74609375, -54.9013671875, -52.056640625, -49.2119140625, -46.3671875, -43.5224609375, -40.677734375, -37.8330078125, -34.98828125, -32.1435546875, -29.298828125, -26.4541015625, -23.609375, -20.7646484375, -17.919921875, -15.0751953125, -12.23046875, -9.3857421875, -6.541015625, -3.6962890625, -0.8515625, 1.9931640625, 4.837890625, 7.6826171875, 10.52734375, 13.3720703125, 16.216796875, 19.0615234375, 21.90625, 24.7509765625, 27.595703125, 30.4404296875, 33.28515625, 36.1298828125, 38.974609375, 41.8193359375, 44.6640625, 47.5087890625, 50.353515625, 53.1982421875, 56.04296875, 58.8876953125, 61.732421875, 64.5771484375, 67.421875, 70.2666015625, 73.111328125, 75.9560546875, 78.80078125, 81.6455078125, 84.490234375, 87.3349609375, 90.1796875, 93.0244140625, 95.869140625, 98.7138671875, 101.55859375, 104.4033203125, 107.248046875, 110.0927734375, 112.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 832.0, 183.0], "bins": [-853.7847290039062, -840.1876831054688, -826.590576171875, -812.9935302734375, -799.3964233398438, -785.7993774414062, -772.2022705078125, -758.605224609375, -745.0081176757812, -731.4110717773438, -717.81396484375, -704.2169189453125, -690.6198120117188, -677.0227661132812, -663.4256591796875, -649.82861328125, -636.2315063476562, -622.6344604492188, -609.037353515625, -595.4403076171875, -581.8432006835938, -568.2461547851562, -554.6490478515625, -541.052001953125, -527.4548950195312, -513.8578491210938, -500.2607421875, -486.6636657714844, -473.06658935546875, -459.4695129394531, -445.8724365234375, -432.2753601074219, -418.6783142089844, -405.08123779296875, -391.4841613769531, -377.8870849609375, -364.2900085449219, -350.69293212890625, -337.0958557128906, -323.498779296875, -309.9017028808594, -296.30462646484375, -282.7075500488281, -269.1104736328125, -255.51339721679688, -241.91632080078125, -228.31924438476562, -214.72216796875, -201.12510681152344, -187.5280303955078, -173.9309539794922, -160.33387756347656, -146.73680114746094, -133.13973999023438, -119.54265594482422, -105.9455795288086, -92.34849548339844, -78.75141906738281, -65.15434265136719, -51.55727005004883, -37.9601936340332, -24.363121032714844, -10.766044616699219, 2.8310317993164062, 16.4281063079834]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 7.0, 12.0, 10.0, 17.0, 19.0, 21.0, 16.0, 25.0, 16.0, 40.0, 31.0, 22.0, 26.0, 36.0, 40.0, 31.0, 30.0, 44.0, 37.0, 32.0, 32.0, 31.0, 37.0, 38.0, 38.0, 24.0, 38.0, 27.0, 23.0, 24.0, 22.0, 22.0, 17.0, 20.0, 16.0, 11.0, 12.0, 9.0, 7.0, 12.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-53.73471450805664, -52.15325164794922, -50.57178497314453, -48.99032211303711, -47.40885925292969, -45.827396392822266, -44.245933532714844, -42.664466857910156, -41.083003997802734, -39.50154113769531, -37.920074462890625, -36.3386116027832, -34.75714874267578, -33.17568588256836, -31.594221115112305, -30.01275634765625, -28.431293487548828, -26.849830627441406, -25.26836585998535, -23.686901092529297, -22.105438232421875, -20.523975372314453, -18.9425106048584, -17.361045837402344, -15.779582977294922, -14.198119163513184, -12.616655349731445, -11.035191535949707, -9.453727722167969, -7.8722639083862305, -6.290800094604492, -4.709336280822754, -3.1278762817382812, -1.546412467956543, 0.03505134582519531, 1.6165151596069336, 3.197978973388672, 4.77944278717041, 6.360906600952148, 7.942370414733887, 9.523834228515625, 11.105298042297363, 12.686761856079102, 14.26822566986084, 15.849689483642578, 17.43115234375, 19.012617111206055, 20.59408187866211, 22.17554473876953, 23.757007598876953, 25.338472366333008, 26.919937133789062, 28.501399993896484, 30.082862854003906, 31.66432762145996, 33.245792388916016, 34.82725524902344, 36.40871810913086, 37.99018096923828, 39.57164764404297, 41.15311050415039, 42.73457336425781, 44.3160400390625, 45.89750289916992, 47.478965759277344]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 9.0, 8.0, 9.0, 13.0, 12.0, 12.0, 13.0, 19.0, 20.0, 34.0, 33.0, 33.0, 29.0, 42.0, 35.0, 61.0, 42.0, 43.0, 47.0, 41.0, 38.0, 34.0, 36.0, 33.0, 38.0, 35.0, 25.0, 27.0, 37.0, 18.0, 18.0, 22.0, 15.0, 13.0, 11.0, 11.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.7279052734375, -6.487060546875, -6.2462158203125, -6.00537109375, -5.7645263671875, -5.523681640625, -5.2828369140625, -5.0419921875, -4.8011474609375, -4.560302734375, -4.3194580078125, -4.07861328125, -3.8377685546875, -3.596923828125, -3.3560791015625, -3.115234375, -2.8743896484375, -2.633544921875, -2.3927001953125, -2.15185546875, -1.9110107421875, -1.670166015625, -1.4293212890625, -1.1884765625, -0.9476318359375, -0.706787109375, -0.4659423828125, -0.22509765625, 0.0157470703125, 0.256591796875, 0.4974365234375, 0.73828125, 0.9791259765625, 1.219970703125, 1.4608154296875, 1.70166015625, 1.9425048828125, 2.183349609375, 2.4241943359375, 2.6650390625, 2.9058837890625, 3.146728515625, 3.3875732421875, 3.62841796875, 3.8692626953125, 4.110107421875, 4.3509521484375, 4.591796875, 4.8326416015625, 5.073486328125, 5.3143310546875, 5.55517578125, 5.7960205078125, 6.036865234375, 6.2777099609375, 6.5185546875, 6.7593994140625, 7.000244140625, 7.2410888671875, 7.48193359375, 7.7227783203125, 7.963623046875, 8.2044677734375, 8.4453125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 8.0, 9.0, 3.0, 12.0, 8.0, 8.0, 14.0, 15.0, 27.0, 23.0, 37.0, 53.0, 47.0, 67.0, 86.0, 166.0, 336.0, 784.0, 5017.0, 211689.0, 3032186.0, 924522.0, 16591.0, 1428.0, 436.0, 209.0, 108.0, 82.0, 55.0, 52.0, 42.0, 37.0, 25.0, 9.0, 21.0, 10.0, 18.0, 11.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.328125, -16.724365234375, -16.12060546875, -15.516845703125, -14.9130859375, -14.309326171875, -13.70556640625, -13.101806640625, -12.498046875, -11.894287109375, -11.29052734375, -10.686767578125, -10.0830078125, -9.479248046875, -8.87548828125, -8.271728515625, -7.66796875, -7.064208984375, -6.46044921875, -5.856689453125, -5.2529296875, -4.649169921875, -4.04541015625, -3.441650390625, -2.837890625, -2.234130859375, -1.63037109375, -1.026611328125, -0.4228515625, 0.180908203125, 0.78466796875, 1.388427734375, 1.9921875, 2.595947265625, 3.19970703125, 3.803466796875, 4.4072265625, 5.010986328125, 5.61474609375, 6.218505859375, 6.822265625, 7.426025390625, 8.02978515625, 8.633544921875, 9.2373046875, 9.841064453125, 10.44482421875, 11.048583984375, 11.65234375, 12.256103515625, 12.85986328125, 13.463623046875, 14.0673828125, 14.671142578125, 15.27490234375, 15.878662109375, 16.482421875, 17.086181640625, 17.68994140625, 18.293701171875, 18.8974609375, 19.501220703125, 20.10498046875, 20.708740234375, 21.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 5.0, 13.0, 5.0, 13.0, 20.0, 22.0, 34.0, 49.0, 100.0, 155.0, 282.0, 427.0, 652.0, 781.0, 614.0, 378.0, 198.0, 127.0, 70.0, 51.0, 28.0, 20.0, 8.0, 2.0, 2.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.42578125, -12.8984375, -12.37109375, -11.84375, -11.31640625, -10.7890625, -10.26171875, -9.734375, -9.20703125, -8.6796875, -8.15234375, -7.625, -7.09765625, -6.5703125, -6.04296875, -5.515625, -4.98828125, -4.4609375, -3.93359375, -3.40625, -2.87890625, -2.3515625, -1.82421875, -1.296875, -0.76953125, -0.2421875, 0.28515625, 0.8125, 1.33984375, 1.8671875, 2.39453125, 2.921875, 3.44921875, 3.9765625, 4.50390625, 5.03125, 5.55859375, 6.0859375, 6.61328125, 7.140625, 7.66796875, 8.1953125, 8.72265625, 9.25, 9.77734375, 10.3046875, 10.83203125, 11.359375, 11.88671875, 12.4140625, 12.94140625, 13.46875, 13.99609375, 14.5234375, 15.05078125, 15.578125, 16.10546875, 16.6328125, 17.16015625, 17.6875, 18.21484375, 18.7421875, 19.26953125, 19.796875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 10.0, 11.0, 11.0, 19.0, 35.0, 54.0, 64.0, 105.0, 164.0, 252.0, 404.0, 907.0, 3942.0, 162808.0, 3978742.0, 42402.0, 2465.0, 812.0, 397.0, 231.0, 145.0, 86.0, 68.0, 35.0, 31.0, 27.0, 16.0, 17.0, 6.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-49.46875, -48.1796875, -46.890625, -45.6015625, -44.3125, -43.0234375, -41.734375, -40.4453125, -39.15625, -37.8671875, -36.578125, -35.2890625, -34.0, -32.7109375, -31.421875, -30.1328125, -28.84375, -27.5546875, -26.265625, -24.9765625, -23.6875, -22.3984375, -21.109375, -19.8203125, -18.53125, -17.2421875, -15.953125, -14.6640625, -13.375, -12.0859375, -10.796875, -9.5078125, -8.21875, -6.9296875, -5.640625, -4.3515625, -3.0625, -1.7734375, -0.484375, 0.8046875, 2.09375, 3.3828125, 4.671875, 5.9609375, 7.25, 8.5390625, 9.828125, 11.1171875, 12.40625, 13.6953125, 14.984375, 16.2734375, 17.5625, 18.8515625, 20.140625, 21.4296875, 22.71875, 24.0078125, 25.296875, 26.5859375, 27.875, 29.1640625, 30.453125, 31.7421875, 33.03125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 15.0, 64.0, 180.0, 316.0, 280.0, 116.0, 28.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.09215545654297, -77.01634216308594, -73.9405288696289, -70.86471557617188, -67.78890228271484, -64.71308898925781, -61.63727569580078, -58.56146240234375, -55.48564910888672, -52.40983581542969, -49.334022521972656, -46.258209228515625, -43.182395935058594, -40.10658264160156, -37.03076934814453, -33.9549560546875, -30.879138946533203, -27.803325653076172, -24.72751235961914, -21.65169906616211, -18.575885772705078, -15.50007152557373, -12.424257278442383, -9.348443984985352, -6.27263069152832, -3.19681715965271, -0.12100362777709961, 2.95481014251709, 6.030623435974121, 9.106436729431152, 12.1822509765625, 15.258064270019531, 18.333877563476562, 21.409690856933594, 24.485504150390625, 27.561317443847656, 30.637130737304688, 33.71294403076172, 36.78875732421875, 39.86457061767578, 42.94038391113281, 46.016197204589844, 49.092010498046875, 52.167823791503906, 55.24363708496094, 58.31945037841797, 61.395263671875, 64.47107696533203, 67.54689025878906, 70.6227035522461, 73.69851684570312, 76.77433013916016, 79.85014343261719, 82.92595672607422, 86.00177001953125, 89.07758331298828, 92.15340423583984, 95.22921752929688, 98.3050308227539, 101.38084411621094, 104.45665740966797, 107.532470703125, 110.60828399658203, 113.68409729003906, 116.7599105834961]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 6.0, 16.0, 11.0, 12.0, 13.0, 20.0, 15.0, 18.0, 23.0, 29.0, 23.0, 27.0, 26.0, 29.0, 29.0, 36.0, 32.0, 30.0, 36.0, 31.0, 41.0, 44.0, 37.0, 47.0, 29.0, 27.0, 32.0, 23.0, 30.0, 33.0, 25.0, 11.0, 16.0, 18.0, 13.0, 14.0, 14.0, 12.0, 18.0, 5.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-33.84520721435547, -32.7781982421875, -31.711193084716797, -30.64418601989746, -29.577178955078125, -28.510169982910156, -27.44316291809082, -26.376155853271484, -25.30914878845215, -24.242141723632812, -23.175134658813477, -22.10812759399414, -21.041118621826172, -19.97411346435547, -18.9071044921875, -17.840097427368164, -16.773090362548828, -15.706083297729492, -14.639076232910156, -13.572068214416504, -12.505061149597168, -11.438054084777832, -10.37104606628418, -9.304039001464844, -8.237031936645508, -7.170024871826172, -6.103017330169678, -5.036009788513184, -3.9690027236938477, -2.9019956588745117, -1.8349881172180176, -0.7679805755615234, 0.2990264892578125, 1.3660337924957275, 2.4330410957336426, 3.5000483989715576, 4.567055702209473, 5.634062767028809, 6.701070308685303, 7.768077850341797, 8.835084915161133, 9.902091979980469, 10.969099044799805, 12.036107063293457, 13.103114128112793, 14.170121192932129, 15.237129211425781, 16.304136276245117, 17.371143341064453, 18.43815040588379, 19.505157470703125, 20.57216453552246, 21.639171600341797, 22.706180572509766, 23.7731876373291, 24.840194702148438, 25.907201766967773, 26.97420883178711, 28.041215896606445, 29.10822296142578, 30.17523193359375, 31.242237091064453, 32.30924606323242, 33.376251220703125, 34.443260192871094]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 5.0, 3.0, 10.0, 9.0, 11.0, 10.0, 14.0, 25.0, 19.0, 21.0, 34.0, 26.0, 29.0, 40.0, 40.0, 37.0, 46.0, 39.0, 49.0, 45.0, 47.0, 39.0, 32.0, 39.0, 40.0, 44.0, 31.0, 30.0, 21.0, 31.0, 19.0, 14.0, 12.0, 16.0, 12.0, 10.0, 8.0, 7.0, 4.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.65362548828125, -6.4283447265625, -6.20306396484375, -5.977783203125, -5.75250244140625, -5.5272216796875, -5.30194091796875, -5.07666015625, -4.85137939453125, -4.6260986328125, -4.40081787109375, -4.175537109375, -3.95025634765625, -3.7249755859375, -3.49969482421875, -3.2744140625, -3.04913330078125, -2.8238525390625, -2.59857177734375, -2.373291015625, -2.14801025390625, -1.9227294921875, -1.69744873046875, -1.47216796875, -1.24688720703125, -1.0216064453125, -0.79632568359375, -0.571044921875, -0.34576416015625, -0.1204833984375, 0.10479736328125, 0.330078125, 0.55535888671875, 0.7806396484375, 1.00592041015625, 1.231201171875, 1.45648193359375, 1.6817626953125, 1.90704345703125, 2.13232421875, 2.35760498046875, 2.5828857421875, 2.80816650390625, 3.033447265625, 3.25872802734375, 3.4840087890625, 3.70928955078125, 3.9345703125, 4.15985107421875, 4.3851318359375, 4.61041259765625, 4.835693359375, 5.06097412109375, 5.2862548828125, 5.51153564453125, 5.73681640625, 5.96209716796875, 6.1873779296875, 6.41265869140625, 6.637939453125, 6.86322021484375, 7.0885009765625, 7.31378173828125, 7.5390625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 6.0, 19.0, 22.0, 40.0, 48.0, 53.0, 100.0, 149.0, 222.0, 289.0, 460.0, 577.0, 830.0, 1290.0, 1873.0, 2711.0, 4038.0, 6106.0, 9394.0, 14479.0, 22790.0, 37032.0, 62544.0, 110818.0, 286686.0, 232479.0, 100364.0, 57500.0, 34466.0, 21193.0, 13511.0, 8692.0, 5794.0, 3610.0, 2679.0, 1766.0, 1182.0, 811.0, 593.0, 405.0, 285.0, 203.0, 142.0, 96.0, 75.0, 41.0, 31.0, 18.0, 15.0, 14.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.6396484375, -1.58984375, -1.5400390625, -1.490234375, -1.4404296875, -1.390625, -1.3408203125, -1.291015625, -1.2412109375, -1.19140625, -1.1416015625, -1.091796875, -1.0419921875, -0.9921875, -0.9423828125, -0.892578125, -0.8427734375, -0.79296875, -0.7431640625, -0.693359375, -0.6435546875, -0.59375, -0.5439453125, -0.494140625, -0.4443359375, -0.39453125, -0.3447265625, -0.294921875, -0.2451171875, -0.1953125, -0.1455078125, -0.095703125, -0.0458984375, 0.00390625, 0.0537109375, 0.103515625, 0.1533203125, 0.203125, 0.2529296875, 0.302734375, 0.3525390625, 0.40234375, 0.4521484375, 0.501953125, 0.5517578125, 0.6015625, 0.6513671875, 0.701171875, 0.7509765625, 0.80078125, 0.8505859375, 0.900390625, 0.9501953125, 1.0, 1.0498046875, 1.099609375, 1.1494140625, 1.19921875, 1.2490234375, 1.298828125, 1.3486328125, 1.3984375, 1.4482421875, 1.498046875, 1.5478515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 0.0, 7.0, 9.0, 9.0, 18.0, 14.0, 16.0, 23.0, 14.0, 25.0, 24.0, 40.0, 36.0, 25.0, 29.0, 46.0, 40.0, 36.0, 35.0, 465.0, 642.0, 34.0, 40.0, 39.0, 46.0, 37.0, 23.0, 31.0, 32.0, 30.0, 29.0, 16.0, 16.0, 14.0, 21.0, 14.0, 6.0, 5.0, 6.0, 5.0, 5.0, 7.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-4.921875, -4.78125, -4.640625, -4.5, -4.359375, -4.21875, -4.078125, -3.9375, -3.796875, -3.65625, -3.515625, -3.375, -3.234375, -3.09375, -2.953125, -2.8125, -2.671875, -2.53125, -2.390625, -2.25, -2.109375, -1.96875, -1.828125, -1.6875, -1.546875, -1.40625, -1.265625, -1.125, -0.984375, -0.84375, -0.703125, -0.5625, -0.421875, -0.28125, -0.140625, 0.0, 0.140625, 0.28125, 0.421875, 0.5625, 0.703125, 0.84375, 0.984375, 1.125, 1.265625, 1.40625, 1.546875, 1.6875, 1.828125, 1.96875, 2.109375, 2.25, 2.390625, 2.53125, 2.671875, 2.8125, 2.953125, 3.09375, 3.234375, 3.375, 3.515625, 3.65625, 3.796875, 3.9375, 4.078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 2.0, 6.0, 2.0, 8.0, 17.0, 20.0, 38.0, 28.0, 76.0, 121.0, 125.0, 229.0, 293.0, 467.0, 664.0, 1007.0, 1517.0, 2360.0, 3930.0, 6286.0, 10223.0, 17186.0, 29913.0, 52129.0, 95758.0, 210445.0, 1389428.0, 121070.0, 64517.0, 35947.0, 20697.0, 12346.0, 7352.0, 4636.0, 2893.0, 1878.0, 1211.0, 789.0, 554.0, 324.0, 194.0, 128.0, 90.0, 83.0, 40.0, 31.0, 24.0, 17.0, 12.0, 12.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.66015625, -1.6032562255859375, -1.546356201171875, -1.4894561767578125, -1.43255615234375, -1.3756561279296875, -1.318756103515625, -1.2618560791015625, -1.2049560546875, -1.1480560302734375, -1.091156005859375, -1.0342559814453125, -0.97735595703125, -0.9204559326171875, -0.863555908203125, -0.8066558837890625, -0.749755859375, -0.6928558349609375, -0.635955810546875, -0.5790557861328125, -0.52215576171875, -0.4652557373046875, -0.408355712890625, -0.3514556884765625, -0.2945556640625, -0.2376556396484375, -0.180755615234375, -0.1238555908203125, -0.06695556640625, -0.0100555419921875, 0.046844482421875, 0.1037445068359375, 0.16064453125, 0.2175445556640625, 0.274444580078125, 0.3313446044921875, 0.38824462890625, 0.4451446533203125, 0.502044677734375, 0.5589447021484375, 0.6158447265625, 0.6727447509765625, 0.729644775390625, 0.7865447998046875, 0.84344482421875, 0.9003448486328125, 0.957244873046875, 1.0141448974609375, 1.071044921875, 1.1279449462890625, 1.184844970703125, 1.2417449951171875, 1.29864501953125, 1.3555450439453125, 1.412445068359375, 1.4693450927734375, 1.5262451171875, 1.5831451416015625, 1.640045166015625, 1.6969451904296875, 1.75384521484375, 1.8107452392578125, 1.867645263671875, 1.9245452880859375, 1.9814453125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 12.0, 12.0, 15.0, 21.0, 14.0, 15.0, 32.0, 43.0, 50.0, 96.0, 125.0, 131.0, 108.0, 96.0, 50.0, 48.0, 29.0, 24.0, 19.0, 9.0, 12.0, 11.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016145706176757812, -0.0015532523393630981, -0.001491934061050415, -0.001430615782737732, -0.0013692975044250488, -0.0013079792261123657, -0.0012466609477996826, -0.0011853426694869995, -0.0011240243911743164, -0.0010627061128616333, -0.0010013878345489502, -0.0009400695562362671, -0.000878751277923584, -0.0008174329996109009, -0.0007561147212982178, -0.0006947964429855347, -0.0006334781646728516, -0.0005721598863601685, -0.0005108416080474854, -0.00044952332973480225, -0.00038820505142211914, -0.00032688677310943604, -0.00026556849479675293, -0.00020425021648406982, -0.00014293193817138672, -8.161365985870361e-05, -2.0295381546020508e-05, 4.10228967666626e-05, 0.0001023411750793457, 0.0001636594533920288, 0.00022497773170471191, 0.000286296010017395, 0.0003476142883300781, 0.00040893256664276123, 0.00047025084495544434, 0.0005315691232681274, 0.0005928874015808105, 0.0006542056798934937, 0.0007155239582061768, 0.0007768422365188599, 0.000838160514831543, 0.0008994787931442261, 0.0009607970714569092, 0.0010221153497695923, 0.0010834336280822754, 0.0011447519063949585, 0.0012060701847076416, 0.0012673884630203247, 0.0013287067413330078, 0.001390025019645691, 0.001451343297958374, 0.0015126615762710571, 0.0015739798545837402, 0.0016352981328964233, 0.0016966164112091064, 0.0017579346895217896, 0.0018192529678344727, 0.0018805712461471558, 0.0019418895244598389, 0.002003207802772522, 0.002064526081085205, 0.002125844359397888, 0.0021871626377105713, 0.0022484809160232544, 0.0023097991943359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 1.0, 3.0, 11.0, 10.0, 15.0, 19.0, 32.0, 43.0, 54.0, 94.0, 170.0, 306.0, 672.0, 8698.0, 1035797.0, 1539.0, 470.0, 238.0, 109.0, 62.0, 42.0, 39.0, 38.0, 25.0, 22.0, 11.0, 13.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.046722412109375, -0.045502662658691406, -0.04428291320800781, -0.04306316375732422, -0.041843414306640625, -0.04062366485595703, -0.03940391540527344, -0.038184165954589844, -0.03696441650390625, -0.035744667053222656, -0.03452491760253906, -0.03330516815185547, -0.032085418701171875, -0.03086566925048828, -0.029645919799804688, -0.028426170349121094, -0.0272064208984375, -0.025986671447753906, -0.024766921997070312, -0.02354717254638672, -0.022327423095703125, -0.02110767364501953, -0.019887924194335938, -0.018668174743652344, -0.01744842529296875, -0.016228675842285156, -0.015008926391601562, -0.013789176940917969, -0.012569427490234375, -0.011349678039550781, -0.010129928588867188, -0.008910179138183594, -0.0076904296875, -0.006470680236816406, -0.0052509307861328125, -0.004031181335449219, -0.002811431884765625, -0.0015916824340820312, -0.0003719329833984375, 0.0008478164672851562, 0.00206756591796875, 0.0032873153686523438, 0.0045070648193359375, 0.005726814270019531, 0.006946563720703125, 0.008166313171386719, 0.009386062622070312, 0.010605812072753906, 0.0118255615234375, 0.013045310974121094, 0.014265060424804688, 0.015484809875488281, 0.016704559326171875, 0.01792430877685547, 0.019144058227539062, 0.020363807678222656, 0.02158355712890625, 0.022803306579589844, 0.024023056030273438, 0.02524280548095703, 0.026462554931640625, 0.02768230438232422, 0.028902053833007812, 0.030121803283691406, 0.031341552734375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 96.0, 387.0, 414.0, 95.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0034516933374106884, -0.003369476180523634, -0.003287258790805936, -0.0032050416339188814, -0.003122824477031827, -0.003040607087314129, -0.0029583899304270744, -0.00287617277354002, -0.0027939556166529655, -0.002711738459765911, -0.002629521070048213, -0.0025473039131611586, -0.002465086756274104, -0.002382869366556406, -0.0023006522096693516, -0.002218435052782297, -0.002136217663064599, -0.0020540005061775446, -0.0019717831164598465, -0.001889565959572792, -0.0018073488026857376, -0.0017251315293833613, -0.001642914256080985, -0.0015606970991939306, -0.0014784798258915544, -0.001396262552589178, -0.0013140453957021236, -0.0012318281223997474, -0.001149610849097371, -0.0010673936922103167, -0.0009851764189079404, -0.000902959203813225, -0.000820741755887866, -0.0007385245407931507, -0.0006563073256984353, -0.000574090052396059, -0.0004918728373013437, -0.0004096556222066283, -0.00032743834890425205, -0.0002452211338095367, -0.00016300391871482134, -8.078668906819075e-05, 1.4305405784398317e-06, 8.364778477698565e-05, 0.000165864999871701, 0.00024808221496641636, 0.00033029948826879263, 0.000412516703363508, 0.0004947339184582233, 0.0005769511335529387, 0.0006591683486476541, 0.0007413856219500303, 0.0008236028370447457, 0.000905820052139461, 0.0009880373254418373, 0.0010702544823288918, 0.001152471755631268, 0.0012346890289336443, 0.0013169061858206987, 0.001399123459123075, 0.0014813407324254513, 0.0015635578893125057, 0.001645775162614882, 0.0017279924359172583, 0.0018102095928043127]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 3.0, 4.0, 6.0, 14.0, 14.0, 12.0, 18.0, 19.0, 15.0, 32.0, 20.0, 22.0, 31.0, 31.0, 32.0, 48.0, 43.0, 42.0, 35.0, 41.0, 37.0, 45.0, 38.0, 43.0, 38.0, 42.0, 34.0, 28.0, 29.0, 28.0, 24.0, 20.0, 12.0, 26.0, 16.0, 16.0, 7.0, 5.0, 9.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005869865417480469, -0.0005651433020830154, -0.000543300062417984, -0.0005214568227529526, -0.0004996135830879211, -0.0004777703434228897, -0.0004559271037578583, -0.00043408386409282684, -0.0004122406244277954, -0.000390397384762764, -0.00036855414509773254, -0.0003467109054327011, -0.0003248676657676697, -0.00030302442610263824, -0.0002811811864376068, -0.0002593379467725754, -0.00023749470710754395, -0.0002156514674425125, -0.00019380822777748108, -0.00017196498811244965, -0.0001501217484474182, -0.00012827850878238678, -0.00010643526911735535, -8.459202945232391e-05, -6.274878978729248e-05, -4.090555012226105e-05, -1.9062310457229614e-05, 2.780929207801819e-06, 2.4624168872833252e-05, 4.6467408537864685e-05, 6.831064820289612e-05, 9.015388786792755e-05, 0.00011199712753295898, 0.00013384036719799042, 0.00015568360686302185, 0.00017752684652805328, 0.00019937008619308472, 0.00022121332585811615, 0.00024305656552314758, 0.000264899805188179, 0.00028674304485321045, 0.0003085862845182419, 0.0003304295241832733, 0.00035227276384830475, 0.0003741160035133362, 0.0003959592431783676, 0.00041780248284339905, 0.0004396457225084305, 0.0004614889621734619, 0.00048333220183849335, 0.0005051754415035248, 0.0005270186811685562, 0.0005488619208335876, 0.0005707051604986191, 0.0005925484001636505, 0.000614391639828682, 0.0006362348794937134, 0.0006580781191587448, 0.0006799213588237762, 0.0007017645984888077, 0.0007236078381538391, 0.0007454510778188705, 0.000767294317483902, 0.0007891375571489334, 0.0008109807968139648]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 5.0, 3.0, 10.0, 9.0, 11.0, 10.0, 14.0, 25.0, 19.0, 21.0, 34.0, 26.0, 29.0, 40.0, 40.0, 37.0, 46.0, 39.0, 49.0, 45.0, 47.0, 39.0, 32.0, 39.0, 40.0, 44.0, 31.0, 30.0, 21.0, 31.0, 19.0, 14.0, 12.0, 16.0, 12.0, 10.0, 8.0, 7.0, 4.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.65362548828125, -6.4283447265625, -6.20306396484375, -5.977783203125, -5.75250244140625, -5.5272216796875, -5.30194091796875, -5.07666015625, -4.85137939453125, -4.6260986328125, -4.40081787109375, -4.175537109375, -3.95025634765625, -3.7249755859375, -3.49969482421875, -3.2744140625, -3.04913330078125, -2.8238525390625, -2.59857177734375, -2.373291015625, -2.14801025390625, -1.9227294921875, -1.69744873046875, -1.47216796875, -1.24688720703125, -1.0216064453125, -0.79632568359375, -0.571044921875, -0.34576416015625, -0.1204833984375, 0.10479736328125, 0.330078125, 0.55535888671875, 0.7806396484375, 1.00592041015625, 1.231201171875, 1.45648193359375, 1.6817626953125, 1.90704345703125, 2.13232421875, 2.35760498046875, 2.5828857421875, 2.80816650390625, 3.033447265625, 3.25872802734375, 3.4840087890625, 3.70928955078125, 3.9345703125, 4.15985107421875, 4.3851318359375, 4.61041259765625, 4.835693359375, 5.06097412109375, 5.2862548828125, 5.51153564453125, 5.73681640625, 5.96209716796875, 6.1873779296875, 6.41265869140625, 6.637939453125, 6.86322021484375, 7.0885009765625, 7.31378173828125, 7.5390625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 11.0, 19.0, 25.0, 27.0, 33.0, 49.0, 94.0, 97.0, 127.0, 165.0, 234.0, 321.0, 419.0, 548.0, 899.0, 2399.0, 13112.0, 139340.0, 812823.0, 65569.0, 7716.0, 1712.0, 764.0, 516.0, 380.0, 272.0, 205.0, 140.0, 144.0, 102.0, 57.0, 55.0, 40.0, 29.0, 22.0, 17.0, 8.0, 10.0, 6.0, 5.0, 5.0, 6.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.953125, -16.394775390625, -15.83642578125, -15.278076171875, -14.7197265625, -14.161376953125, -13.60302734375, -13.044677734375, -12.486328125, -11.927978515625, -11.36962890625, -10.811279296875, -10.2529296875, -9.694580078125, -9.13623046875, -8.577880859375, -8.01953125, -7.461181640625, -6.90283203125, -6.344482421875, -5.7861328125, -5.227783203125, -4.66943359375, -4.111083984375, -3.552734375, -2.994384765625, -2.43603515625, -1.877685546875, -1.3193359375, -0.760986328125, -0.20263671875, 0.355712890625, 0.9140625, 1.472412109375, 2.03076171875, 2.589111328125, 3.1474609375, 3.705810546875, 4.26416015625, 4.822509765625, 5.380859375, 5.939208984375, 6.49755859375, 7.055908203125, 7.6142578125, 8.172607421875, 8.73095703125, 9.289306640625, 9.84765625, 10.406005859375, 10.96435546875, 11.522705078125, 12.0810546875, 12.639404296875, 13.19775390625, 13.756103515625, 14.314453125, 14.872802734375, 15.43115234375, 15.989501953125, 16.5478515625, 17.106201171875, 17.66455078125, 18.222900390625, 18.78125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 4.0, 9.0, 12.0, 16.0, 18.0, 22.0, 19.0, 18.0, 32.0, 40.0, 40.0, 37.0, 47.0, 73.0, 81.0, 331.0, 1643.0, 118.0, 75.0, 59.0, 42.0, 42.0, 28.0, 29.0, 33.0, 31.0, 22.0, 20.0, 19.0, 11.0, 9.0, 10.0, 10.0, 7.0, 1.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0], "bins": [-27.75, -27.024169921875, -26.29833984375, -25.572509765625, -24.8466796875, -24.120849609375, -23.39501953125, -22.669189453125, -21.943359375, -21.217529296875, -20.49169921875, -19.765869140625, -19.0400390625, -18.314208984375, -17.58837890625, -16.862548828125, -16.13671875, -15.410888671875, -14.68505859375, -13.959228515625, -13.2333984375, -12.507568359375, -11.78173828125, -11.055908203125, -10.330078125, -9.604248046875, -8.87841796875, -8.152587890625, -7.4267578125, -6.700927734375, -5.97509765625, -5.249267578125, -4.5234375, -3.797607421875, -3.07177734375, -2.345947265625, -1.6201171875, -0.894287109375, -0.16845703125, 0.557373046875, 1.283203125, 2.009033203125, 2.73486328125, 3.460693359375, 4.1865234375, 4.912353515625, 5.63818359375, 6.364013671875, 7.08984375, 7.815673828125, 8.54150390625, 9.267333984375, 9.9931640625, 10.718994140625, 11.44482421875, 12.170654296875, 12.896484375, 13.622314453125, 14.34814453125, 15.073974609375, 15.7998046875, 16.525634765625, 17.25146484375, 17.977294921875, 18.703125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 9.0, 13.0, 8.0, 14.0, 12.0, 32.0, 32.0, 27.0, 61.0, 37.0, 54.0, 104.0, 182.0, 267.0, 792.0, 4169.0, 2836546.0, 299229.0, 2696.0, 615.0, 225.0, 148.0, 82.0, 61.0, 50.0, 37.0, 29.0, 32.0, 25.0, 12.0, 18.0, 13.0, 7.0, 7.0, 9.0, 9.0, 8.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.03125, -47.13818359375, -45.2451171875, -43.35205078125, -41.458984375, -39.56591796875, -37.6728515625, -35.77978515625, -33.88671875, -31.99365234375, -30.1005859375, -28.20751953125, -26.314453125, -24.42138671875, -22.5283203125, -20.63525390625, -18.7421875, -16.84912109375, -14.9560546875, -13.06298828125, -11.169921875, -9.27685546875, -7.3837890625, -5.49072265625, -3.59765625, -1.70458984375, 0.1884765625, 2.08154296875, 3.974609375, 5.86767578125, 7.7607421875, 9.65380859375, 11.546875, 13.43994140625, 15.3330078125, 17.22607421875, 19.119140625, 21.01220703125, 22.9052734375, 24.79833984375, 26.69140625, 28.58447265625, 30.4775390625, 32.37060546875, 34.263671875, 36.15673828125, 38.0498046875, 39.94287109375, 41.8359375, 43.72900390625, 45.6220703125, 47.51513671875, 49.408203125, 51.30126953125, 53.1943359375, 55.08740234375, 56.98046875, 58.87353515625, 60.7666015625, 62.65966796875, 64.552734375, 66.44580078125, 68.3388671875, 70.23193359375, 72.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 71.0, 221.0, 365.0, 251.0, 85.0, 15.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.70166301727295, -7.986354827880859, -6.2710466384887695, -4.555738925933838, -2.840430736541748, -1.1251230239868164, 0.5901851654052734, 2.3054933547973633, 4.020801544189453, 5.736109733581543, 7.451417922973633, 9.166725158691406, 10.882034301757812, 12.597341537475586, 14.312649726867676, 16.027957916259766, 17.743267059326172, 19.458574295043945, 21.17388343811035, 22.889190673828125, 24.60449981689453, 26.319807052612305, 28.035114288330078, 29.750423431396484, 31.465730667114258, 33.18103790283203, 34.89634704589844, 36.611656188964844, 38.326961517333984, 40.04227066040039, 41.7575798034668, 43.47288513183594, 45.18819808959961, 46.903507232666016, 48.618812561035156, 50.33412170410156, 52.04943084716797, 53.764739990234375, 55.480045318603516, 57.19535446166992, 58.91066360473633, 60.625972747802734, 62.341278076171875, 64.05658721923828, 65.77189636230469, 67.4872055053711, 69.2025146484375, 70.91781616210938, 72.63312530517578, 74.34843444824219, 76.0637435913086, 77.779052734375, 79.49435424804688, 81.20966339111328, 82.92497253417969, 84.6402816772461, 86.3555908203125, 88.0708999633789, 89.78620910644531, 91.50151824951172, 93.2168197631836, 94.93212890625, 96.6474380493164, 98.36274719238281, 100.07805633544922]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 11.0, 5.0, 7.0, 5.0, 13.0, 22.0, 14.0, 22.0, 24.0, 26.0, 23.0, 24.0, 26.0, 25.0, 27.0, 34.0, 37.0, 40.0, 39.0, 43.0, 38.0, 37.0, 36.0, 30.0, 40.0, 37.0, 29.0, 25.0, 34.0, 21.0, 31.0, 14.0, 16.0, 23.0, 12.0, 17.0, 16.0, 13.0, 10.0, 5.0, 7.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-54.41594696044922, -52.89585494995117, -51.37575912475586, -49.85566711425781, -48.3355712890625, -46.81547927856445, -45.295387268066406, -43.775291442871094, -42.25519943237305, -40.735107421875, -39.21501159667969, -37.69491958618164, -36.17482376098633, -34.65473175048828, -33.13463592529297, -31.614543914794922, -30.094449996948242, -28.574356079101562, -27.054262161254883, -25.534168243408203, -24.014076232910156, -22.493982315063477, -20.973888397216797, -19.45379638671875, -17.933700561523438, -16.413606643676758, -14.893513679504395, -13.373419761657715, -11.853326797485352, -10.333232879638672, -8.813138961791992, -7.293045997619629, -5.772953033447266, -4.252859592437744, -2.7327659130096436, -1.212672233581543, 0.3074212074279785, 1.8275146484375, 3.3476085662841797, 4.867701530456543, 6.387795448303223, 7.907888889312744, 9.427982330322266, 10.948076248168945, 12.468170166015625, 13.988263130187988, 15.508357048034668, 17.02845001220703, 18.54854393005371, 20.06863784790039, 21.58873176574707, 23.10882568359375, 24.628917694091797, 26.149011611938477, 27.669105529785156, 29.189197540283203, 30.709293365478516, 32.22938537597656, 33.749481201171875, 35.26957321166992, 36.789669036865234, 38.30976104736328, 39.829856872558594, 41.34994888305664, 42.87004089355469]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 11.0, 11.0, 8.0, 16.0, 16.0, 17.0, 25.0, 30.0, 27.0, 35.0, 30.0, 35.0, 49.0, 52.0, 38.0, 45.0, 48.0, 47.0, 46.0, 47.0, 40.0, 39.0, 31.0, 37.0, 31.0, 33.0, 23.0, 18.0, 20.0, 17.0, 14.0, 14.0, 9.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.5823974609375, -7.328857421875, -7.0753173828125, -6.82177734375, -6.5682373046875, -6.314697265625, -6.0611572265625, -5.8076171875, -5.5540771484375, -5.300537109375, -5.0469970703125, -4.79345703125, -4.5399169921875, -4.286376953125, -4.0328369140625, -3.779296875, -3.5257568359375, -3.272216796875, -3.0186767578125, -2.76513671875, -2.5115966796875, -2.258056640625, -2.0045166015625, -1.7509765625, -1.4974365234375, -1.243896484375, -0.9903564453125, -0.73681640625, -0.4832763671875, -0.229736328125, 0.0238037109375, 0.27734375, 0.5308837890625, 0.784423828125, 1.0379638671875, 1.29150390625, 1.5450439453125, 1.798583984375, 2.0521240234375, 2.3056640625, 2.5592041015625, 2.812744140625, 3.0662841796875, 3.31982421875, 3.5733642578125, 3.826904296875, 4.0804443359375, 4.333984375, 4.5875244140625, 4.841064453125, 5.0946044921875, 5.34814453125, 5.6016845703125, 5.855224609375, 6.1087646484375, 6.3623046875, 6.6158447265625, 6.869384765625, 7.1229248046875, 7.37646484375, 7.6300048828125, 7.883544921875, 8.1370849609375, 8.390625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 4.0, 8.0, 12.0, 14.0, 21.0, 25.0, 28.0, 44.0, 61.0, 75.0, 103.0, 135.0, 173.0, 260.0, 361.0, 717.0, 1927.0, 12659.0, 258445.0, 2465143.0, 1373253.0, 72717.0, 5140.0, 1198.0, 532.0, 352.0, 211.0, 169.0, 106.0, 100.0, 55.0, 75.0, 43.0, 21.0, 19.0, 15.0, 11.0, 7.0, 11.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.140625, -14.649169921875, -14.15771484375, -13.666259765625, -13.1748046875, -12.683349609375, -12.19189453125, -11.700439453125, -11.208984375, -10.717529296875, -10.22607421875, -9.734619140625, -9.2431640625, -8.751708984375, -8.26025390625, -7.768798828125, -7.27734375, -6.785888671875, -6.29443359375, -5.802978515625, -5.3115234375, -4.820068359375, -4.32861328125, -3.837158203125, -3.345703125, -2.854248046875, -2.36279296875, -1.871337890625, -1.3798828125, -0.888427734375, -0.39697265625, 0.094482421875, 0.5859375, 1.077392578125, 1.56884765625, 2.060302734375, 2.5517578125, 3.043212890625, 3.53466796875, 4.026123046875, 4.517578125, 5.009033203125, 5.50048828125, 5.991943359375, 6.4833984375, 6.974853515625, 7.46630859375, 7.957763671875, 8.44921875, 8.940673828125, 9.43212890625, 9.923583984375, 10.4150390625, 10.906494140625, 11.39794921875, 11.889404296875, 12.380859375, 12.872314453125, 13.36376953125, 13.855224609375, 14.3466796875, 14.838134765625, 15.32958984375, 15.821044921875, 16.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 5.0, 10.0, 15.0, 15.0, 40.0, 81.0, 120.0, 237.0, 457.0, 705.0, 750.0, 645.0, 400.0, 242.0, 131.0, 83.0, 48.0, 29.0, 18.0, 7.0, 8.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.85693359375, -17.3076171875, -16.75830078125, -16.208984375, -15.65966796875, -15.1103515625, -14.56103515625, -14.01171875, -13.46240234375, -12.9130859375, -12.36376953125, -11.814453125, -11.26513671875, -10.7158203125, -10.16650390625, -9.6171875, -9.06787109375, -8.5185546875, -7.96923828125, -7.419921875, -6.87060546875, -6.3212890625, -5.77197265625, -5.22265625, -4.67333984375, -4.1240234375, -3.57470703125, -3.025390625, -2.47607421875, -1.9267578125, -1.37744140625, -0.828125, -0.27880859375, 0.2705078125, 0.81982421875, 1.369140625, 1.91845703125, 2.4677734375, 3.01708984375, 3.56640625, 4.11572265625, 4.6650390625, 5.21435546875, 5.763671875, 6.31298828125, 6.8623046875, 7.41162109375, 7.9609375, 8.51025390625, 9.0595703125, 9.60888671875, 10.158203125, 10.70751953125, 11.2568359375, 11.80615234375, 12.35546875, 12.90478515625, 13.4541015625, 14.00341796875, 14.552734375, 15.10205078125, 15.6513671875, 16.20068359375, 16.75]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 11.0, 17.0, 12.0, 23.0, 41.0, 75.0, 108.0, 185.0, 314.0, 773.0, 2473.0, 56099.0, 4059737.0, 70009.0, 2849.0, 802.0, 356.0, 163.0, 92.0, 46.0, 36.0, 13.0, 17.0, 9.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0625, -43.5859375, -42.109375, -40.6328125, -39.15625, -37.6796875, -36.203125, -34.7265625, -33.25, -31.7734375, -30.296875, -28.8203125, -27.34375, -25.8671875, -24.390625, -22.9140625, -21.4375, -19.9609375, -18.484375, -17.0078125, -15.53125, -14.0546875, -12.578125, -11.1015625, -9.625, -8.1484375, -6.671875, -5.1953125, -3.71875, -2.2421875, -0.765625, 0.7109375, 2.1875, 3.6640625, 5.140625, 6.6171875, 8.09375, 9.5703125, 11.046875, 12.5234375, 14.0, 15.4765625, 16.953125, 18.4296875, 19.90625, 21.3828125, 22.859375, 24.3359375, 25.8125, 27.2890625, 28.765625, 30.2421875, 31.71875, 33.1953125, 34.671875, 36.1484375, 37.625, 39.1015625, 40.578125, 42.0546875, 43.53125, 45.0078125, 46.484375, 47.9609375, 49.4375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [11.0, 94.0, 322.0, 421.0, 150.0, 12.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.007353782653809, -9.532444953918457, -5.0575361251831055, -0.5826272964477539, 3.8922815322875977, 8.36719036102295, 12.8420991897583, 17.31700897216797, 21.791915893554688, 26.26682472229004, 30.74173355102539, 35.216644287109375, 39.691551208496094, 44.16645812988281, 48.6413688659668, 53.11627960205078, 57.5911865234375, 62.06609344482422, 66.54100036621094, 71.01591491699219, 75.4908218383789, 79.96572875976562, 84.44064331054688, 88.9155502319336, 93.39045715332031, 97.86536407470703, 102.34027099609375, 106.815185546875, 111.29009246826172, 115.76499938964844, 120.23991394042969, 124.7148208618164, 129.18972778320312, 133.66464233398438, 138.13954162597656, 142.6144561767578, 147.08935546875, 151.56427001953125, 156.0391845703125, 160.5140838623047, 164.98899841308594, 169.4639129638672, 173.93881225585938, 178.41372680664062, 182.88864135742188, 187.36354064941406, 191.8384552001953, 196.3133544921875, 200.78826904296875, 205.26318359375, 209.7380828857422, 214.21299743652344, 218.68789672851562, 223.16281127929688, 227.63772583007812, 232.1126251220703, 236.58753967285156, 241.0624542236328, 245.537353515625, 250.01226806640625, 254.4871826171875, 258.96209716796875, 263.4369812011719, 267.9118957519531, 272.3868103027344]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 1.0, 3.0, 8.0, 9.0, 11.0, 5.0, 16.0, 15.0, 20.0, 15.0, 23.0, 18.0, 27.0, 24.0, 39.0, 39.0, 41.0, 45.0, 43.0, 52.0, 34.0, 37.0, 54.0, 38.0, 30.0, 34.0, 44.0, 28.0, 27.0, 34.0, 34.0, 26.0, 26.0, 17.0, 13.0, 10.0, 14.0, 18.0, 6.0, 10.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.04771423339844, -38.866085052490234, -37.684452056884766, -36.50282287597656, -35.321189880371094, -34.13956069946289, -32.95792770385742, -31.77629852294922, -30.59466552734375, -29.413034439086914, -28.231403350830078, -27.049772262573242, -25.868141174316406, -24.68651008605957, -23.504878997802734, -22.32324981689453, -21.141618728637695, -19.95998764038086, -18.778356552124023, -17.596725463867188, -16.41509437561035, -15.233463287353516, -14.051833152770996, -12.87020206451416, -11.688570976257324, -10.506939888000488, -9.325308799743652, -8.143678665161133, -6.962047100067139, -5.780416011810303, -4.598785400390625, -3.417154312133789, -2.235523223876953, -1.0538922548294067, 0.12773871421813965, 1.3093695640563965, 2.4910006523132324, 3.6726317405700684, 4.854262351989746, 6.035893440246582, 7.217524528503418, 8.399155616760254, 9.58078670501709, 10.76241683959961, 11.944047927856445, 13.125679016113281, 14.307310104370117, 15.488941192626953, 16.67057228088379, 17.852203369140625, 19.03383445739746, 20.215465545654297, 21.397096633911133, 22.57872772216797, 23.760356903076172, 24.94198989868164, 26.123619079589844, 27.30525016784668, 28.486881256103516, 29.66851234436035, 30.850143432617188, 32.03177261352539, 33.21340560913086, 34.39503479003906, 35.57666778564453]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 12.0, 13.0, 8.0, 15.0, 17.0, 15.0, 31.0, 28.0, 44.0, 41.0, 47.0, 34.0, 36.0, 38.0, 47.0, 52.0, 53.0, 38.0, 53.0, 37.0, 45.0, 36.0, 41.0, 27.0, 24.0, 23.0, 25.0, 32.0, 19.0, 9.0, 11.0, 15.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5015869140625, -6.245361328125, -5.9891357421875, -5.73291015625, -5.4766845703125, -5.220458984375, -4.9642333984375, -4.7080078125, -4.4517822265625, -4.195556640625, -3.9393310546875, -3.68310546875, -3.4268798828125, -3.170654296875, -2.9144287109375, -2.658203125, -2.4019775390625, -2.145751953125, -1.8895263671875, -1.63330078125, -1.3770751953125, -1.120849609375, -0.8646240234375, -0.6083984375, -0.3521728515625, -0.095947265625, 0.1602783203125, 0.41650390625, 0.6727294921875, 0.928955078125, 1.1851806640625, 1.44140625, 1.6976318359375, 1.953857421875, 2.2100830078125, 2.46630859375, 2.7225341796875, 2.978759765625, 3.2349853515625, 3.4912109375, 3.7474365234375, 4.003662109375, 4.2598876953125, 4.51611328125, 4.7723388671875, 5.028564453125, 5.2847900390625, 5.541015625, 5.7972412109375, 6.053466796875, 6.3096923828125, 6.56591796875, 6.8221435546875, 7.078369140625, 7.3345947265625, 7.5908203125, 7.8470458984375, 8.103271484375, 8.3594970703125, 8.61572265625, 8.8719482421875, 9.128173828125, 9.3843994140625, 9.640625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 5.0, 4.0, 9.0, 3.0, 10.0, 14.0, 23.0, 37.0, 61.0, 109.0, 164.0, 275.0, 450.0, 738.0, 1140.0, 1921.0, 3089.0, 5185.0, 8344.0, 13368.0, 22409.0, 37621.0, 64792.0, 120038.0, 305346.0, 221386.0, 101796.0, 56419.0, 32765.0, 19789.0, 12076.0, 7426.0, 4566.0, 2740.0, 1702.0, 1027.0, 658.0, 407.0, 246.0, 144.0, 91.0, 58.0, 38.0, 23.0, 16.0, 8.0, 5.0, 7.0, 0.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.771484375, -1.714111328125, -1.65673828125, -1.599365234375, -1.5419921875, -1.484619140625, -1.42724609375, -1.369873046875, -1.3125, -1.255126953125, -1.19775390625, -1.140380859375, -1.0830078125, -1.025634765625, -0.96826171875, -0.910888671875, -0.853515625, -0.796142578125, -0.73876953125, -0.681396484375, -0.6240234375, -0.566650390625, -0.50927734375, -0.451904296875, -0.39453125, -0.337158203125, -0.27978515625, -0.222412109375, -0.1650390625, -0.107666015625, -0.05029296875, 0.007080078125, 0.064453125, 0.121826171875, 0.17919921875, 0.236572265625, 0.2939453125, 0.351318359375, 0.40869140625, 0.466064453125, 0.5234375, 0.580810546875, 0.63818359375, 0.695556640625, 0.7529296875, 0.810302734375, 0.86767578125, 0.925048828125, 0.982421875, 1.039794921875, 1.09716796875, 1.154541015625, 1.2119140625, 1.269287109375, 1.32666015625, 1.384033203125, 1.44140625, 1.498779296875, 1.55615234375, 1.613525390625, 1.6708984375, 1.728271484375, 1.78564453125, 1.843017578125, 1.900390625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 8.0, 8.0, 22.0, 18.0, 13.0, 16.0, 16.0, 25.0, 33.0, 24.0, 20.0, 38.0, 31.0, 41.0, 43.0, 33.0, 42.0, 1066.0, 54.0, 34.0, 45.0, 42.0, 41.0, 24.0, 29.0, 34.0, 25.0, 26.0, 23.0, 30.0, 18.0, 14.0, 11.0, 18.0, 9.0, 5.0, 9.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.23828125, -4.0950927734375, -3.951904296875, -3.8087158203125, -3.66552734375, -3.5223388671875, -3.379150390625, -3.2359619140625, -3.0927734375, -2.9495849609375, -2.806396484375, -2.6632080078125, -2.52001953125, -2.3768310546875, -2.233642578125, -2.0904541015625, -1.947265625, -1.8040771484375, -1.660888671875, -1.5177001953125, -1.37451171875, -1.2313232421875, -1.088134765625, -0.9449462890625, -0.8017578125, -0.6585693359375, -0.515380859375, -0.3721923828125, -0.22900390625, -0.0858154296875, 0.057373046875, 0.2005615234375, 0.34375, 0.4869384765625, 0.630126953125, 0.7733154296875, 0.91650390625, 1.0596923828125, 1.202880859375, 1.3460693359375, 1.4892578125, 1.6324462890625, 1.775634765625, 1.9188232421875, 2.06201171875, 2.2052001953125, 2.348388671875, 2.4915771484375, 2.634765625, 2.7779541015625, 2.921142578125, 3.0643310546875, 3.20751953125, 3.3507080078125, 3.493896484375, 3.6370849609375, 3.7802734375, 3.9234619140625, 4.066650390625, 4.2098388671875, 4.35302734375, 4.4962158203125, 4.639404296875, 4.7825927734375, 4.92578125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 11.0, 12.0, 10.0, 31.0, 30.0, 40.0, 77.0, 89.0, 159.0, 228.0, 370.0, 579.0, 892.0, 1339.0, 2096.0, 3499.0, 5621.0, 9043.0, 15098.0, 25306.0, 43607.0, 78531.0, 160997.0, 1428892.0, 145527.0, 72884.0, 40926.0, 24274.0, 14242.0, 8560.0, 5352.0, 3175.0, 2031.0, 1243.0, 811.0, 533.0, 329.0, 197.0, 172.0, 107.0, 75.0, 41.0, 29.0, 28.0, 12.0, 6.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.9814453125, -1.923919677734375, -1.86639404296875, -1.808868408203125, -1.7513427734375, -1.693817138671875, -1.63629150390625, -1.578765869140625, -1.521240234375, -1.463714599609375, -1.40618896484375, -1.348663330078125, -1.2911376953125, -1.233612060546875, -1.17608642578125, -1.118560791015625, -1.06103515625, -1.003509521484375, -0.94598388671875, -0.888458251953125, -0.8309326171875, -0.773406982421875, -0.71588134765625, -0.658355712890625, -0.600830078125, -0.543304443359375, -0.48577880859375, -0.428253173828125, -0.3707275390625, -0.313201904296875, -0.25567626953125, -0.198150634765625, -0.140625, -0.083099365234375, -0.02557373046875, 0.031951904296875, 0.0894775390625, 0.147003173828125, 0.20452880859375, 0.262054443359375, 0.319580078125, 0.377105712890625, 0.43463134765625, 0.492156982421875, 0.5496826171875, 0.607208251953125, 0.66473388671875, 0.722259521484375, 0.77978515625, 0.837310791015625, 0.89483642578125, 0.952362060546875, 1.0098876953125, 1.067413330078125, 1.12493896484375, 1.182464599609375, 1.239990234375, 1.297515869140625, 1.35504150390625, 1.412567138671875, 1.4700927734375, 1.527618408203125, 1.58514404296875, 1.642669677734375, 1.7001953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 14.0, 10.0, 12.0, 24.0, 24.0, 22.0, 35.0, 29.0, 47.0, 68.0, 67.0, 113.0, 116.0, 95.0, 63.0, 51.0, 38.0, 20.0, 30.0, 21.0, 18.0, 11.0, 13.0, 6.0, 4.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013217926025390625, -0.001272827386856079, -0.0012238621711730957, -0.0011748969554901123, -0.001125931739807129, -0.0010769665241241455, -0.0010280013084411621, -0.0009790360927581787, -0.0009300708770751953, -0.0008811056613922119, -0.0008321404457092285, -0.0007831752300262451, -0.0007342100143432617, -0.0006852447986602783, -0.0006362795829772949, -0.0005873143672943115, -0.0005383491516113281, -0.0004893839359283447, -0.00044041872024536133, -0.00039145350456237793, -0.00034248828887939453, -0.00029352307319641113, -0.00024455785751342773, -0.00019559264183044434, -0.00014662742614746094, -9.766221046447754e-05, -4.869699478149414e-05, 2.682209014892578e-07, 4.9233436584472656e-05, 9.819865226745605e-05, 0.00014716386795043945, 0.00019612908363342285, 0.00024509429931640625, 0.00029405951499938965, 0.00034302473068237305, 0.00039198994636535645, 0.00044095516204833984, 0.0004899203777313232, 0.0005388855934143066, 0.00058785080909729, 0.0006368160247802734, 0.0006857812404632568, 0.0007347464561462402, 0.0007837116718292236, 0.000832676887512207, 0.0008816421031951904, 0.0009306073188781738, 0.0009795725345611572, 0.0010285377502441406, 0.001077502965927124, 0.0011264681816101074, 0.0011754333972930908, 0.0012243986129760742, 0.0012733638286590576, 0.001322329044342041, 0.0013712942600250244, 0.0014202594757080078, 0.0014692246913909912, 0.0015181899070739746, 0.001567155122756958, 0.0016161203384399414, 0.0016650855541229248, 0.0017140507698059082, 0.0017630159854888916, 0.001811981201171875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 8.0, 8.0, 15.0, 23.0, 6.0, 15.0, 24.0, 33.0, 45.0, 65.0, 66.0, 99.0, 151.0, 241.0, 489.0, 1111.0, 160235.0, 883009.0, 1465.0, 552.0, 245.0, 158.0, 102.0, 91.0, 69.0, 42.0, 45.0, 32.0, 22.0, 18.0, 8.0, 9.0, 5.0, 5.0, 7.0, 9.0, 3.0, 2.0, 6.0, 4.0, 2.0, 5.0, 3.0, 4.0], "bins": [-0.03240966796875, -0.03153586387634277, -0.030662059783935547, -0.02978825569152832, -0.028914451599121094, -0.028040647506713867, -0.02716684341430664, -0.026293039321899414, -0.025419235229492188, -0.02454543113708496, -0.023671627044677734, -0.022797822952270508, -0.02192401885986328, -0.021050214767456055, -0.020176410675048828, -0.0193026065826416, -0.018428802490234375, -0.01755499839782715, -0.016681194305419922, -0.015807390213012695, -0.014933586120605469, -0.014059782028198242, -0.013185977935791016, -0.012312173843383789, -0.011438369750976562, -0.010564565658569336, -0.00969076156616211, -0.008816957473754883, -0.007943153381347656, -0.00706934928894043, -0.006195545196533203, -0.0053217411041259766, -0.00444793701171875, -0.0035741329193115234, -0.002700328826904297, -0.0018265247344970703, -0.0009527206420898438, -7.891654968261719e-05, 0.0007948875427246094, 0.001668691635131836, 0.0025424957275390625, 0.003416299819946289, 0.004290103912353516, 0.005163908004760742, 0.006037712097167969, 0.006911516189575195, 0.007785320281982422, 0.008659124374389648, 0.009532928466796875, 0.010406732559204102, 0.011280536651611328, 0.012154340744018555, 0.013028144836425781, 0.013901948928833008, 0.014775753021240234, 0.01564955711364746, 0.016523361206054688, 0.017397165298461914, 0.01827096939086914, 0.019144773483276367, 0.020018577575683594, 0.02089238166809082, 0.021766185760498047, 0.022639989852905273, 0.0235137939453125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 164.0, 494.0, 295.0, 37.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0047285594046115875, -0.004638840910047293, -0.004549122415482998, -0.004459403920918703, -0.004369685426354408, -0.0042799669317901134, -0.004190248437225819, -0.004100529942661524, -0.004010811448097229, -0.003921092953532934, -0.0038313744589686394, -0.0037416559644043446, -0.0036519374698400497, -0.003562218975275755, -0.00347250048071146, -0.0033827819861471653, -0.003293063724413514, -0.0032033452298492193, -0.0031136267352849245, -0.0030239082407206297, -0.002934189746156335, -0.00284447125159204, -0.002754752989858389, -0.002665034495294094, -0.0025753160007297993, -0.0024855975061655045, -0.0023958790116012096, -0.002306160517036915, -0.00221644202247262, -0.002126723527908325, -0.0020370050333440304, -0.0019472866551950574, -0.0018575682770460844, -0.0017678497824817896, -0.0016781312879174948, -0.0015884127933532, -0.0014986942987889051, -0.0014089758042246103, -0.0013192574260756373, -0.0012295389315113425, -0.0011398204369470477, -0.001050101942382753, -0.0009603834478184581, -0.0008706650114618242, -0.0007809465168975294, -0.0006912280223332345, -0.0006015095859766006, -0.0005117910914123058, -0.000422072596848011, -0.0003323541022837162, -0.00024263563682325184, -0.00015291717136278749, -6.319867679849267e-05, 2.6519817765802145e-05, 0.00011623825412243605, 0.00020595674868673086, 0.0002956752432510257, 0.0003853937378153205, 0.00047511220327578485, 0.0005648306687362492, 0.000654549163300544, 0.0007442676578648388, 0.0008339860942214727, 0.0009237045887857676, 0.0010134230833500624]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 5.0, 4.0, 5.0, 10.0, 11.0, 7.0, 14.0, 19.0, 18.0, 21.0, 20.0, 19.0, 28.0, 26.0, 27.0, 47.0, 43.0, 42.0, 38.0, 38.0, 44.0, 31.0, 43.0, 37.0, 43.0, 36.0, 23.0, 30.0, 31.0, 41.0, 27.0, 27.0, 26.0, 14.0, 14.0, 13.0, 17.0, 11.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.0006949305534362793, -0.0006743390113115311, -0.0006537474691867828, -0.0006331559270620346, -0.0006125643849372864, -0.0005919728428125381, -0.0005713813006877899, -0.0005507897585630417, -0.0005301982164382935, -0.0005096066743135452, -0.000489015132188797, -0.00046842359006404877, -0.00044783204793930054, -0.0004272405058145523, -0.0004066489636898041, -0.00038605742156505585, -0.0003654658794403076, -0.0003448743373155594, -0.00032428279519081116, -0.00030369125306606293, -0.0002830997109413147, -0.00026250816881656647, -0.00024191662669181824, -0.00022132508456707, -0.00020073354244232178, -0.00018014200031757355, -0.00015955045819282532, -0.0001389589160680771, -0.00011836737394332886, -9.777583181858063e-05, -7.71842896938324e-05, -5.659274756908417e-05, -3.600120544433594e-05, -1.5409663319587708e-05, 5.1818788051605225e-06, 2.5773420929908752e-05, 4.636496305465698e-05, 6.695650517940521e-05, 8.754804730415344e-05, 0.00010813958942890167, 0.0001287311315536499, 0.00014932267367839813, 0.00016991421580314636, 0.0001905057579278946, 0.00021109730005264282, 0.00023168884217739105, 0.0002522803843021393, 0.0002728719264268875, 0.00029346346855163574, 0.00031405501067638397, 0.0003346465528011322, 0.00035523809492588043, 0.00037582963705062866, 0.0003964211791753769, 0.0004170127213001251, 0.00043760426342487335, 0.0004581958055496216, 0.0004787873476743698, 0.000499378889799118, 0.0005199704319238663, 0.0005405619740486145, 0.0005611535161733627, 0.000581745058298111, 0.0006023366004228592, 0.0006229281425476074]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 12.0, 13.0, 8.0, 15.0, 17.0, 15.0, 31.0, 28.0, 44.0, 41.0, 47.0, 34.0, 36.0, 38.0, 47.0, 52.0, 53.0, 38.0, 53.0, 37.0, 45.0, 36.0, 41.0, 27.0, 24.0, 23.0, 25.0, 32.0, 19.0, 9.0, 11.0, 15.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5015869140625, -6.245361328125, -5.9891357421875, -5.73291015625, -5.4766845703125, -5.220458984375, -4.9642333984375, -4.7080078125, -4.4517822265625, -4.195556640625, -3.9393310546875, -3.68310546875, -3.4268798828125, -3.170654296875, -2.9144287109375, -2.658203125, -2.4019775390625, -2.145751953125, -1.8895263671875, -1.63330078125, -1.3770751953125, -1.120849609375, -0.8646240234375, -0.6083984375, -0.3521728515625, -0.095947265625, 0.1602783203125, 0.41650390625, 0.6727294921875, 0.928955078125, 1.1851806640625, 1.44140625, 1.6976318359375, 1.953857421875, 2.2100830078125, 2.46630859375, 2.7225341796875, 2.978759765625, 3.2349853515625, 3.4912109375, 3.7474365234375, 4.003662109375, 4.2598876953125, 4.51611328125, 4.7723388671875, 5.028564453125, 5.2847900390625, 5.541015625, 5.7972412109375, 6.053466796875, 6.3096923828125, 6.56591796875, 6.8221435546875, 7.078369140625, 7.3345947265625, 7.5908203125, 7.8470458984375, 8.103271484375, 8.3594970703125, 8.61572265625, 8.8719482421875, 9.128173828125, 9.3843994140625, 9.640625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 11.0, 13.0, 15.0, 31.0, 37.0, 44.0, 57.0, 96.0, 128.0, 188.0, 276.0, 527.0, 893.0, 2010.0, 5105.0, 14828.0, 50324.0, 179389.0, 475755.0, 226869.0, 62612.0, 18207.0, 6239.0, 2345.0, 1069.0, 484.0, 313.0, 180.0, 149.0, 83.0, 78.0, 61.0, 38.0, 27.0, 24.0, 14.0, 12.0, 11.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.75927734375, -7.4560546875, -7.15283203125, -6.849609375, -6.54638671875, -6.2431640625, -5.93994140625, -5.63671875, -5.33349609375, -5.0302734375, -4.72705078125, -4.423828125, -4.12060546875, -3.8173828125, -3.51416015625, -3.2109375, -2.90771484375, -2.6044921875, -2.30126953125, -1.998046875, -1.69482421875, -1.3916015625, -1.08837890625, -0.78515625, -0.48193359375, -0.1787109375, 0.12451171875, 0.427734375, 0.73095703125, 1.0341796875, 1.33740234375, 1.640625, 1.94384765625, 2.2470703125, 2.55029296875, 2.853515625, 3.15673828125, 3.4599609375, 3.76318359375, 4.06640625, 4.36962890625, 4.6728515625, 4.97607421875, 5.279296875, 5.58251953125, 5.8857421875, 6.18896484375, 6.4921875, 6.79541015625, 7.0986328125, 7.40185546875, 7.705078125, 8.00830078125, 8.3115234375, 8.61474609375, 8.91796875, 9.22119140625, 9.5244140625, 9.82763671875, 10.130859375, 10.43408203125, 10.7373046875, 11.04052734375, 11.34375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 8.0, 8.0, 5.0, 10.0, 18.0, 22.0, 17.0, 16.0, 20.0, 30.0, 31.0, 33.0, 43.0, 48.0, 57.0, 83.0, 132.0, 370.0, 1461.0, 147.0, 87.0, 50.0, 45.0, 39.0, 47.0, 34.0, 37.0, 30.0, 31.0, 12.0, 12.0, 13.0, 6.0, 13.0, 4.0, 9.0, 8.0, 0.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.233154296875, -21.56005859375, -20.886962890625, -20.2138671875, -19.540771484375, -18.86767578125, -18.194580078125, -17.521484375, -16.848388671875, -16.17529296875, -15.502197265625, -14.8291015625, -14.156005859375, -13.48291015625, -12.809814453125, -12.13671875, -11.463623046875, -10.79052734375, -10.117431640625, -9.4443359375, -8.771240234375, -8.09814453125, -7.425048828125, -6.751953125, -6.078857421875, -5.40576171875, -4.732666015625, -4.0595703125, -3.386474609375, -2.71337890625, -2.040283203125, -1.3671875, -0.694091796875, -0.02099609375, 0.652099609375, 1.3251953125, 1.998291015625, 2.67138671875, 3.344482421875, 4.017578125, 4.690673828125, 5.36376953125, 6.036865234375, 6.7099609375, 7.383056640625, 8.05615234375, 8.729248046875, 9.40234375, 10.075439453125, 10.74853515625, 11.421630859375, 12.0947265625, 12.767822265625, 13.44091796875, 14.114013671875, 14.787109375, 15.460205078125, 16.13330078125, 16.806396484375, 17.4794921875, 18.152587890625, 18.82568359375, 19.498779296875, 20.171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 7.0, 9.0, 8.0, 15.0, 23.0, 28.0, 48.0, 58.0, 80.0, 155.0, 256.0, 415.0, 858.0, 3857.0, 641531.0, 2488941.0, 7203.0, 966.0, 502.0, 265.0, 164.0, 98.0, 71.0, 35.0, 30.0, 18.0, 15.0, 10.0, 7.0, 6.0, 6.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-51.8125, -50.41552734375, -49.0185546875, -47.62158203125, -46.224609375, -44.82763671875, -43.4306640625, -42.03369140625, -40.63671875, -39.23974609375, -37.8427734375, -36.44580078125, -35.048828125, -33.65185546875, -32.2548828125, -30.85791015625, -29.4609375, -28.06396484375, -26.6669921875, -25.27001953125, -23.873046875, -22.47607421875, -21.0791015625, -19.68212890625, -18.28515625, -16.88818359375, -15.4912109375, -14.09423828125, -12.697265625, -11.30029296875, -9.9033203125, -8.50634765625, -7.109375, -5.71240234375, -4.3154296875, -2.91845703125, -1.521484375, -0.12451171875, 1.2724609375, 2.66943359375, 4.06640625, 5.46337890625, 6.8603515625, 8.25732421875, 9.654296875, 11.05126953125, 12.4482421875, 13.84521484375, 15.2421875, 16.63916015625, 18.0361328125, 19.43310546875, 20.830078125, 22.22705078125, 23.6240234375, 25.02099609375, 26.41796875, 27.81494140625, 29.2119140625, 30.60888671875, 32.005859375, 33.40283203125, 34.7998046875, 36.19677734375, 37.59375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 98.0, 528.0, 359.0, 17.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.33464050292969, -120.4271011352539, -116.51956176757812, -112.61202239990234, -108.70448303222656, -104.79693603515625, -100.88939666748047, -96.98185729980469, -93.0743179321289, -89.16677856445312, -85.25923919677734, -81.35169982910156, -77.44415283203125, -73.53662109375, -69.62907409667969, -65.7215347290039, -61.813995361328125, -57.906455993652344, -53.99891662597656, -50.091373443603516, -46.183834075927734, -42.27629470825195, -38.368751525878906, -34.461212158203125, -30.553672790527344, -26.646133422851562, -22.73859214782715, -18.831050872802734, -14.923511505126953, -11.015972137451172, -7.108430862426758, -3.2008895874023438, 0.7066497802734375, 4.614190101623535, 8.521730422973633, 12.42927074432373, 16.336811065673828, 20.24435043334961, 24.151891708374023, 28.059432983398438, 31.96697235107422, 35.87451171875, 39.78205108642578, 43.68959426879883, 47.59713363647461, 51.50467300415039, 55.41221618652344, 59.31975555419922, 63.227294921875, 67.13483428955078, 71.04237365722656, 74.94991302490234, 78.85745239257812, 82.76499938964844, 86.67253875732422, 90.580078125, 94.48761749267578, 98.39515686035156, 102.30269622802734, 106.21023559570312, 110.11778259277344, 114.02531433105469, 117.932861328125, 121.84040069580078, 125.74794006347656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 9.0, 2.0, 8.0, 8.0, 11.0, 14.0, 15.0, 21.0, 23.0, 26.0, 21.0, 24.0, 29.0, 31.0, 37.0, 48.0, 33.0, 43.0, 32.0, 49.0, 49.0, 52.0, 47.0, 43.0, 38.0, 33.0, 33.0, 29.0, 42.0, 30.0, 24.0, 11.0, 17.0, 15.0, 14.0, 8.0, 1.0, 11.0, 3.0, 6.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-52.30714797973633, -50.89025115966797, -49.473358154296875, -48.056461334228516, -46.639564514160156, -45.22267150878906, -43.8057746887207, -42.388877868652344, -40.97198486328125, -39.55508804321289, -38.1381950378418, -36.72129821777344, -35.304405212402344, -33.887508392333984, -32.470611572265625, -31.0537166595459, -29.636821746826172, -28.219926834106445, -26.80303192138672, -25.38613510131836, -23.969240188598633, -22.552345275878906, -21.135448455810547, -19.71855354309082, -18.301658630371094, -16.884763717651367, -15.467867851257324, -14.050971984863281, -12.634077072143555, -11.217182159423828, -9.800286293029785, -8.383390426635742, -6.966499328613281, -5.5496039390563965, -4.132708549499512, -2.715813159942627, -1.2989177703857422, 0.11797761917114258, 1.5348730087280273, 2.9517688751220703, 4.368663787841797, 5.785559177398682, 7.202454566955566, 8.61935043334961, 10.036245346069336, 11.453140258789062, 12.870036125183105, 14.286931991577148, 15.703826904296875, 17.1207218170166, 18.537616729736328, 19.954513549804688, 21.371408462524414, 22.78830337524414, 24.2052001953125, 25.622095108032227, 27.038990020751953, 28.45588493347168, 29.872779846191406, 31.289676666259766, 32.706573486328125, 34.12346649169922, 35.54036331176758, 36.95726013183594, 38.37415313720703]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 7.0, 18.0, 17.0, 23.0, 21.0, 36.0, 27.0, 43.0, 39.0, 48.0, 47.0, 41.0, 45.0, 65.0, 50.0, 57.0, 48.0, 51.0, 37.0, 47.0, 32.0, 33.0, 26.0, 30.0, 16.0, 14.0, 17.0, 8.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8984375, -7.60888671875, -7.3193359375, -7.02978515625, -6.740234375, -6.45068359375, -6.1611328125, -5.87158203125, -5.58203125, -5.29248046875, -5.0029296875, -4.71337890625, -4.423828125, -4.13427734375, -3.8447265625, -3.55517578125, -3.265625, -2.97607421875, -2.6865234375, -2.39697265625, -2.107421875, -1.81787109375, -1.5283203125, -1.23876953125, -0.94921875, -0.65966796875, -0.3701171875, -0.08056640625, 0.208984375, 0.49853515625, 0.7880859375, 1.07763671875, 1.3671875, 1.65673828125, 1.9462890625, 2.23583984375, 2.525390625, 2.81494140625, 3.1044921875, 3.39404296875, 3.68359375, 3.97314453125, 4.2626953125, 4.55224609375, 4.841796875, 5.13134765625, 5.4208984375, 5.71044921875, 6.0, 6.28955078125, 6.5791015625, 6.86865234375, 7.158203125, 7.44775390625, 7.7373046875, 8.02685546875, 8.31640625, 8.60595703125, 8.8955078125, 9.18505859375, 9.474609375, 9.76416015625, 10.0537109375, 10.34326171875, 10.6328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 7.0, 7.0, 11.0, 12.0, 18.0, 17.0, 22.0, 32.0, 52.0, 48.0, 105.0, 149.0, 246.0, 517.0, 1191.0, 4381.0, 24339.0, 267051.0, 1757420.0, 1838396.0, 269411.0, 24266.0, 4000.0, 1240.0, 508.0, 300.0, 162.0, 97.0, 75.0, 40.0, 33.0, 26.0, 21.0, 12.0, 10.0, 9.0, 11.0, 6.0, 10.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -12.0413818359375, -11.653076171875, -11.2647705078125, -10.87646484375, -10.4881591796875, -10.099853515625, -9.7115478515625, -9.3232421875, -8.9349365234375, -8.546630859375, -8.1583251953125, -7.77001953125, -7.3817138671875, -6.993408203125, -6.6051025390625, -6.216796875, -5.8284912109375, -5.440185546875, -5.0518798828125, -4.66357421875, -4.2752685546875, -3.886962890625, -3.4986572265625, -3.1103515625, -2.7220458984375, -2.333740234375, -1.9454345703125, -1.55712890625, -1.1688232421875, -0.780517578125, -0.3922119140625, -0.00390625, 0.3843994140625, 0.772705078125, 1.1610107421875, 1.54931640625, 1.9376220703125, 2.325927734375, 2.7142333984375, 3.1025390625, 3.4908447265625, 3.879150390625, 4.2674560546875, 4.65576171875, 5.0440673828125, 5.432373046875, 5.8206787109375, 6.208984375, 6.5972900390625, 6.985595703125, 7.3739013671875, 7.76220703125, 8.1505126953125, 8.538818359375, 8.9271240234375, 9.3154296875, 9.7037353515625, 10.092041015625, 10.4803466796875, 10.86865234375, 11.2569580078125, 11.645263671875, 12.0335693359375, 12.421875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 12.0, 19.0, 31.0, 27.0, 54.0, 67.0, 88.0, 161.0, 247.0, 300.0, 411.0, 492.0, 495.0, 464.0, 343.0, 245.0, 179.0, 114.0, 72.0, 51.0, 40.0, 26.0, 19.0, 21.0, 8.0, 9.0, 16.0, 6.0, 4.0, 2.0, 6.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.0234375, -9.7015380859375, -9.379638671875, -9.0577392578125, -8.73583984375, -8.4139404296875, -8.092041015625, -7.7701416015625, -7.4482421875, -7.1263427734375, -6.804443359375, -6.4825439453125, -6.16064453125, -5.8387451171875, -5.516845703125, -5.1949462890625, -4.873046875, -4.5511474609375, -4.229248046875, -3.9073486328125, -3.58544921875, -3.2635498046875, -2.941650390625, -2.6197509765625, -2.2978515625, -1.9759521484375, -1.654052734375, -1.3321533203125, -1.01025390625, -0.6883544921875, -0.366455078125, -0.0445556640625, 0.27734375, 0.5992431640625, 0.921142578125, 1.2430419921875, 1.56494140625, 1.8868408203125, 2.208740234375, 2.5306396484375, 2.8525390625, 3.1744384765625, 3.496337890625, 3.8182373046875, 4.14013671875, 4.4620361328125, 4.783935546875, 5.1058349609375, 5.427734375, 5.7496337890625, 6.071533203125, 6.3934326171875, 6.71533203125, 7.0372314453125, 7.359130859375, 7.6810302734375, 8.0029296875, 8.3248291015625, 8.646728515625, 8.9686279296875, 9.29052734375, 9.6124267578125, 9.934326171875, 10.2562255859375, 10.578125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 3.0, 9.0, 12.0, 12.0, 9.0, 13.0, 26.0, 31.0, 36.0, 51.0, 78.0, 104.0, 157.0, 253.0, 513.0, 1135.0, 3220.0, 12403.0, 73656.0, 839601.0, 2909842.0, 304459.0, 36760.0, 7676.0, 2222.0, 915.0, 389.0, 205.0, 130.0, 92.0, 63.0, 51.0, 31.0, 25.0, 19.0, 21.0, 8.0, 9.0, 10.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.15625, -15.6712646484375, -15.186279296875, -14.7012939453125, -14.21630859375, -13.7313232421875, -13.246337890625, -12.7613525390625, -12.2763671875, -11.7913818359375, -11.306396484375, -10.8214111328125, -10.33642578125, -9.8514404296875, -9.366455078125, -8.8814697265625, -8.396484375, -7.9114990234375, -7.426513671875, -6.9415283203125, -6.45654296875, -5.9715576171875, -5.486572265625, -5.0015869140625, -4.5166015625, -4.0316162109375, -3.546630859375, -3.0616455078125, -2.57666015625, -2.0916748046875, -1.606689453125, -1.1217041015625, -0.63671875, -0.1517333984375, 0.333251953125, 0.8182373046875, 1.30322265625, 1.7882080078125, 2.273193359375, 2.7581787109375, 3.2431640625, 3.7281494140625, 4.213134765625, 4.6981201171875, 5.18310546875, 5.6680908203125, 6.153076171875, 6.6380615234375, 7.123046875, 7.6080322265625, 8.093017578125, 8.5780029296875, 9.06298828125, 9.5479736328125, 10.032958984375, 10.5179443359375, 11.0029296875, 11.4879150390625, 11.972900390625, 12.4578857421875, 12.94287109375, 13.4278564453125, 13.912841796875, 14.3978271484375, 14.8828125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 23.0, 105.0, 276.0, 365.0, 173.0, 52.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.252296447753906, -29.078163146972656, -25.90403175354004, -22.729900360107422, -19.555767059326172, -16.381633758544922, -13.207502365112305, -10.033370971679688, -6.8592376708984375, -3.685105323791504, -0.5109729766845703, 2.6631593704223633, 5.837291717529297, 9.01142406463623, 12.185556411743164, 15.359687805175781, 18.53382110595703, 21.70795440673828, 24.8820858001709, 28.056217193603516, 31.230350494384766, 34.404483795166016, 37.57861328125, 40.75274658203125, 43.9268798828125, 47.10101318359375, 50.275146484375, 53.449275970458984, 56.623409271240234, 59.797542572021484, 62.97167205810547, 66.14580535888672, 69.31993103027344, 72.49406433105469, 75.66819763183594, 78.84233093261719, 82.01646423339844, 85.19058990478516, 88.3647232055664, 91.53885650634766, 94.7129898071289, 97.88712310791016, 101.0612564086914, 104.23538970947266, 107.40951538085938, 110.58364868164062, 113.75778198242188, 116.93191528320312, 120.10604858398438, 123.28018188476562, 126.45431518554688, 129.62844848632812, 132.80258178710938, 135.97671508789062, 139.15084838867188, 142.32498168945312, 145.49911499023438, 148.67324829101562, 151.84738159179688, 155.02151489257812, 158.19564819335938, 161.36978149414062, 164.54391479492188, 167.71804809570312, 170.8921661376953]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 11.0, 12.0, 15.0, 14.0, 18.0, 28.0, 32.0, 24.0, 33.0, 33.0, 36.0, 48.0, 39.0, 75.0, 31.0, 49.0, 51.0, 48.0, 38.0, 39.0, 33.0, 30.0, 33.0, 50.0, 28.0, 27.0, 15.0, 18.0, 20.0, 13.0, 16.0, 7.0, 4.0, 8.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.34954833984375, -40.12251281738281, -38.89547348022461, -37.66843795776367, -36.44139862060547, -35.21436309814453, -33.98732376098633, -32.76028823852539, -31.53325080871582, -30.30621337890625, -29.07917594909668, -27.85213851928711, -26.625102996826172, -25.39806365966797, -24.17102813720703, -22.94399070739746, -21.71695327758789, -20.48991584777832, -19.26287841796875, -18.03584098815918, -16.80880355834961, -15.581767082214355, -14.354730606079102, -13.127693176269531, -11.900655746459961, -10.67361831665039, -9.44658088684082, -8.219544410705566, -6.992506980895996, -5.765469551086426, -4.538432598114014, -3.3113956451416016, -2.0843582153320312, -0.85732102394104, 0.36971616744995117, 1.5967533588409424, 2.8237905502319336, 4.050827980041504, 5.277864933013916, 6.504901885986328, 7.731939315795898, 8.958976745605469, 10.186014175415039, 11.413050651550293, 12.640088081359863, 13.867125511169434, 15.094161987304688, 16.321199417114258, 17.548236846923828, 18.7752742767334, 20.00231170654297, 21.22934913635254, 22.45638656616211, 23.683422088623047, 24.910459518432617, 26.137496948242188, 27.364534378051758, 28.591571807861328, 29.8186092376709, 31.04564666748047, 32.272682189941406, 33.49972152709961, 34.72675704956055, 35.95379638671875, 37.18083190917969]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 4.0, 2.0, 5.0, 13.0, 9.0, 12.0, 8.0, 14.0, 16.0, 23.0, 18.0, 35.0, 27.0, 41.0, 36.0, 33.0, 49.0, 54.0, 39.0, 50.0, 38.0, 48.0, 41.0, 34.0, 40.0, 38.0, 45.0, 32.0, 25.0, 19.0, 28.0, 19.0, 18.0, 23.0, 10.0, 7.0, 11.0, 11.0, 10.0, 4.0, 4.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.82061767578125, -6.5748291015625, -6.32904052734375, -6.083251953125, -5.83746337890625, -5.5916748046875, -5.34588623046875, -5.10009765625, -4.85430908203125, -4.6085205078125, -4.36273193359375, -4.116943359375, -3.87115478515625, -3.6253662109375, -3.37957763671875, -3.1337890625, -2.88800048828125, -2.6422119140625, -2.39642333984375, -2.150634765625, -1.90484619140625, -1.6590576171875, -1.41326904296875, -1.16748046875, -0.92169189453125, -0.6759033203125, -0.43011474609375, -0.184326171875, 0.06146240234375, 0.3072509765625, 0.55303955078125, 0.798828125, 1.04461669921875, 1.2904052734375, 1.53619384765625, 1.781982421875, 2.02777099609375, 2.2735595703125, 2.51934814453125, 2.76513671875, 3.01092529296875, 3.2567138671875, 3.50250244140625, 3.748291015625, 3.99407958984375, 4.2398681640625, 4.48565673828125, 4.7314453125, 4.97723388671875, 5.2230224609375, 5.46881103515625, 5.714599609375, 5.96038818359375, 6.2061767578125, 6.45196533203125, 6.69775390625, 6.94354248046875, 7.1893310546875, 7.43511962890625, 7.680908203125, 7.92669677734375, 8.1724853515625, 8.41827392578125, 8.6640625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 18.0, 21.0, 24.0, 36.0, 56.0, 103.0, 149.0, 272.0, 352.0, 534.0, 813.0, 1307.0, 1978.0, 2791.0, 4507.0, 6986.0, 10679.0, 17438.0, 28368.0, 49150.0, 90002.0, 200342.0, 351851.0, 121930.0, 63948.0, 36240.0, 21625.0, 13290.0, 8347.0, 5431.0, 3400.0, 2283.0, 1538.0, 958.0, 586.0, 418.0, 294.0, 163.0, 122.0, 74.0, 44.0, 28.0, 19.0, 12.0, 11.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0078125, -1.9473724365234375, -1.886932373046875, -1.8264923095703125, -1.76605224609375, -1.7056121826171875, -1.645172119140625, -1.5847320556640625, -1.5242919921875, -1.4638519287109375, -1.403411865234375, -1.3429718017578125, -1.28253173828125, -1.2220916748046875, -1.161651611328125, -1.1012115478515625, -1.040771484375, -0.9803314208984375, -0.919891357421875, -0.8594512939453125, -0.79901123046875, -0.7385711669921875, -0.678131103515625, -0.6176910400390625, -0.5572509765625, -0.4968109130859375, -0.436370849609375, -0.3759307861328125, -0.31549072265625, -0.2550506591796875, -0.194610595703125, -0.1341705322265625, -0.07373046875, -0.0132904052734375, 0.047149658203125, 0.1075897216796875, 0.16802978515625, 0.2284698486328125, 0.288909912109375, 0.3493499755859375, 0.4097900390625, 0.4702301025390625, 0.530670166015625, 0.5911102294921875, 0.65155029296875, 0.7119903564453125, 0.772430419921875, 0.8328704833984375, 0.893310546875, 0.9537506103515625, 1.014190673828125, 1.0746307373046875, 1.13507080078125, 1.1955108642578125, 1.255950927734375, 1.3163909912109375, 1.3768310546875, 1.4372711181640625, 1.497711181640625, 1.5581512451171875, 1.61859130859375, 1.6790313720703125, 1.739471435546875, 1.7999114990234375, 1.8603515625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 6.0, 10.0, 4.0, 21.0, 15.0, 12.0, 22.0, 27.0, 21.0, 20.0, 25.0, 20.0, 36.0, 53.0, 33.0, 35.0, 32.0, 36.0, 1072.0, 50.0, 40.0, 58.0, 39.0, 37.0, 35.0, 35.0, 32.0, 24.0, 24.0, 27.0, 22.0, 19.0, 16.0, 9.0, 4.0, 13.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0], "bins": [-5.1484375, -4.998779296875, -4.84912109375, -4.699462890625, -4.5498046875, -4.400146484375, -4.25048828125, -4.100830078125, -3.951171875, -3.801513671875, -3.65185546875, -3.502197265625, -3.3525390625, -3.202880859375, -3.05322265625, -2.903564453125, -2.75390625, -2.604248046875, -2.45458984375, -2.304931640625, -2.1552734375, -2.005615234375, -1.85595703125, -1.706298828125, -1.556640625, -1.406982421875, -1.25732421875, -1.107666015625, -0.9580078125, -0.808349609375, -0.65869140625, -0.509033203125, -0.359375, -0.209716796875, -0.06005859375, 0.089599609375, 0.2392578125, 0.388916015625, 0.53857421875, 0.688232421875, 0.837890625, 0.987548828125, 1.13720703125, 1.286865234375, 1.4365234375, 1.586181640625, 1.73583984375, 1.885498046875, 2.03515625, 2.184814453125, 2.33447265625, 2.484130859375, 2.6337890625, 2.783447265625, 2.93310546875, 3.082763671875, 3.232421875, 3.382080078125, 3.53173828125, 3.681396484375, 3.8310546875, 3.980712890625, 4.13037109375, 4.280029296875, 4.4296875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 16.0, 13.0, 13.0, 24.0, 42.0, 55.0, 78.0, 98.0, 178.0, 285.0, 374.0, 551.0, 908.0, 1477.0, 2415.0, 3707.0, 6157.0, 10055.0, 17031.0, 28729.0, 50807.0, 95651.0, 227781.0, 1390705.0, 115626.0, 60479.0, 34160.0, 19567.0, 11544.0, 7034.0, 4220.0, 2577.0, 1706.0, 1079.0, 659.0, 440.0, 299.0, 224.0, 118.0, 76.0, 59.0, 29.0, 32.0, 13.0, 16.0, 8.0, 15.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7373046875, -1.6776885986328125, -1.618072509765625, -1.5584564208984375, -1.49884033203125, -1.4392242431640625, -1.379608154296875, -1.3199920654296875, -1.2603759765625, -1.2007598876953125, -1.141143798828125, -1.0815277099609375, -1.02191162109375, -0.9622955322265625, -0.902679443359375, -0.8430633544921875, -0.783447265625, -0.7238311767578125, -0.664215087890625, -0.6045989990234375, -0.54498291015625, -0.4853668212890625, -0.425750732421875, -0.3661346435546875, -0.3065185546875, -0.2469024658203125, -0.187286376953125, -0.1276702880859375, -0.06805419921875, -0.0084381103515625, 0.051177978515625, 0.1107940673828125, 0.17041015625, 0.2300262451171875, 0.289642333984375, 0.3492584228515625, 0.40887451171875, 0.4684906005859375, 0.528106689453125, 0.5877227783203125, 0.6473388671875, 0.7069549560546875, 0.766571044921875, 0.8261871337890625, 0.88580322265625, 0.9454193115234375, 1.005035400390625, 1.0646514892578125, 1.124267578125, 1.1838836669921875, 1.243499755859375, 1.3031158447265625, 1.36273193359375, 1.4223480224609375, 1.481964111328125, 1.5415802001953125, 1.6011962890625, 1.6608123779296875, 1.720428466796875, 1.7800445556640625, 1.83966064453125, 1.8992767333984375, 1.958892822265625, 2.0185089111328125, 2.078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 11.0, 5.0, 8.0, 8.0, 15.0, 15.0, 21.0, 26.0, 36.0, 56.0, 63.0, 94.0, 101.0, 105.0, 112.0, 62.0, 60.0, 30.0, 28.0, 27.0, 19.0, 11.0, 14.0, 11.0, 7.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001430511474609375, -0.0013874918222427368, -0.0013444721698760986, -0.0013014525175094604, -0.0012584328651428223, -0.001215413212776184, -0.001172393560409546, -0.0011293739080429077, -0.0010863542556762695, -0.0010433346033096313, -0.0010003149509429932, -0.000957295298576355, -0.0009142756462097168, -0.0008712559938430786, -0.0008282363414764404, -0.0007852166891098022, -0.0007421970367431641, -0.0006991773843765259, -0.0006561577320098877, -0.0006131380796432495, -0.0005701184272766113, -0.0005270987749099731, -0.00048407912254333496, -0.0004410594701766968, -0.0003980398178100586, -0.0003550201654434204, -0.0003120005130767822, -0.00026898086071014404, -0.00022596120834350586, -0.00018294155597686768, -0.0001399219036102295, -9.690225124359131e-05, -5.3882598876953125e-05, -1.0862946510314941e-05, 3.215670585632324e-05, 7.517635822296143e-05, 0.00011819601058959961, 0.0001612156629562378, 0.00020423531532287598, 0.00024725496768951416, 0.00029027462005615234, 0.00033329427242279053, 0.0003763139247894287, 0.0004193335771560669, 0.0004623532295227051, 0.0005053728818893433, 0.0005483925342559814, 0.0005914121866226196, 0.0006344318389892578, 0.000677451491355896, 0.0007204711437225342, 0.0007634907960891724, 0.0008065104484558105, 0.0008495301008224487, 0.0008925497531890869, 0.0009355694055557251, 0.0009785890579223633, 0.0010216087102890015, 0.0010646283626556396, 0.0011076480150222778, 0.001150667667388916, 0.0011936873197555542, 0.0012367069721221924, 0.0012797266244888306, 0.0013227462768554688]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 6.0, 9.0, 11.0, 15.0, 16.0, 26.0, 37.0, 63.0, 55.0, 102.0, 144.0, 253.0, 515.0, 1769.0, 947308.0, 96011.0, 1038.0, 405.0, 243.0, 145.0, 90.0, 61.0, 46.0, 27.0, 23.0, 21.0, 17.0, 11.0, 12.0, 11.0, 4.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.025848388671875, -0.02501058578491211, -0.02417278289794922, -0.023334980010986328, -0.022497177124023438, -0.021659374237060547, -0.020821571350097656, -0.019983768463134766, -0.019145965576171875, -0.018308162689208984, -0.017470359802246094, -0.016632556915283203, -0.015794754028320312, -0.014956951141357422, -0.014119148254394531, -0.01328134536743164, -0.01244354248046875, -0.01160573959350586, -0.010767936706542969, -0.009930133819580078, -0.009092330932617188, -0.008254528045654297, -0.007416725158691406, -0.006578922271728516, -0.005741119384765625, -0.004903316497802734, -0.004065513610839844, -0.003227710723876953, -0.0023899078369140625, -0.0015521049499511719, -0.0007143020629882812, 0.00012350082397460938, 0.0009613037109375, 0.0017991065979003906, 0.0026369094848632812, 0.003474712371826172, 0.0043125152587890625, 0.005150318145751953, 0.005988121032714844, 0.006825923919677734, 0.007663726806640625, 0.008501529693603516, 0.009339332580566406, 0.010177135467529297, 0.011014938354492188, 0.011852741241455078, 0.012690544128417969, 0.01352834701538086, 0.01436614990234375, 0.01520395278930664, 0.01604175567626953, 0.016879558563232422, 0.017717361450195312, 0.018555164337158203, 0.019392967224121094, 0.020230770111083984, 0.021068572998046875, 0.021906375885009766, 0.022744178771972656, 0.023581981658935547, 0.024419784545898438, 0.025257587432861328, 0.02609539031982422, 0.02693319320678711, 0.02777099609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 16.0, 43.0, 137.0, 243.0, 319.0, 157.0, 64.0, 24.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042936060344800353, -0.0003769064205698669, -0.0003244522667955607, -0.00027199811302125454, -0.0002195439301431179, -0.00016708974726498127, -0.00011463559349067509, -6.218143971636891e-05, -9.727256838232279e-06, 4.272691148798913e-05, 9.518107981421053e-05, 0.00014763524814043194, 0.00020008941646665335, 0.00025254359934479, 0.00030499775311909616, 0.00035745190689340234, 0.00040990608977153897, 0.0004623602726496756, 0.0005148143973201513, 0.000567268580198288, 0.0006197227630764246, 0.0006721769459545612, 0.0007246311288326979, 0.0007770852535031736, 0.0008295394363813102, 0.0008819936192594469, 0.0009344477439299226, 0.0009869019268080592, 0.0010393561096861959, 0.0010918102925643325, 0.0011442644754424691, 0.001196718541905284, 0.0012491727247834206, 0.0013016269076615572, 0.0013540810905396938, 0.0014065352734178305, 0.001458989456295967, 0.0015114436391741037, 0.0015638977056369185, 0.0016163518885150552, 0.0016688060713931918, 0.0017212602542713284, 0.001773714437149465, 0.0018261686200276017, 0.0018786226864904165, 0.0019310768693685532, 0.00198353105224669, 0.0020359852351248264, 0.002088439418002963, 0.0021408936008810997, 0.0021933477837592363, 0.002245801966637373, 0.0022982561495155096, 0.0023507103323936462, 0.002403164515271783, 0.0024556186981499195, 0.0025080726481974125, 0.002560526831075549, 0.0026129810139536858, 0.0026654351968318224, 0.002717889379709959, 0.0027703435625880957, 0.0028227977454662323, 0.0028752516955137253, 0.0029277061112225056]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 15.0, 11.0, 13.0, 20.0, 14.0, 19.0, 17.0, 17.0, 21.0, 32.0, 36.0, 31.0, 36.0, 31.0, 46.0, 31.0, 57.0, 50.0, 32.0, 42.0, 36.0, 33.0, 37.0, 32.0, 35.0, 36.0, 29.0, 24.0, 20.0, 25.0, 19.0, 13.0, 20.0, 15.0, 7.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006527304649353027, -0.0006332546472549438, -0.000613778829574585, -0.0005943030118942261, -0.0005748271942138672, -0.0005553513765335083, -0.0005358755588531494, -0.0005163997411727905, -0.0004969239234924316, -0.00047744810581207275, -0.00045797228813171387, -0.000438496470451355, -0.0004190206527709961, -0.0003995448350906372, -0.0003800690174102783, -0.00036059319972991943, -0.00034111738204956055, -0.00032164156436920166, -0.0003021657466888428, -0.0002826899290084839, -0.000263214111328125, -0.0002437382936477661, -0.00022426247596740723, -0.00020478665828704834, -0.00018531084060668945, -0.00016583502292633057, -0.00014635920524597168, -0.0001268833875656128, -0.0001074075698852539, -8.793175220489502e-05, -6.845593452453613e-05, -4.8980116844177246e-05, -2.950429916381836e-05, -1.0028481483459473e-05, 9.447336196899414e-06, 2.89231538772583e-05, 4.839897155761719e-05, 6.787478923797607e-05, 8.735060691833496e-05, 0.00010682642459869385, 0.00012630224227905273, 0.00014577805995941162, 0.0001652538776397705, 0.0001847296953201294, 0.00020420551300048828, 0.00022368133068084717, 0.00024315714836120605, 0.00026263296604156494, 0.00028210878372192383, 0.0003015846014022827, 0.0003210604190826416, 0.0003405362367630005, 0.0003600120544433594, 0.00037948787212371826, 0.00039896368980407715, 0.00041843950748443604, 0.0004379153251647949, 0.0004573911428451538, 0.0004768669605255127, 0.0004963427782058716, 0.0005158185958862305, 0.0005352944135665894, 0.0005547702312469482, 0.0005742460489273071, 0.000593721866607666]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 4.0, 2.0, 5.0, 13.0, 9.0, 12.0, 8.0, 14.0, 16.0, 23.0, 18.0, 35.0, 27.0, 41.0, 36.0, 33.0, 49.0, 54.0, 39.0, 50.0, 38.0, 48.0, 41.0, 34.0, 40.0, 38.0, 45.0, 32.0, 25.0, 19.0, 28.0, 19.0, 18.0, 23.0, 10.0, 7.0, 11.0, 11.0, 10.0, 4.0, 4.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.82061767578125, -6.5748291015625, -6.32904052734375, -6.083251953125, -5.83746337890625, -5.5916748046875, -5.34588623046875, -5.10009765625, -4.85430908203125, -4.6085205078125, -4.36273193359375, -4.116943359375, -3.87115478515625, -3.6253662109375, -3.37957763671875, -3.1337890625, -2.88800048828125, -2.6422119140625, -2.39642333984375, -2.150634765625, -1.90484619140625, -1.6590576171875, -1.41326904296875, -1.16748046875, -0.92169189453125, -0.6759033203125, -0.43011474609375, -0.184326171875, 0.06146240234375, 0.3072509765625, 0.55303955078125, 0.798828125, 1.04461669921875, 1.2904052734375, 1.53619384765625, 1.781982421875, 2.02777099609375, 2.2735595703125, 2.51934814453125, 2.76513671875, 3.01092529296875, 3.2567138671875, 3.50250244140625, 3.748291015625, 3.99407958984375, 4.2398681640625, 4.48565673828125, 4.7314453125, 4.97723388671875, 5.2230224609375, 5.46881103515625, 5.714599609375, 5.96038818359375, 6.2061767578125, 6.45196533203125, 6.69775390625, 6.94354248046875, 7.1893310546875, 7.43511962890625, 7.680908203125, 7.92669677734375, 8.1724853515625, 8.41827392578125, 8.6640625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 8.0, 8.0, 15.0, 11.0, 20.0, 31.0, 47.0, 53.0, 91.0, 98.0, 102.0, 157.0, 228.0, 318.0, 443.0, 657.0, 1247.0, 2224.0, 5696.0, 19549.0, 75006.0, 259103.0, 428283.0, 182775.0, 50066.0, 13111.0, 4287.0, 1874.0, 994.0, 550.0, 391.0, 278.0, 214.0, 141.0, 122.0, 87.0, 68.0, 52.0, 35.0, 33.0, 25.0, 20.0, 15.0, 10.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0], "bins": [-10.5546875, -10.256103515625, -9.95751953125, -9.658935546875, -9.3603515625, -9.061767578125, -8.76318359375, -8.464599609375, -8.166015625, -7.867431640625, -7.56884765625, -7.270263671875, -6.9716796875, -6.673095703125, -6.37451171875, -6.075927734375, -5.77734375, -5.478759765625, -5.18017578125, -4.881591796875, -4.5830078125, -4.284423828125, -3.98583984375, -3.687255859375, -3.388671875, -3.090087890625, -2.79150390625, -2.492919921875, -2.1943359375, -1.895751953125, -1.59716796875, -1.298583984375, -1.0, -0.701416015625, -0.40283203125, -0.104248046875, 0.1943359375, 0.492919921875, 0.79150390625, 1.090087890625, 1.388671875, 1.687255859375, 1.98583984375, 2.284423828125, 2.5830078125, 2.881591796875, 3.18017578125, 3.478759765625, 3.77734375, 4.075927734375, 4.37451171875, 4.673095703125, 4.9716796875, 5.270263671875, 5.56884765625, 5.867431640625, 6.166015625, 6.464599609375, 6.76318359375, 7.061767578125, 7.3603515625, 7.658935546875, 7.95751953125, 8.256103515625, 8.5546875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 3.0, 8.0, 6.0, 12.0, 12.0, 14.0, 29.0, 21.0, 21.0, 38.0, 37.0, 27.0, 55.0, 53.0, 60.0, 78.0, 112.0, 274.0, 1475.0, 199.0, 108.0, 64.0, 60.0, 30.0, 49.0, 31.0, 31.0, 23.0, 19.0, 22.0, 19.0, 12.0, 14.0, 9.0, 6.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.631591796875, -20.98193359375, -20.332275390625, -19.6826171875, -19.032958984375, -18.38330078125, -17.733642578125, -17.083984375, -16.434326171875, -15.78466796875, -15.135009765625, -14.4853515625, -13.835693359375, -13.18603515625, -12.536376953125, -11.88671875, -11.237060546875, -10.58740234375, -9.937744140625, -9.2880859375, -8.638427734375, -7.98876953125, -7.339111328125, -6.689453125, -6.039794921875, -5.39013671875, -4.740478515625, -4.0908203125, -3.441162109375, -2.79150390625, -2.141845703125, -1.4921875, -0.842529296875, -0.19287109375, 0.456787109375, 1.1064453125, 1.756103515625, 2.40576171875, 3.055419921875, 3.705078125, 4.354736328125, 5.00439453125, 5.654052734375, 6.3037109375, 6.953369140625, 7.60302734375, 8.252685546875, 8.90234375, 9.552001953125, 10.20166015625, 10.851318359375, 11.5009765625, 12.150634765625, 12.80029296875, 13.449951171875, 14.099609375, 14.749267578125, 15.39892578125, 16.048583984375, 16.6982421875, 17.347900390625, 17.99755859375, 18.647216796875, 19.296875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 7.0, 6.0, 7.0, 9.0, 14.0, 11.0, 14.0, 24.0, 30.0, 51.0, 73.0, 105.0, 158.0, 217.0, 297.0, 427.0, 769.0, 1707.0, 22685.0, 2749669.0, 361043.0, 5213.0, 1115.0, 624.0, 419.0, 249.0, 178.0, 137.0, 107.0, 81.0, 46.0, 45.0, 34.0, 30.0, 15.0, 17.0, 13.0, 13.0, 5.0, 8.0, 9.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.59765625, -31.5390625, -30.48046875, -29.421875, -28.36328125, -27.3046875, -26.24609375, -25.1875, -24.12890625, -23.0703125, -22.01171875, -20.953125, -19.89453125, -18.8359375, -17.77734375, -16.71875, -15.66015625, -14.6015625, -13.54296875, -12.484375, -11.42578125, -10.3671875, -9.30859375, -8.25, -7.19140625, -6.1328125, -5.07421875, -4.015625, -2.95703125, -1.8984375, -0.83984375, 0.21875, 1.27734375, 2.3359375, 3.39453125, 4.453125, 5.51171875, 6.5703125, 7.62890625, 8.6875, 9.74609375, 10.8046875, 11.86328125, 12.921875, 13.98046875, 15.0390625, 16.09765625, 17.15625, 18.21484375, 19.2734375, 20.33203125, 21.390625, 22.44921875, 23.5078125, 24.56640625, 25.625, 26.68359375, 27.7421875, 28.80078125, 29.859375, 30.91796875, 31.9765625, 33.03515625, 34.09375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 36.0, 612.0, 357.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.7442626953125, -115.21851348876953, -109.69276428222656, -104.1670150756836, -98.64126586914062, -93.11551666259766, -87.58976745605469, -82.06401062011719, -76.53826904296875, -71.01251983642578, -65.48677062988281, -59.961021423339844, -54.435272216796875, -48.909523010253906, -43.38376998901367, -37.8580207824707, -32.33226776123047, -26.8065185546875, -21.28076934814453, -15.75501823425293, -10.229269027709961, -4.703519821166992, 0.8222312927246094, 6.347980499267578, 11.873729705810547, 17.399478912353516, 22.925228118896484, 28.450979232788086, 33.97673034667969, 39.502479553222656, 45.028228759765625, 50.553977966308594, 56.07972717285156, 61.60547637939453, 67.1312255859375, 72.65697479248047, 78.18272399902344, 83.7084732055664, 89.23422241210938, 94.75997924804688, 100.28572082519531, 105.81147003173828, 111.33721923828125, 116.86296844482422, 122.38871765136719, 127.91446685791016, 133.44021606445312, 138.96597290039062, 144.49172973632812, 150.01748657226562, 155.54322814941406, 161.06898498535156, 166.5947265625, 172.1204833984375, 177.64622497558594, 183.17198181152344, 188.69772338867188, 194.22348022460938, 199.7492218017578, 205.2749786376953, 210.80072021484375, 216.32647705078125, 221.8522186279297, 227.3779754638672, 232.90371704101562]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 3.0, 7.0, 16.0, 18.0, 19.0, 27.0, 21.0, 17.0, 27.0, 40.0, 35.0, 31.0, 52.0, 42.0, 42.0, 33.0, 51.0, 50.0, 39.0, 38.0, 47.0, 51.0, 43.0, 30.0, 30.0, 21.0, 27.0, 23.0, 17.0, 16.0, 13.0, 10.0, 16.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-47.08586502075195, -45.65842056274414, -44.230979919433594, -42.80353546142578, -41.37609100341797, -39.948646545410156, -38.52120590209961, -37.0937614440918, -35.66632080078125, -34.23887634277344, -32.81143569946289, -31.383991241455078, -29.956546783447266, -28.529104232788086, -27.101661682128906, -25.674217224121094, -24.24677276611328, -22.8193302154541, -21.39188575744629, -19.96444320678711, -18.536998748779297, -17.109556198120117, -15.682113647460938, -14.254670143127441, -12.827226638793945, -11.39978313446045, -9.972339630126953, -8.544897079467773, -7.117453575134277, -5.690010070800781, -4.262567520141602, -2.8351240158081055, -1.407684326171875, 0.019758939743041992, 1.447202205657959, 2.874645233154297, 4.302088737487793, 5.729532241821289, 7.156974792480469, 8.584418296813965, 10.011861801147461, 11.439305305480957, 12.866748809814453, 14.294191360473633, 15.721634864807129, 17.149078369140625, 18.576520919799805, 20.003963470458984, 21.431407928466797, 22.858850479125977, 24.28629493713379, 25.71373748779297, 27.14118194580078, 28.56862449645996, 29.99606704711914, 31.423511505126953, 32.8509521484375, 34.27839660644531, 35.70583724975586, 37.13328170776367, 38.560726165771484, 39.98816680908203, 41.415611267089844, 42.843055725097656, 44.27050018310547]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 9.0, 4.0, 17.0, 9.0, 17.0, 21.0, 30.0, 22.0, 29.0, 33.0, 35.0, 36.0, 53.0, 46.0, 40.0, 66.0, 50.0, 60.0, 48.0, 40.0, 50.0, 37.0, 26.0, 32.0, 15.0, 35.0, 22.0, 18.0, 15.0, 25.0, 12.0, 15.0, 7.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3828125, -7.1075439453125, -6.832275390625, -6.5570068359375, -6.28173828125, -6.0064697265625, -5.731201171875, -5.4559326171875, -5.1806640625, -4.9053955078125, -4.630126953125, -4.3548583984375, -4.07958984375, -3.8043212890625, -3.529052734375, -3.2537841796875, -2.978515625, -2.7032470703125, -2.427978515625, -2.1527099609375, -1.87744140625, -1.6021728515625, -1.326904296875, -1.0516357421875, -0.7763671875, -0.5010986328125, -0.225830078125, 0.0494384765625, 0.32470703125, 0.5999755859375, 0.875244140625, 1.1505126953125, 1.42578125, 1.7010498046875, 1.976318359375, 2.2515869140625, 2.52685546875, 2.8021240234375, 3.077392578125, 3.3526611328125, 3.6279296875, 3.9031982421875, 4.178466796875, 4.4537353515625, 4.72900390625, 5.0042724609375, 5.279541015625, 5.5548095703125, 5.830078125, 6.1053466796875, 6.380615234375, 6.6558837890625, 6.93115234375, 7.2064208984375, 7.481689453125, 7.7569580078125, 8.0322265625, 8.3074951171875, 8.582763671875, 8.8580322265625, 9.13330078125, 9.4085693359375, 9.683837890625, 9.9591064453125, 10.234375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 8.0, 7.0, 5.0, 12.0, 18.0, 25.0, 31.0, 30.0, 37.0, 48.0, 66.0, 108.0, 118.0, 165.0, 261.0, 325.0, 411.0, 800.0, 1843393.0, 2345912.0, 784.0, 442.0, 309.0, 234.0, 168.0, 136.0, 96.0, 76.0, 49.0, 43.0, 31.0, 21.0, 15.0, 26.0, 12.0, 9.0, 8.0, 10.0, 7.0, 5.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-104.3125, -101.0537109375, -97.794921875, -94.5361328125, -91.27734375, -88.0185546875, -84.759765625, -81.5009765625, -78.2421875, -74.9833984375, -71.724609375, -68.4658203125, -65.20703125, -61.9482421875, -58.689453125, -55.4306640625, -52.171875, -48.9130859375, -45.654296875, -42.3955078125, -39.13671875, -35.8779296875, -32.619140625, -29.3603515625, -26.1015625, -22.8427734375, -19.583984375, -16.3251953125, -13.06640625, -9.8076171875, -6.548828125, -3.2900390625, -0.03125, 3.2275390625, 6.486328125, 9.7451171875, 13.00390625, 16.2626953125, 19.521484375, 22.7802734375, 26.0390625, 29.2978515625, 32.556640625, 35.8154296875, 39.07421875, 42.3330078125, 45.591796875, 48.8505859375, 52.109375, 55.3681640625, 58.626953125, 61.8857421875, 65.14453125, 68.4033203125, 71.662109375, 74.9208984375, 78.1796875, 81.4384765625, 84.697265625, 87.9560546875, 91.21484375, 94.4736328125, 97.732421875, 100.9912109375, 104.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 10.0, 6.0, 8.0, 18.0, 17.0, 12.0, 24.0, 33.0, 48.0, 57.0, 84.0, 118.0, 203.0, 320.0, 444.0, 510.0, 560.0, 465.0, 361.0, 225.0, 142.0, 123.0, 59.0, 46.0, 38.0, 33.0, 26.0, 16.0, 16.0, 6.0, 7.0, 7.0, 5.0, 2.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8125, -10.4554443359375, -10.098388671875, -9.7413330078125, -9.38427734375, -9.0272216796875, -8.670166015625, -8.3131103515625, -7.9560546875, -7.5989990234375, -7.241943359375, -6.8848876953125, -6.52783203125, -6.1707763671875, -5.813720703125, -5.4566650390625, -5.099609375, -4.7425537109375, -4.385498046875, -4.0284423828125, -3.67138671875, -3.3143310546875, -2.957275390625, -2.6002197265625, -2.2431640625, -1.8861083984375, -1.529052734375, -1.1719970703125, -0.81494140625, -0.4578857421875, -0.100830078125, 0.2562255859375, 0.61328125, 0.9703369140625, 1.327392578125, 1.6844482421875, 2.04150390625, 2.3985595703125, 2.755615234375, 3.1126708984375, 3.4697265625, 3.8267822265625, 4.183837890625, 4.5408935546875, 4.89794921875, 5.2550048828125, 5.612060546875, 5.9691162109375, 6.326171875, 6.6832275390625, 7.040283203125, 7.3973388671875, 7.75439453125, 8.1114501953125, 8.468505859375, 8.8255615234375, 9.1826171875, 9.5396728515625, 9.896728515625, 10.2537841796875, 10.61083984375, 10.9678955078125, 11.324951171875, 11.6820068359375, 12.0390625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 9.0, 12.0, 20.0, 25.0, 27.0, 33.0, 44.0, 52.0, 57.0, 127.0, 219.0, 913.0, 31108.0, 4136596.0, 23557.0, 838.0, 206.0, 105.0, 84.0, 54.0, 37.0, 25.0, 35.0, 16.0, 13.0, 11.0, 11.0, 12.0, 3.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.78125, -47.74755859375, -45.7138671875, -43.68017578125, -41.646484375, -39.61279296875, -37.5791015625, -35.54541015625, -33.51171875, -31.47802734375, -29.4443359375, -27.41064453125, -25.376953125, -23.34326171875, -21.3095703125, -19.27587890625, -17.2421875, -15.20849609375, -13.1748046875, -11.14111328125, -9.107421875, -7.07373046875, -5.0400390625, -3.00634765625, -0.97265625, 1.06103515625, 3.0947265625, 5.12841796875, 7.162109375, 9.19580078125, 11.2294921875, 13.26318359375, 15.296875, 17.33056640625, 19.3642578125, 21.39794921875, 23.431640625, 25.46533203125, 27.4990234375, 29.53271484375, 31.56640625, 33.60009765625, 35.6337890625, 37.66748046875, 39.701171875, 41.73486328125, 43.7685546875, 45.80224609375, 47.8359375, 49.86962890625, 51.9033203125, 53.93701171875, 55.970703125, 58.00439453125, 60.0380859375, 62.07177734375, 64.10546875, 66.13916015625, 68.1728515625, 70.20654296875, 72.240234375, 74.27392578125, 76.3076171875, 78.34130859375, 80.375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 39.0, 99.0, 194.0, 277.0, 210.0, 122.0, 38.0, 15.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-46.22077178955078, -43.872989654541016, -41.52520751953125, -39.177425384521484, -36.82964324951172, -34.48185729980469, -32.13407516479492, -29.786293029785156, -27.43851089477539, -25.090728759765625, -22.74294662475586, -20.39516258239746, -18.047380447387695, -15.69959831237793, -13.351815223693848, -11.004032135009766, -8.65625, -6.308467388153076, -3.9606847763061523, -1.6129021644592285, 0.7348804473876953, 3.082662582397461, 5.430445671081543, 7.778228759765625, 10.12601089477539, 12.473793029785156, 14.821576118469238, 17.16935920715332, 19.517141342163086, 21.86492347717285, 24.21270751953125, 26.560489654541016, 28.908279418945312, 31.256061553955078, 33.603843688964844, 35.95162582397461, 38.299407958984375, 40.647193908691406, 42.99497604370117, 45.34275817871094, 47.6905403137207, 50.03832244873047, 52.386104583740234, 54.73388671875, 57.08167266845703, 59.42945098876953, 61.77723693847656, 64.12501525878906, 66.4728012084961, 68.82058715820312, 71.16836547851562, 73.51615142822266, 75.86392974853516, 78.21171569824219, 80.55949401855469, 82.90727996826172, 85.25506591796875, 87.60285186767578, 89.95063018798828, 92.29841613769531, 94.64619445800781, 96.99398040771484, 99.34175872802734, 101.68954467773438, 104.03732299804688]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 4.0, 5.0, 13.0, 10.0, 14.0, 12.0, 24.0, 29.0, 29.0, 19.0, 23.0, 30.0, 25.0, 27.0, 35.0, 30.0, 36.0, 40.0, 33.0, 36.0, 46.0, 35.0, 49.0, 41.0, 31.0, 38.0, 31.0, 21.0, 29.0, 33.0, 31.0, 29.0, 16.0, 13.0, 14.0, 10.0, 10.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.1537971496582, -35.039039611816406, -33.92428207397461, -32.80952453613281, -31.694765090942383, -30.580007553100586, -29.465248107910156, -28.35049057006836, -27.235733032226562, -26.120975494384766, -25.00621795654297, -23.89145851135254, -22.776700973510742, -21.661943435668945, -20.547183990478516, -19.43242645263672, -18.317668914794922, -17.202911376953125, -16.088153839111328, -14.973394393920898, -13.858636856079102, -12.743879318237305, -11.629120826721191, -10.514362335205078, -9.399604797363281, -8.284847259521484, -7.170088768005371, -6.055330753326416, -4.940572738647461, -3.825814723968506, -2.711056709289551, -1.5962986946105957, -0.481536865234375, 0.6332211494445801, 1.7479791641235352, 2.8627371788024902, 3.9774951934814453, 5.0922532081604, 6.2070112228393555, 7.3217692375183105, 8.436527252197266, 9.551284790039062, 10.666043281555176, 11.780801773071289, 12.895559310913086, 14.010316848754883, 15.125075340270996, 16.23983383178711, 17.354591369628906, 18.469348907470703, 19.5841064453125, 20.69886589050293, 21.813623428344727, 22.928380966186523, 24.043140411376953, 25.15789794921875, 26.272655487060547, 27.387413024902344, 28.50217056274414, 29.61693000793457, 30.731687545776367, 31.846445083618164, 32.961204528808594, 34.07596206665039, 35.19071960449219]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 14.0, 18.0, 4.0, 10.0, 19.0, 19.0, 25.0, 33.0, 25.0, 27.0, 27.0, 34.0, 38.0, 42.0, 40.0, 42.0, 42.0, 46.0, 40.0, 48.0, 51.0, 31.0, 38.0, 33.0, 36.0, 17.0, 31.0, 15.0, 23.0, 22.0, 18.0, 16.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.62225341796875, -6.3890380859375, -6.15582275390625, -5.922607421875, -5.68939208984375, -5.4561767578125, -5.22296142578125, -4.98974609375, -4.75653076171875, -4.5233154296875, -4.29010009765625, -4.056884765625, -3.82366943359375, -3.5904541015625, -3.35723876953125, -3.1240234375, -2.89080810546875, -2.6575927734375, -2.42437744140625, -2.191162109375, -1.95794677734375, -1.7247314453125, -1.49151611328125, -1.25830078125, -1.02508544921875, -0.7918701171875, -0.55865478515625, -0.325439453125, -0.09222412109375, 0.1409912109375, 0.37420654296875, 0.607421875, 0.84063720703125, 1.0738525390625, 1.30706787109375, 1.540283203125, 1.77349853515625, 2.0067138671875, 2.23992919921875, 2.47314453125, 2.70635986328125, 2.9395751953125, 3.17279052734375, 3.406005859375, 3.63922119140625, 3.8724365234375, 4.10565185546875, 4.3388671875, 4.57208251953125, 4.8052978515625, 5.03851318359375, 5.271728515625, 5.50494384765625, 5.7381591796875, 5.97137451171875, 6.20458984375, 6.43780517578125, 6.6710205078125, 6.90423583984375, 7.137451171875, 7.37066650390625, 7.6038818359375, 7.83709716796875, 8.0703125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 15.0, 30.0, 30.0, 44.0, 71.0, 108.0, 141.0, 205.0, 304.0, 393.0, 613.0, 928.0, 1348.0, 1899.0, 2774.0, 4146.0, 6303.0, 9041.0, 13847.0, 20802.0, 31433.0, 49884.0, 83988.0, 172683.0, 331891.0, 124924.0, 68136.0, 41514.0, 26990.0, 17700.0, 11881.0, 8054.0, 5140.0, 3626.0, 2411.0, 1686.0, 1128.0, 725.0, 559.0, 338.0, 263.0, 174.0, 112.0, 88.0, 49.0, 41.0, 35.0, 18.0, 15.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.615234375, -1.5636444091796875, -1.512054443359375, -1.4604644775390625, -1.40887451171875, -1.3572845458984375, -1.305694580078125, -1.2541046142578125, -1.2025146484375, -1.1509246826171875, -1.099334716796875, -1.0477447509765625, -0.99615478515625, -0.9445648193359375, -0.892974853515625, -0.8413848876953125, -0.789794921875, -0.7382049560546875, -0.686614990234375, -0.6350250244140625, -0.58343505859375, -0.5318450927734375, -0.480255126953125, -0.4286651611328125, -0.3770751953125, -0.3254852294921875, -0.273895263671875, -0.2223052978515625, -0.17071533203125, -0.1191253662109375, -0.067535400390625, -0.0159454345703125, 0.03564453125, 0.0872344970703125, 0.138824462890625, 0.1904144287109375, 0.24200439453125, 0.2935943603515625, 0.345184326171875, 0.3967742919921875, 0.4483642578125, 0.4999542236328125, 0.551544189453125, 0.6031341552734375, 0.65472412109375, 0.7063140869140625, 0.757904052734375, 0.8094940185546875, 0.861083984375, 0.9126739501953125, 0.964263916015625, 1.0158538818359375, 1.06744384765625, 1.1190338134765625, 1.170623779296875, 1.2222137451171875, 1.2738037109375, 1.3253936767578125, 1.376983642578125, 1.4285736083984375, 1.48016357421875, 1.5317535400390625, 1.583343505859375, 1.6349334716796875, 1.6865234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 5.0, 9.0, 14.0, 14.0, 13.0, 14.0, 22.0, 26.0, 23.0, 36.0, 36.0, 32.0, 30.0, 36.0, 41.0, 40.0, 44.0, 40.0, 1069.0, 52.0, 40.0, 48.0, 28.0, 41.0, 30.0, 32.0, 33.0, 28.0, 22.0, 27.0, 20.0, 12.0, 12.0, 10.0, 11.0, 9.0, 6.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0390625, -4.8841552734375, -4.729248046875, -4.5743408203125, -4.41943359375, -4.2645263671875, -4.109619140625, -3.9547119140625, -3.7998046875, -3.6448974609375, -3.489990234375, -3.3350830078125, -3.18017578125, -3.0252685546875, -2.870361328125, -2.7154541015625, -2.560546875, -2.4056396484375, -2.250732421875, -2.0958251953125, -1.94091796875, -1.7860107421875, -1.631103515625, -1.4761962890625, -1.3212890625, -1.1663818359375, -1.011474609375, -0.8565673828125, -0.70166015625, -0.5467529296875, -0.391845703125, -0.2369384765625, -0.08203125, 0.0728759765625, 0.227783203125, 0.3826904296875, 0.53759765625, 0.6925048828125, 0.847412109375, 1.0023193359375, 1.1572265625, 1.3121337890625, 1.467041015625, 1.6219482421875, 1.77685546875, 1.9317626953125, 2.086669921875, 2.2415771484375, 2.396484375, 2.5513916015625, 2.706298828125, 2.8612060546875, 3.01611328125, 3.1710205078125, 3.325927734375, 3.4808349609375, 3.6357421875, 3.7906494140625, 3.945556640625, 4.1004638671875, 4.25537109375, 4.4102783203125, 4.565185546875, 4.7200927734375, 4.875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 10.0, 5.0, 14.0, 19.0, 17.0, 43.0, 56.0, 91.0, 128.0, 208.0, 319.0, 493.0, 712.0, 1211.0, 2047.0, 3523.0, 5876.0, 10409.0, 17870.0, 32775.0, 59742.0, 115996.0, 1401893.0, 232432.0, 96039.0, 50534.0, 27544.0, 15387.0, 8693.0, 5106.0, 3075.0, 1847.0, 1153.0, 689.0, 421.0, 278.0, 167.0, 108.0, 66.0, 45.0, 38.0, 17.0, 14.0, 13.0, 6.0, 3.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.975067138671875, -1.91107177734375, -1.847076416015625, -1.7830810546875, -1.719085693359375, -1.65509033203125, -1.591094970703125, -1.527099609375, -1.463104248046875, -1.39910888671875, -1.335113525390625, -1.2711181640625, -1.207122802734375, -1.14312744140625, -1.079132080078125, -1.01513671875, -0.951141357421875, -0.88714599609375, -0.823150634765625, -0.7591552734375, -0.695159912109375, -0.63116455078125, -0.567169189453125, -0.503173828125, -0.439178466796875, -0.37518310546875, -0.311187744140625, -0.2471923828125, -0.183197021484375, -0.11920166015625, -0.055206298828125, 0.0087890625, 0.072784423828125, 0.13677978515625, 0.200775146484375, 0.2647705078125, 0.328765869140625, 0.39276123046875, 0.456756591796875, 0.520751953125, 0.584747314453125, 0.64874267578125, 0.712738037109375, 0.7767333984375, 0.840728759765625, 0.90472412109375, 0.968719482421875, 1.03271484375, 1.096710205078125, 1.16070556640625, 1.224700927734375, 1.2886962890625, 1.352691650390625, 1.41668701171875, 1.480682373046875, 1.544677734375, 1.608673095703125, 1.67266845703125, 1.736663818359375, 1.8006591796875, 1.864654541015625, 1.92864990234375, 1.992645263671875, 2.056640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 7.0, 3.0, 6.0, 14.0, 10.0, 13.0, 18.0, 20.0, 33.0, 42.0, 62.0, 82.0, 92.0, 94.0, 82.0, 86.0, 87.0, 54.0, 45.0, 34.0, 23.0, 20.0, 17.0, 11.0, 10.0, 3.0, 10.0, 3.0, 1.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0016574859619140625, -0.0016127228736877441, -0.0015679597854614258, -0.0015231966972351074, -0.001478433609008789, -0.0014336705207824707, -0.0013889074325561523, -0.001344144344329834, -0.0012993812561035156, -0.0012546181678771973, -0.001209855079650879, -0.0011650919914245605, -0.0011203289031982422, -0.0010755658149719238, -0.0010308027267456055, -0.0009860396385192871, -0.0009412765502929688, -0.0008965134620666504, -0.000851750373840332, -0.0008069872856140137, -0.0007622241973876953, -0.000717461109161377, -0.0006726980209350586, -0.0006279349327087402, -0.0005831718444824219, -0.0005384087562561035, -0.0004936456680297852, -0.0004488825798034668, -0.00040411949157714844, -0.0003593564033508301, -0.0003145933151245117, -0.00026983022689819336, -0.000225067138671875, -0.00018030405044555664, -0.00013554096221923828, -9.077787399291992e-05, -4.601478576660156e-05, -1.2516975402832031e-06, 4.3511390686035156e-05, 8.827447891235352e-05, 0.00013303756713867188, 0.00017780065536499023, 0.0002225637435913086, 0.00026732683181762695, 0.0003120899200439453, 0.00035685300827026367, 0.00040161609649658203, 0.0004463791847229004, 0.0004911422729492188, 0.0005359053611755371, 0.0005806684494018555, 0.0006254315376281738, 0.0006701946258544922, 0.0007149577140808105, 0.0007597208023071289, 0.0008044838905334473, 0.0008492469787597656, 0.000894010066986084, 0.0009387731552124023, 0.0009835362434387207, 0.001028299331665039, 0.0010730624198913574, 0.0011178255081176758, 0.0011625885963439941, 0.0012073516845703125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 8.0, 10.0, 11.0, 17.0, 28.0, 30.0, 44.0, 71.0, 88.0, 148.0, 221.0, 415.0, 719.0, 2968.0, 1015491.0, 25935.0, 970.0, 485.0, 289.0, 175.0, 106.0, 82.0, 55.0, 35.0, 24.0, 30.0, 17.0, 13.0, 9.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0204010009765625, -0.019664525985717773, -0.018928050994873047, -0.01819157600402832, -0.017455101013183594, -0.016718626022338867, -0.01598215103149414, -0.015245676040649414, -0.014509201049804688, -0.013772726058959961, -0.013036251068115234, -0.012299776077270508, -0.011563301086425781, -0.010826826095581055, -0.010090351104736328, -0.009353876113891602, -0.008617401123046875, -0.007880926132202148, -0.007144451141357422, -0.006407976150512695, -0.005671501159667969, -0.004935026168823242, -0.004198551177978516, -0.003462076187133789, -0.0027256011962890625, -0.001989126205444336, -0.0012526512145996094, -0.0005161762237548828, 0.00022029876708984375, 0.0009567737579345703, 0.0016932487487792969, 0.0024297237396240234, 0.00316619873046875, 0.0039026737213134766, 0.004639148712158203, 0.00537562370300293, 0.006112098693847656, 0.006848573684692383, 0.007585048675537109, 0.008321523666381836, 0.009057998657226562, 0.009794473648071289, 0.010530948638916016, 0.011267423629760742, 0.012003898620605469, 0.012740373611450195, 0.013476848602294922, 0.014213323593139648, 0.014949798583984375, 0.0156862735748291, 0.016422748565673828, 0.017159223556518555, 0.01789569854736328, 0.018632173538208008, 0.019368648529052734, 0.02010512351989746, 0.020841598510742188, 0.021578073501586914, 0.02231454849243164, 0.023051023483276367, 0.023787498474121094, 0.02452397346496582, 0.025260448455810547, 0.025996923446655273, 0.0267333984375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 58.0, 355.0, 466.0, 106.0, 18.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002323971828445792, -0.0022468899842351675, -0.002169807907193899, -0.0020927260629832745, -0.0020156442187726498, -0.0019385621417313814, -0.0018614802975207567, -0.0017843983368948102, -0.0017073163762688637, -0.0016302344156429172, -0.0015531524550169706, -0.001476070610806346, -0.0013989886501803994, -0.001321906689554453, -0.0012448248453438282, -0.0011677428847178817, -0.0010906609240919352, -0.0010135789634659886, -0.000936497061047703, -0.0008594151586294174, -0.0007823331980034709, -0.0007052512373775244, -0.0006281693349592388, -0.0005510874325409532, -0.00047400547191500664, -0.00039692354039289057, -0.0003198416088707745, -0.00024275967734865844, -0.00016567774582654238, -8.859581430442631e-05, -1.1513882782310247e-05, 6.556801963597536e-05, 0.00014264998026192188, 0.00021973191178403795, 0.000296813843306154, 0.0003738957748282701, 0.00045097770635038614, 0.0005280596669763327, 0.0006051415693946183, 0.0006822234718129039, 0.0007593054324388504, 0.0008363873930647969, 0.0009134692954830825, 0.0009905511979013681, 0.0010676331585273147, 0.0011447151191532612, 0.0012217969633638859, 0.0012988789239898324, 0.001375960884615779, 0.0014530428452417254, 0.001530124805867672, 0.0016072066500782967, 0.0016842886107042432, 0.0017613705713301897, 0.0018384524155408144, 0.001915534376166761, 0.0019926163367927074, 0.002069698181003332, 0.0021467802580446005, 0.002223862102255225, 0.0023009441792964935, 0.0023780260235071182, 0.002455107867717743, 0.0025321897119283676, 0.002609271788969636]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 4.0, 7.0, 8.0, 13.0, 7.0, 11.0, 13.0, 16.0, 22.0, 20.0, 23.0, 17.0, 20.0, 32.0, 18.0, 23.0, 23.0, 37.0, 39.0, 36.0, 34.0, 45.0, 35.0, 24.0, 42.0, 35.0, 43.0, 22.0, 25.0, 28.0, 29.0, 25.0, 28.0, 25.0, 24.0, 16.0, 21.0, 14.0, 9.0, 11.0, 12.0, 19.0, 9.0, 7.0, 2.0, 3.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0], "bins": [-0.0005110502243041992, -0.0004959879443049431, -0.00048092566430568695, -0.0004658633843064308, -0.0004508011043071747, -0.00043573882430791855, -0.0004206765443086624, -0.0004056142643094063, -0.00039055198431015015, -0.000375489704310894, -0.0003604274243116379, -0.00034536514431238174, -0.0003303028643131256, -0.0003152405843138695, -0.00030017830431461334, -0.0002851160243153572, -0.0002700537443161011, -0.00025499146431684494, -0.0002399291843175888, -0.00022486690431833267, -0.00020980462431907654, -0.0001947423443198204, -0.00017968006432056427, -0.00016461778432130814, -0.000149555504322052, -0.00013449322432279587, -0.00011943094432353973, -0.0001043686643242836, -8.930638432502747e-05, -7.424410432577133e-05, -5.91818243265152e-05, -4.4119544327259064e-05, -2.905726432800293e-05, -1.3994984328746796e-05, 1.0672956705093384e-06, 1.6129575669765472e-05, 3.1191855669021606e-05, 4.625413566827774e-05, 6.131641566753387e-05, 7.637869566679001e-05, 9.144097566604614e-05, 0.00010650325566530228, 0.00012156553566455841, 0.00013662781566381454, 0.00015169009566307068, 0.0001667523756623268, 0.00018181465566158295, 0.00019687693566083908, 0.00021193921566009521, 0.00022700149565935135, 0.00024206377565860748, 0.0002571260556578636, 0.00027218833565711975, 0.0002872506156563759, 0.000302312895655632, 0.00031737517565488815, 0.0003324374556541443, 0.0003474997356534004, 0.00036256201565265656, 0.0003776242956519127, 0.0003926865756511688, 0.00040774885565042496, 0.0004228111356496811, 0.0004378734156489372, 0.00045293569564819336]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 13.0, 19.0, 4.0, 10.0, 19.0, 19.0, 25.0, 33.0, 25.0, 27.0, 27.0, 34.0, 38.0, 42.0, 40.0, 42.0, 42.0, 46.0, 40.0, 48.0, 51.0, 31.0, 38.0, 33.0, 36.0, 17.0, 31.0, 15.0, 23.0, 22.0, 18.0, 16.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.62225341796875, -6.3890380859375, -6.15582275390625, -5.922607421875, -5.68939208984375, -5.4561767578125, -5.22296142578125, -4.98974609375, -4.75653076171875, -4.5233154296875, -4.29010009765625, -4.056884765625, -3.82366943359375, -3.5904541015625, -3.35723876953125, -3.1240234375, -2.89080810546875, -2.6575927734375, -2.42437744140625, -2.191162109375, -1.95794677734375, -1.7247314453125, -1.49151611328125, -1.25830078125, -1.02508544921875, -0.7918701171875, -0.55865478515625, -0.325439453125, -0.09222412109375, 0.1409912109375, 0.37420654296875, 0.607421875, 0.84063720703125, 1.0738525390625, 1.30706787109375, 1.540283203125, 1.77349853515625, 2.0067138671875, 2.23992919921875, 2.47314453125, 2.70635986328125, 2.9395751953125, 3.17279052734375, 3.406005859375, 3.63922119140625, 3.8724365234375, 4.10565185546875, 4.3388671875, 4.57208251953125, 4.8052978515625, 5.03851318359375, 5.271728515625, 5.50494384765625, 5.7381591796875, 5.97137451171875, 6.20458984375, 6.43780517578125, 6.6710205078125, 6.90423583984375, 7.137451171875, 7.37066650390625, 7.6038818359375, 7.83709716796875, 8.0703125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 11.0, 9.0, 20.0, 17.0, 21.0, 34.0, 38.0, 69.0, 79.0, 99.0, 134.0, 160.0, 237.0, 339.0, 443.0, 547.0, 791.0, 1021.0, 1482.0, 2707.0, 9650.0, 79444.0, 495377.0, 387555.0, 53669.0, 7099.0, 2218.0, 1405.0, 963.0, 764.0, 536.0, 418.0, 318.0, 194.0, 179.0, 119.0, 107.0, 88.0, 48.0, 38.0, 24.0, 25.0, 13.0, 15.0, 8.0, 6.0, 9.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.8359375, -13.3883056640625, -12.940673828125, -12.4930419921875, -12.04541015625, -11.5977783203125, -11.150146484375, -10.7025146484375, -10.2548828125, -9.8072509765625, -9.359619140625, -8.9119873046875, -8.46435546875, -8.0167236328125, -7.569091796875, -7.1214599609375, -6.673828125, -6.2261962890625, -5.778564453125, -5.3309326171875, -4.88330078125, -4.4356689453125, -3.988037109375, -3.5404052734375, -3.0927734375, -2.6451416015625, -2.197509765625, -1.7498779296875, -1.30224609375, -0.8546142578125, -0.406982421875, 0.0406494140625, 0.48828125, 0.9359130859375, 1.383544921875, 1.8311767578125, 2.27880859375, 2.7264404296875, 3.174072265625, 3.6217041015625, 4.0693359375, 4.5169677734375, 4.964599609375, 5.4122314453125, 5.85986328125, 6.3074951171875, 6.755126953125, 7.2027587890625, 7.650390625, 8.0980224609375, 8.545654296875, 8.9932861328125, 9.44091796875, 9.8885498046875, 10.336181640625, 10.7838134765625, 11.2314453125, 11.6790771484375, 12.126708984375, 12.5743408203125, 13.02197265625, 13.4696044921875, 13.917236328125, 14.3648681640625, 14.8125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 12.0, 14.0, 15.0, 19.0, 25.0, 45.0, 43.0, 65.0, 77.0, 99.0, 215.0, 1678.0, 276.0, 124.0, 70.0, 54.0, 41.0, 57.0, 37.0, 20.0, 21.0, 6.0, 11.0, 6.0, 10.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.578125, -28.612060546875, -27.64599609375, -26.679931640625, -25.7138671875, -24.747802734375, -23.78173828125, -22.815673828125, -21.849609375, -20.883544921875, -19.91748046875, -18.951416015625, -17.9853515625, -17.019287109375, -16.05322265625, -15.087158203125, -14.12109375, -13.155029296875, -12.18896484375, -11.222900390625, -10.2568359375, -9.290771484375, -8.32470703125, -7.358642578125, -6.392578125, -5.426513671875, -4.46044921875, -3.494384765625, -2.5283203125, -1.562255859375, -0.59619140625, 0.369873046875, 1.3359375, 2.302001953125, 3.26806640625, 4.234130859375, 5.2001953125, 6.166259765625, 7.13232421875, 8.098388671875, 9.064453125, 10.030517578125, 10.99658203125, 11.962646484375, 12.9287109375, 13.894775390625, 14.86083984375, 15.826904296875, 16.79296875, 17.759033203125, 18.72509765625, 19.691162109375, 20.6572265625, 21.623291015625, 22.58935546875, 23.555419921875, 24.521484375, 25.487548828125, 26.45361328125, 27.419677734375, 28.3857421875, 29.351806640625, 30.31787109375, 31.283935546875, 32.25]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 10.0, 5.0, 5.0, 7.0, 17.0, 12.0, 18.0, 23.0, 27.0, 47.0, 62.0, 78.0, 122.0, 187.0, 295.0, 499.0, 913.0, 2354.0, 2840822.0, 296095.0, 1937.0, 843.0, 467.0, 281.0, 159.0, 120.0, 70.0, 62.0, 34.0, 30.0, 24.0, 17.0, 14.0, 15.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.6875, -73.31640625, -70.9453125, -68.57421875, -66.203125, -63.83203125, -61.4609375, -59.08984375, -56.71875, -54.34765625, -51.9765625, -49.60546875, -47.234375, -44.86328125, -42.4921875, -40.12109375, -37.75, -35.37890625, -33.0078125, -30.63671875, -28.265625, -25.89453125, -23.5234375, -21.15234375, -18.78125, -16.41015625, -14.0390625, -11.66796875, -9.296875, -6.92578125, -4.5546875, -2.18359375, 0.1875, 2.55859375, 4.9296875, 7.30078125, 9.671875, 12.04296875, 14.4140625, 16.78515625, 19.15625, 21.52734375, 23.8984375, 26.26953125, 28.640625, 31.01171875, 33.3828125, 35.75390625, 38.125, 40.49609375, 42.8671875, 45.23828125, 47.609375, 49.98046875, 52.3515625, 54.72265625, 57.09375, 59.46484375, 61.8359375, 64.20703125, 66.578125, 68.94921875, 71.3203125, 73.69140625, 76.0625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 95.0, 654.0, 237.0, 19.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.23116302490234, -74.19345092773438, -69.15573120117188, -64.1180191040039, -59.080299377441406, -54.04258728027344, -49.0048713684082, -43.96715545654297, -38.929439544677734, -33.8917236328125, -28.854007720947266, -23.816293716430664, -18.77857780456543, -13.740861892700195, -8.703147888183594, -3.6654319763183594, 1.372283935546875, 6.409999370574951, 11.447714805603027, 16.485429763793945, 21.52314567565918, 26.560861587524414, 31.598575592041016, 36.63629150390625, 41.674007415771484, 46.71172332763672, 51.74943923950195, 56.78715515136719, 61.824867248535156, 66.86258697509766, 71.90029907226562, 76.93801879882812, 81.97572326660156, 87.01343536376953, 92.05115509033203, 97.0888671875, 102.1265869140625, 107.16429901123047, 112.20201110839844, 117.23973083496094, 122.27745056152344, 127.3151626586914, 132.35287475585938, 137.39059448242188, 142.42831420898438, 147.46603393554688, 152.5037384033203, 157.5414581298828, 162.57916259765625, 167.61688232421875, 172.6545867919922, 177.6923065185547, 182.7300262451172, 187.7677459716797, 192.80545043945312, 197.84317016601562, 202.88088989257812, 207.91860961914062, 212.95631408691406, 217.99403381347656, 223.03175354003906, 228.06947326660156, 233.107177734375, 238.1448974609375, 243.1826171875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 9.0, 5.0, 9.0, 5.0, 9.0, 10.0, 19.0, 18.0, 15.0, 24.0, 23.0, 28.0, 29.0, 27.0, 31.0, 39.0, 33.0, 41.0, 52.0, 37.0, 42.0, 34.0, 50.0, 44.0, 28.0, 48.0, 44.0, 34.0, 33.0, 28.0, 31.0, 22.0, 22.0, 16.0, 14.0, 13.0, 10.0, 7.0, 4.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.58242416381836, -58.814056396484375, -57.045684814453125, -55.277313232421875, -53.50894546508789, -51.740577697753906, -49.972206115722656, -48.203834533691406, -46.43546676635742, -44.66709899902344, -42.89872741699219, -41.13035583496094, -39.36198806762695, -37.59362030029297, -35.82524871826172, -34.05687713623047, -32.288509368896484, -30.520139694213867, -28.75177001953125, -26.983400344848633, -25.215030670166016, -23.4466609954834, -21.67829132080078, -19.909921646118164, -18.141551971435547, -16.37318229675293, -14.604812622070312, -12.836442947387695, -11.068073272705078, -9.299703598022461, -7.531333923339844, -5.762964248657227, -3.9945945739746094, -2.226224899291992, -0.457855224609375, 1.3105144500732422, 3.0788841247558594, 4.847253799438477, 6.615623474121094, 8.383993148803711, 10.152362823486328, 11.920732498168945, 13.689102172851562, 15.45747184753418, 17.225841522216797, 18.994211196899414, 20.76258087158203, 22.53095054626465, 24.299320220947266, 26.067689895629883, 27.8360595703125, 29.604429244995117, 31.372798919677734, 33.14116668701172, 34.90953826904297, 36.67790985107422, 38.4462776184082, 40.21464538574219, 41.98301696777344, 43.75138854980469, 45.51975631713867, 47.288124084472656, 49.056495666503906, 50.824867248535156, 52.59323501586914]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 11.0, 21.0, 18.0, 18.0, 23.0, 27.0, 26.0, 24.0, 29.0, 37.0, 34.0, 51.0, 36.0, 44.0, 44.0, 55.0, 46.0, 35.0, 41.0, 27.0, 29.0, 35.0, 32.0, 36.0, 34.0, 27.0, 15.0, 16.0, 20.0, 17.0, 12.0, 9.0, 7.0, 14.0, 5.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.1199951171875, -6.880615234375, -6.6412353515625, -6.40185546875, -6.1624755859375, -5.923095703125, -5.6837158203125, -5.4443359375, -5.2049560546875, -4.965576171875, -4.7261962890625, -4.48681640625, -4.2474365234375, -4.008056640625, -3.7686767578125, -3.529296875, -3.2899169921875, -3.050537109375, -2.8111572265625, -2.57177734375, -2.3323974609375, -2.093017578125, -1.8536376953125, -1.6142578125, -1.3748779296875, -1.135498046875, -0.8961181640625, -0.65673828125, -0.4173583984375, -0.177978515625, 0.0614013671875, 0.30078125, 0.5401611328125, 0.779541015625, 1.0189208984375, 1.25830078125, 1.4976806640625, 1.737060546875, 1.9764404296875, 2.2158203125, 2.4552001953125, 2.694580078125, 2.9339599609375, 3.17333984375, 3.4127197265625, 3.652099609375, 3.8914794921875, 4.130859375, 4.3702392578125, 4.609619140625, 4.8489990234375, 5.08837890625, 5.3277587890625, 5.567138671875, 5.8065185546875, 6.0458984375, 6.2852783203125, 6.524658203125, 6.7640380859375, 7.00341796875, 7.2427978515625, 7.482177734375, 7.7215576171875, 7.9609375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 10.0, 10.0, 16.0, 19.0, 27.0, 24.0, 38.0, 44.0, 64.0, 81.0, 126.0, 185.0, 237.0, 480.0, 961.0, 2737.0, 8995.0, 52942.0, 521239.0, 2295847.0, 1154549.0, 131523.0, 16741.0, 4173.0, 1468.0, 673.0, 325.0, 201.0, 134.0, 96.0, 77.0, 50.0, 46.0, 27.0, 31.0, 21.0, 12.0, 13.0, 10.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-14.8359375, -14.42041015625, -14.0048828125, -13.58935546875, -13.173828125, -12.75830078125, -12.3427734375, -11.92724609375, -11.51171875, -11.09619140625, -10.6806640625, -10.26513671875, -9.849609375, -9.43408203125, -9.0185546875, -8.60302734375, -8.1875, -7.77197265625, -7.3564453125, -6.94091796875, -6.525390625, -6.10986328125, -5.6943359375, -5.27880859375, -4.86328125, -4.44775390625, -4.0322265625, -3.61669921875, -3.201171875, -2.78564453125, -2.3701171875, -1.95458984375, -1.5390625, -1.12353515625, -0.7080078125, -0.29248046875, 0.123046875, 0.53857421875, 0.9541015625, 1.36962890625, 1.78515625, 2.20068359375, 2.6162109375, 3.03173828125, 3.447265625, 3.86279296875, 4.2783203125, 4.69384765625, 5.109375, 5.52490234375, 5.9404296875, 6.35595703125, 6.771484375, 7.18701171875, 7.6025390625, 8.01806640625, 8.43359375, 8.84912109375, 9.2646484375, 9.68017578125, 10.095703125, 10.51123046875, 10.9267578125, 11.34228515625, 11.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 5.0, 7.0, 16.0, 27.0, 32.0, 58.0, 99.0, 112.0, 202.0, 345.0, 564.0, 808.0, 606.0, 431.0, 267.0, 164.0, 109.0, 79.0, 48.0, 31.0, 23.0, 14.0, 11.0, 7.0, 0.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.828125, -16.220703125, -15.61328125, -15.005859375, -14.3984375, -13.791015625, -13.18359375, -12.576171875, -11.96875, -11.361328125, -10.75390625, -10.146484375, -9.5390625, -8.931640625, -8.32421875, -7.716796875, -7.109375, -6.501953125, -5.89453125, -5.287109375, -4.6796875, -4.072265625, -3.46484375, -2.857421875, -2.25, -1.642578125, -1.03515625, -0.427734375, 0.1796875, 0.787109375, 1.39453125, 2.001953125, 2.609375, 3.216796875, 3.82421875, 4.431640625, 5.0390625, 5.646484375, 6.25390625, 6.861328125, 7.46875, 8.076171875, 8.68359375, 9.291015625, 9.8984375, 10.505859375, 11.11328125, 11.720703125, 12.328125, 12.935546875, 13.54296875, 14.150390625, 14.7578125, 15.365234375, 15.97265625, 16.580078125, 17.1875, 17.794921875, 18.40234375, 19.009765625, 19.6171875, 20.224609375, 20.83203125, 21.439453125, 22.046875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 16.0, 15.0, 34.0, 48.0, 88.0, 139.0, 248.0, 482.0, 1093.0, 3090.0, 25981.0, 3166873.0, 979806.0, 12284.0, 2301.0, 876.0, 404.0, 189.0, 135.0, 57.0, 40.0, 21.0, 21.0, 2.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -35.84716796875, -34.7568359375, -33.66650390625, -32.576171875, -31.48583984375, -30.3955078125, -29.30517578125, -28.21484375, -27.12451171875, -26.0341796875, -24.94384765625, -23.853515625, -22.76318359375, -21.6728515625, -20.58251953125, -19.4921875, -18.40185546875, -17.3115234375, -16.22119140625, -15.130859375, -14.04052734375, -12.9501953125, -11.85986328125, -10.76953125, -9.67919921875, -8.5888671875, -7.49853515625, -6.408203125, -5.31787109375, -4.2275390625, -3.13720703125, -2.046875, -0.95654296875, 0.1337890625, 1.22412109375, 2.314453125, 3.40478515625, 4.4951171875, 5.58544921875, 6.67578125, 7.76611328125, 8.8564453125, 9.94677734375, 11.037109375, 12.12744140625, 13.2177734375, 14.30810546875, 15.3984375, 16.48876953125, 17.5791015625, 18.66943359375, 19.759765625, 20.85009765625, 21.9404296875, 23.03076171875, 24.12109375, 25.21142578125, 26.3017578125, 27.39208984375, 28.482421875, 29.57275390625, 30.6630859375, 31.75341796875, 32.84375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 30.0, 610.0, 367.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.8099670410156, -322.9875793457031, -312.1651916503906, -301.3428039550781, -290.5204162597656, -279.6980285644531, -268.8756103515625, -258.05322265625, -247.23085021972656, -236.40846252441406, -225.58607482910156, -214.763671875, -203.9412841796875, -193.118896484375, -182.2965087890625, -171.47412109375, -160.6517333984375, -149.829345703125, -139.0069580078125, -128.1845703125, -117.36217498779297, -106.53978729248047, -95.71739196777344, -84.89500427246094, -74.07261657714844, -63.25022888183594, -52.42783737182617, -41.605445861816406, -30.783058166503906, -19.960670471191406, -9.138275146484375, 1.684112548828125, 12.50653076171875, 23.328920364379883, 34.151309967041016, 44.97370147705078, 55.79608917236328, 66.61847686767578, 77.44087219238281, 88.26325988769531, 99.08564758300781, 109.90803527832031, 120.73042297363281, 131.55282592773438, 142.37521362304688, 153.19760131835938, 164.01998901367188, 174.84237670898438, 185.66476440429688, 196.48715209960938, 207.30953979492188, 218.13192749023438, 228.95431518554688, 239.77670288085938, 250.59910583496094, 261.4215087890625, 272.243896484375, 283.0662841796875, 293.888671875, 304.7110595703125, 315.533447265625, 326.3558349609375, 337.17822265625, 348.0006103515625, 358.822998046875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 8.0, 8.0, 6.0, 13.0, 11.0, 12.0, 17.0, 31.0, 25.0, 16.0, 26.0, 31.0, 41.0, 33.0, 36.0, 34.0, 31.0, 35.0, 41.0, 42.0, 38.0, 31.0, 28.0, 41.0, 27.0, 44.0, 25.0, 29.0, 29.0, 25.0, 25.0, 16.0, 24.0, 25.0, 18.0, 13.0, 10.0, 9.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-46.265296936035156, -44.86012268066406, -43.45494842529297, -42.049774169921875, -40.64459991455078, -39.23942565917969, -37.834251403808594, -36.4290771484375, -35.023902893066406, -33.61872863769531, -32.21355438232422, -30.808380126953125, -29.40320587158203, -27.998031616210938, -26.592859268188477, -25.187685012817383, -23.782512664794922, -22.377338409423828, -20.972164154052734, -19.56698989868164, -18.161815643310547, -16.756641387939453, -15.351469039916992, -13.946294784545898, -12.541120529174805, -11.135946273803711, -9.730772018432617, -8.32559871673584, -6.920424461364746, -5.515250205993652, -4.110076904296875, -2.7049026489257812, -1.2997283935546875, 0.10544562339782715, 1.5106196403503418, 2.9157934188842773, 4.320967674255371, 5.726141929626465, 7.131315231323242, 8.536489486694336, 9.94166374206543, 11.346837997436523, 12.752012252807617, 14.157185554504395, 15.562359809875488, 16.967533111572266, 18.37270736694336, 19.777881622314453, 21.183055877685547, 22.58823013305664, 23.993404388427734, 25.398578643798828, 26.803752899169922, 28.208927154541016, 29.614099502563477, 31.01927375793457, 32.42444610595703, 33.829620361328125, 35.23479461669922, 36.63996887207031, 38.045143127441406, 39.4503173828125, 40.855491638183594, 42.26066589355469, 43.66584014892578]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 11.0, 10.0, 12.0, 15.0, 17.0, 23.0, 22.0, 31.0, 30.0, 33.0, 44.0, 42.0, 45.0, 44.0, 44.0, 56.0, 49.0, 59.0, 48.0, 44.0, 46.0, 41.0, 34.0, 40.0, 26.0, 15.0, 18.0, 12.0, 13.0, 15.0, 10.0, 9.0, 7.0, 9.0, 5.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.22357177734375, -5.0213623046875, -4.81915283203125, -4.616943359375, -4.41473388671875, -4.2125244140625, -4.01031494140625, -3.80810546875, -3.60589599609375, -3.4036865234375, -3.20147705078125, -2.999267578125, -2.79705810546875, -2.5948486328125, -2.39263916015625, -2.1904296875, -1.98822021484375, -1.7860107421875, -1.58380126953125, -1.381591796875, -1.17938232421875, -0.9771728515625, -0.77496337890625, -0.57275390625, -0.37054443359375, -0.1683349609375, 0.03387451171875, 0.236083984375, 0.43829345703125, 0.6405029296875, 0.84271240234375, 1.044921875, 1.24713134765625, 1.4493408203125, 1.65155029296875, 1.853759765625, 2.05596923828125, 2.2581787109375, 2.46038818359375, 2.66259765625, 2.86480712890625, 3.0670166015625, 3.26922607421875, 3.471435546875, 3.67364501953125, 3.8758544921875, 4.07806396484375, 4.2802734375, 4.48248291015625, 4.6846923828125, 4.88690185546875, 5.089111328125, 5.29132080078125, 5.4935302734375, 5.69573974609375, 5.89794921875, 6.10015869140625, 6.3023681640625, 6.50457763671875, 6.706787109375, 6.90899658203125, 7.1112060546875, 7.31341552734375, 7.515625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 10.0, 16.0, 24.0, 39.0, 74.0, 78.0, 142.0, 211.0, 318.0, 539.0, 870.0, 1437.0, 2376.0, 3834.0, 6543.0, 10928.0, 19413.0, 36398.0, 72842.0, 165582.0, 423366.0, 154485.0, 68827.0, 34860.0, 18853.0, 10633.0, 6172.0, 3721.0, 2250.0, 1426.0, 833.0, 537.0, 342.0, 216.0, 126.0, 72.0, 57.0, 31.0, 15.0, 13.0, 21.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4718017578125, -1.418212890625, -1.3646240234375, -1.31103515625, -1.2574462890625, -1.203857421875, -1.1502685546875, -1.0966796875, -1.0430908203125, -0.989501953125, -0.9359130859375, -0.88232421875, -0.8287353515625, -0.775146484375, -0.7215576171875, -0.66796875, -0.6143798828125, -0.560791015625, -0.5072021484375, -0.45361328125, -0.4000244140625, -0.346435546875, -0.2928466796875, -0.2392578125, -0.1856689453125, -0.132080078125, -0.0784912109375, -0.02490234375, 0.0286865234375, 0.082275390625, 0.1358642578125, 0.189453125, 0.2430419921875, 0.296630859375, 0.3502197265625, 0.40380859375, 0.4573974609375, 0.510986328125, 0.5645751953125, 0.6181640625, 0.6717529296875, 0.725341796875, 0.7789306640625, 0.83251953125, 0.8861083984375, 0.939697265625, 0.9932861328125, 1.046875, 1.1004638671875, 1.154052734375, 1.2076416015625, 1.26123046875, 1.3148193359375, 1.368408203125, 1.4219970703125, 1.4755859375, 1.5291748046875, 1.582763671875, 1.6363525390625, 1.68994140625, 1.7435302734375, 1.797119140625, 1.8507080078125, 1.904296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 2.0, 13.0, 5.0, 4.0, 11.0, 6.0, 15.0, 17.0, 19.0, 18.0, 17.0, 34.0, 31.0, 34.0, 37.0, 34.0, 44.0, 49.0, 42.0, 42.0, 42.0, 1061.0, 31.0, 42.0, 30.0, 54.0, 43.0, 31.0, 31.0, 25.0, 17.0, 23.0, 13.0, 20.0, 17.0, 13.0, 14.0, 9.0, 9.0, 12.0, 5.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.50115966796875, -3.3851318359375, -3.26910400390625, -3.153076171875, -3.03704833984375, -2.9210205078125, -2.80499267578125, -2.68896484375, -2.57293701171875, -2.4569091796875, -2.34088134765625, -2.224853515625, -2.10882568359375, -1.9927978515625, -1.87677001953125, -1.7607421875, -1.64471435546875, -1.5286865234375, -1.41265869140625, -1.296630859375, -1.18060302734375, -1.0645751953125, -0.94854736328125, -0.83251953125, -0.71649169921875, -0.6004638671875, -0.48443603515625, -0.368408203125, -0.25238037109375, -0.1363525390625, -0.02032470703125, 0.095703125, 0.21173095703125, 0.3277587890625, 0.44378662109375, 0.559814453125, 0.67584228515625, 0.7918701171875, 0.90789794921875, 1.02392578125, 1.13995361328125, 1.2559814453125, 1.37200927734375, 1.488037109375, 1.60406494140625, 1.7200927734375, 1.83612060546875, 1.9521484375, 2.06817626953125, 2.1842041015625, 2.30023193359375, 2.416259765625, 2.53228759765625, 2.6483154296875, 2.76434326171875, 2.88037109375, 2.99639892578125, 3.1124267578125, 3.22845458984375, 3.344482421875, 3.46051025390625, 3.5765380859375, 3.69256591796875, 3.80859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 9.0, 11.0, 23.0, 25.0, 33.0, 81.0, 94.0, 164.0, 300.0, 455.0, 707.0, 1186.0, 1922.0, 2920.0, 4900.0, 8128.0, 13890.0, 23675.0, 42735.0, 80268.0, 172447.0, 1424108.0, 152520.0, 73234.0, 38932.0, 21746.0, 12840.0, 7858.0, 4571.0, 2841.0, 1690.0, 1009.0, 606.0, 397.0, 271.0, 181.0, 117.0, 84.0, 46.0, 35.0, 19.0, 27.0, 12.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.58984375, -1.5422821044921875, -1.494720458984375, -1.4471588134765625, -1.39959716796875, -1.3520355224609375, -1.304473876953125, -1.2569122314453125, -1.2093505859375, -1.1617889404296875, -1.114227294921875, -1.0666656494140625, -1.01910400390625, -0.9715423583984375, -0.923980712890625, -0.8764190673828125, -0.828857421875, -0.7812957763671875, -0.733734130859375, -0.6861724853515625, -0.63861083984375, -0.5910491943359375, -0.543487548828125, -0.4959259033203125, -0.4483642578125, -0.4008026123046875, -0.353240966796875, -0.3056793212890625, -0.25811767578125, -0.2105560302734375, -0.162994384765625, -0.1154327392578125, -0.06787109375, -0.0203094482421875, 0.027252197265625, 0.0748138427734375, 0.12237548828125, 0.1699371337890625, 0.217498779296875, 0.2650604248046875, 0.3126220703125, 0.3601837158203125, 0.407745361328125, 0.4553070068359375, 0.50286865234375, 0.5504302978515625, 0.597991943359375, 0.6455535888671875, 0.693115234375, 0.7406768798828125, 0.788238525390625, 0.8358001708984375, 0.88336181640625, 0.9309234619140625, 0.978485107421875, 1.0260467529296875, 1.0736083984375, 1.1211700439453125, 1.168731689453125, 1.2162933349609375, 1.26385498046875, 1.3114166259765625, 1.358978271484375, 1.4065399169921875, 1.4541015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 11.0, 12.0, 20.0, 18.0, 26.0, 26.0, 45.0, 69.0, 99.0, 115.0, 133.0, 107.0, 76.0, 50.0, 38.0, 24.0, 20.0, 19.0, 16.0, 8.0, 7.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001506805419921875, -0.0014551132917404175, -0.00140342116355896, -0.0013517290353775024, -0.001300036907196045, -0.0012483447790145874, -0.0011966526508331299, -0.0011449605226516724, -0.0010932683944702148, -0.0010415762662887573, -0.0009898841381072998, -0.0009381920099258423, -0.0008864998817443848, -0.0008348077535629272, -0.0007831156253814697, -0.0007314234972000122, -0.0006797313690185547, -0.0006280392408370972, -0.0005763471126556396, -0.0005246549844741821, -0.0004729628562927246, -0.0004212707281112671, -0.00036957859992980957, -0.00031788647174835205, -0.00026619434356689453, -0.000214502215385437, -0.0001628100872039795, -0.00011111795902252197, -5.942583084106445e-05, -7.733702659606934e-06, 4.3958425521850586e-05, 9.56505537033081e-05, 0.00014734268188476562, 0.00019903481006622314, 0.00025072693824768066, 0.0003024190664291382, 0.0003541111946105957, 0.0004058033227920532, 0.00045749545097351074, 0.0005091875791549683, 0.0005608797073364258, 0.0006125718355178833, 0.0006642639636993408, 0.0007159560918807983, 0.0007676482200622559, 0.0008193403482437134, 0.0008710324764251709, 0.0009227246046066284, 0.0009744167327880859, 0.0010261088609695435, 0.001077800989151001, 0.0011294931173324585, 0.001181185245513916, 0.0012328773736953735, 0.001284569501876831, 0.0013362616300582886, 0.001387953758239746, 0.0014396458864212036, 0.0014913380146026611, 0.0015430301427841187, 0.0015947222709655762, 0.0016464143991470337, 0.0016981065273284912, 0.0017497986555099487, 0.0018014907836914062]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 3.0, 4.0, 7.0, 10.0, 11.0, 20.0, 24.0, 23.0, 34.0, 35.0, 76.0, 92.0, 144.0, 256.0, 502.0, 1432.0, 1024169.0, 19978.0, 784.0, 347.0, 201.0, 108.0, 72.0, 52.0, 34.0, 33.0, 25.0, 13.0, 16.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.035125732421875, -0.03411531448364258, -0.033104896545410156, -0.032094478607177734, -0.031084060668945312, -0.03007364273071289, -0.02906322479248047, -0.028052806854248047, -0.027042388916015625, -0.026031970977783203, -0.02502155303955078, -0.02401113510131836, -0.023000717163085938, -0.021990299224853516, -0.020979881286621094, -0.019969463348388672, -0.01895904541015625, -0.017948627471923828, -0.016938209533691406, -0.015927791595458984, -0.014917373657226562, -0.01390695571899414, -0.012896537780761719, -0.011886119842529297, -0.010875701904296875, -0.009865283966064453, -0.008854866027832031, -0.00784444808959961, -0.0068340301513671875, -0.005823612213134766, -0.004813194274902344, -0.003802776336669922, -0.0027923583984375, -0.0017819404602050781, -0.0007715225219726562, 0.00023889541625976562, 0.0012493133544921875, 0.0022597312927246094, 0.0032701492309570312, 0.004280567169189453, 0.005290985107421875, 0.006301403045654297, 0.007311820983886719, 0.00832223892211914, 0.009332656860351562, 0.010343074798583984, 0.011353492736816406, 0.012363910675048828, 0.01337432861328125, 0.014384746551513672, 0.015395164489746094, 0.016405582427978516, 0.017416000366210938, 0.01842641830444336, 0.01943683624267578, 0.020447254180908203, 0.021457672119140625, 0.022468090057373047, 0.02347850799560547, 0.02448892593383789, 0.025499343872070312, 0.026509761810302734, 0.027520179748535156, 0.028530597686767578, 0.029541015625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 12.0, 24.0, 94.0, 266.0, 334.0, 194.0, 59.0, 16.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007651117048226297, -0.0007182001136243343, -0.000671288522426039, -0.0006243769312277436, -0.0005774653982371092, -0.0005305537488311529, -0.0004836422158405185, -0.0004367306246422231, -0.00038981903344392776, -0.0003429074422456324, -0.00029599585104733706, -0.00024908428895287216, -0.0002021726977545768, -0.00015526110655628145, -0.00010834954446181655, -6.14379532635212e-05, -1.452636206522584e-05, 3.23852218571119e-05, 7.929680577944964e-05, 0.00012620838242582977, 0.00017311997362412512, 0.00022003156482242048, 0.0002669431269168854, 0.00031385471811518073, 0.0003607663093134761, 0.00040767790051177144, 0.0004545894917100668, 0.0005015010247007012, 0.0005484126741066575, 0.000595324207097292, 0.0006422357982955873, 0.0006891473894938827, 0.0007360589224845171, 0.0007829705136828125, 0.0008298821048811078, 0.0008767936378717422, 0.0009237052872776985, 0.000970616820268333, 0.0010175283532589674, 0.0010644400026649237, 0.00111135165207088, 0.0011582631850615144, 0.0012051748344674706, 0.001252086367458105, 0.0012989980168640614, 0.0013459095498546958, 0.0013928210828453302, 0.0014397327322512865, 0.001486644265241921, 0.0015335557982325554, 0.0015804674476385117, 0.001627378980629146, 0.0016742906300351024, 0.0017212021630257368, 0.001768113812431693, 0.0018150253454223275, 0.001861936878412962, 0.0019088484114035964, 0.001955759944394231, 0.002002671593800187, 0.0020495832432061434, 0.0020964948926120996, 0.0021434063091874123, 0.0021903179585933685, 0.002237229607999325]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 11.0, 9.0, 13.0, 20.0, 12.0, 24.0, 22.0, 41.0, 34.0, 43.0, 36.0, 43.0, 39.0, 48.0, 46.0, 56.0, 39.0, 45.0, 43.0, 42.0, 27.0, 45.0, 35.0, 35.0, 26.0, 27.0, 17.0, 21.0, 14.0, 14.0, 10.0, 11.0, 7.0, 6.0, 10.0, 5.0, 0.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006845593452453613, -0.0006617233157157898, -0.0006388872861862183, -0.0006160512566566467, -0.0005932152271270752, -0.0005703791975975037, -0.0005475431680679321, -0.0005247071385383606, -0.0005018711090087891, -0.00047903507947921753, -0.000456199049949646, -0.00043336302042007446, -0.00041052699089050293, -0.0003876909613609314, -0.00036485493183135986, -0.00034201890230178833, -0.0003191828727722168, -0.00029634684324264526, -0.00027351081371307373, -0.0002506747841835022, -0.00022783875465393066, -0.00020500272512435913, -0.0001821666955947876, -0.00015933066606521606, -0.00013649463653564453, -0.000113658607006073, -9.082257747650146e-05, -6.798654794692993e-05, -4.51505184173584e-05, -2.2314488887786865e-05, 5.21540641784668e-07, 2.33575701713562e-05, 4.6193599700927734e-05, 6.902962923049927e-05, 9.18656587600708e-05, 0.00011470168828964233, 0.00013753771781921387, 0.0001603737473487854, 0.00018320977687835693, 0.00020604580640792847, 0.0002288818359375, 0.00025171786546707153, 0.00027455389499664307, 0.0002973899245262146, 0.00032022595405578613, 0.00034306198358535767, 0.0003658980131149292, 0.00038873404264450073, 0.00041157007217407227, 0.0004344061017036438, 0.00045724213123321533, 0.00048007816076278687, 0.0005029141902923584, 0.0005257502198219299, 0.0005485862493515015, 0.000571422278881073, 0.0005942583084106445, 0.0006170943379402161, 0.0006399303674697876, 0.0006627663969993591, 0.0006856024265289307, 0.0007084384560585022, 0.0007312744855880737, 0.0007541105151176453, 0.0007769465446472168]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 11.0, 10.0, 12.0, 15.0, 17.0, 23.0, 22.0, 31.0, 30.0, 33.0, 44.0, 42.0, 45.0, 44.0, 44.0, 56.0, 49.0, 59.0, 48.0, 44.0, 46.0, 41.0, 34.0, 40.0, 26.0, 15.0, 18.0, 12.0, 13.0, 15.0, 10.0, 9.0, 7.0, 9.0, 5.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.22357177734375, -5.0213623046875, -4.81915283203125, -4.616943359375, -4.41473388671875, -4.2125244140625, -4.01031494140625, -3.80810546875, -3.60589599609375, -3.4036865234375, -3.20147705078125, -2.999267578125, -2.79705810546875, -2.5948486328125, -2.39263916015625, -2.1904296875, -1.98822021484375, -1.7860107421875, -1.58380126953125, -1.381591796875, -1.17938232421875, -0.9771728515625, -0.77496337890625, -0.57275390625, -0.37054443359375, -0.1683349609375, 0.03387451171875, 0.236083984375, 0.43829345703125, 0.6405029296875, 0.84271240234375, 1.044921875, 1.24713134765625, 1.4493408203125, 1.65155029296875, 1.853759765625, 2.05596923828125, 2.2581787109375, 2.46038818359375, 2.66259765625, 2.86480712890625, 3.0670166015625, 3.26922607421875, 3.471435546875, 3.67364501953125, 3.8758544921875, 4.07806396484375, 4.2802734375, 4.48248291015625, 4.6846923828125, 4.88690185546875, 5.089111328125, 5.29132080078125, 5.4935302734375, 5.69573974609375, 5.89794921875, 6.10015869140625, 6.3023681640625, 6.50457763671875, 6.706787109375, 6.90899658203125, 7.1112060546875, 7.31341552734375, 7.515625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 18.0, 30.0, 36.0, 42.0, 91.0, 110.0, 167.0, 212.0, 286.0, 438.0, 645.0, 947.0, 1326.0, 2097.0, 3723.0, 9908.0, 94846.0, 781044.0, 130173.0, 11534.0, 4095.0, 2259.0, 1398.0, 908.0, 679.0, 459.0, 310.0, 222.0, 163.0, 119.0, 74.0, 59.0, 37.0, 29.0, 14.0, 14.0, 13.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.2225341796875, -17.679443359375, -17.1363525390625, -16.59326171875, -16.0501708984375, -15.507080078125, -14.9639892578125, -14.4208984375, -13.8778076171875, -13.334716796875, -12.7916259765625, -12.24853515625, -11.7054443359375, -11.162353515625, -10.6192626953125, -10.076171875, -9.5330810546875, -8.989990234375, -8.4468994140625, -7.90380859375, -7.3607177734375, -6.817626953125, -6.2745361328125, -5.7314453125, -5.1883544921875, -4.645263671875, -4.1021728515625, -3.55908203125, -3.0159912109375, -2.472900390625, -1.9298095703125, -1.38671875, -0.8436279296875, -0.300537109375, 0.2425537109375, 0.78564453125, 1.3287353515625, 1.871826171875, 2.4149169921875, 2.9580078125, 3.5010986328125, 4.044189453125, 4.5872802734375, 5.13037109375, 5.6734619140625, 6.216552734375, 6.7596435546875, 7.302734375, 7.8458251953125, 8.388916015625, 8.9320068359375, 9.47509765625, 10.0181884765625, 10.561279296875, 11.1043701171875, 11.6474609375, 12.1905517578125, 12.733642578125, 13.2767333984375, 13.81982421875, 14.3629150390625, 14.906005859375, 15.4490966796875, 15.9921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 10.0, 5.0, 10.0, 10.0, 10.0, 22.0, 15.0, 19.0, 21.0, 30.0, 30.0, 32.0, 41.0, 44.0, 61.0, 79.0, 203.0, 1546.0, 340.0, 123.0, 81.0, 58.0, 39.0, 28.0, 41.0, 31.0, 21.0, 18.0, 10.0, 12.0, 15.0, 7.0, 7.0, 2.0, 6.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.948486328125, -15.41259765625, -14.876708984375, -14.3408203125, -13.804931640625, -13.26904296875, -12.733154296875, -12.197265625, -11.661376953125, -11.12548828125, -10.589599609375, -10.0537109375, -9.517822265625, -8.98193359375, -8.446044921875, -7.91015625, -7.374267578125, -6.83837890625, -6.302490234375, -5.7666015625, -5.230712890625, -4.69482421875, -4.158935546875, -3.623046875, -3.087158203125, -2.55126953125, -2.015380859375, -1.4794921875, -0.943603515625, -0.40771484375, 0.128173828125, 0.6640625, 1.199951171875, 1.73583984375, 2.271728515625, 2.8076171875, 3.343505859375, 3.87939453125, 4.415283203125, 4.951171875, 5.487060546875, 6.02294921875, 6.558837890625, 7.0947265625, 7.630615234375, 8.16650390625, 8.702392578125, 9.23828125, 9.774169921875, 10.31005859375, 10.845947265625, 11.3818359375, 11.917724609375, 12.45361328125, 12.989501953125, 13.525390625, 14.061279296875, 14.59716796875, 15.133056640625, 15.6689453125, 16.204833984375, 16.74072265625, 17.276611328125, 17.8125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 13.0, 13.0, 12.0, 16.0, 19.0, 27.0, 48.0, 57.0, 85.0, 103.0, 126.0, 197.0, 274.0, 552.0, 1076.0, 3537.0, 3045729.0, 89396.0, 2221.0, 767.0, 443.0, 287.0, 193.0, 128.0, 86.0, 64.0, 61.0, 31.0, 28.0, 22.0, 24.0, 8.0, 11.0, 5.0, 5.0, 5.0, 4.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-54.71875, -53.0517578125, -51.384765625, -49.7177734375, -48.05078125, -46.3837890625, -44.716796875, -43.0498046875, -41.3828125, -39.7158203125, -38.048828125, -36.3818359375, -34.71484375, -33.0478515625, -31.380859375, -29.7138671875, -28.046875, -26.3798828125, -24.712890625, -23.0458984375, -21.37890625, -19.7119140625, -18.044921875, -16.3779296875, -14.7109375, -13.0439453125, -11.376953125, -9.7099609375, -8.04296875, -6.3759765625, -4.708984375, -3.0419921875, -1.375, 0.2919921875, 1.958984375, 3.6259765625, 5.29296875, 6.9599609375, 8.626953125, 10.2939453125, 11.9609375, 13.6279296875, 15.294921875, 16.9619140625, 18.62890625, 20.2958984375, 21.962890625, 23.6298828125, 25.296875, 26.9638671875, 28.630859375, 30.2978515625, 31.96484375, 33.6318359375, 35.298828125, 36.9658203125, 38.6328125, 40.2998046875, 41.966796875, 43.6337890625, 45.30078125, 46.9677734375, 48.634765625, 50.3017578125, 51.96875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 20.0, 38.0, 88.0, 125.0, 244.0, 227.0, 148.0, 58.0, 36.0, 12.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.71249389648438, -83.04866790771484, -81.38484191894531, -79.72101593017578, -78.05718994140625, -76.39336395263672, -74.72953796386719, -73.06571197509766, -71.40188598632812, -69.7380599975586, -68.07423400878906, -66.41040802001953, -64.74658203125, -63.08275604248047, -61.41893005371094, -59.755104064941406, -58.09128189086914, -56.42745590209961, -54.76362991333008, -53.09980392456055, -51.435977935791016, -49.772151947021484, -48.10832977294922, -46.44450378417969, -44.780677795410156, -43.116851806640625, -41.453025817871094, -39.78919982910156, -38.12537384033203, -36.4615478515625, -34.79772186279297, -33.13389587402344, -31.470069885253906, -29.806243896484375, -28.142417907714844, -26.478591918945312, -24.81476593017578, -23.15093994140625, -21.48711585998535, -19.82328987121582, -18.15946388244629, -16.495637893676758, -14.831811904907227, -13.167986869812012, -11.50416088104248, -9.84033489227295, -8.176509857177734, -6.512683868408203, -4.848857879638672, -3.1850321292877197, -1.5212063789367676, 0.14261913299560547, 1.8064451217651367, 3.470271110534668, 5.134096145629883, 6.797922134399414, 8.461748123168945, 10.125574111938477, 11.789400100708008, 13.453225135803223, 15.117051124572754, 16.78087615966797, 18.4447021484375, 20.10852813720703, 21.772354125976562]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 12.0, 9.0, 7.0, 12.0, 17.0, 11.0, 16.0, 18.0, 26.0, 23.0, 36.0, 35.0, 37.0, 36.0, 45.0, 48.0, 30.0, 45.0, 46.0, 46.0, 50.0, 41.0, 43.0, 27.0, 36.0, 27.0, 30.0, 22.0, 25.0, 20.0, 11.0, 20.0, 18.0, 14.0, 11.0, 12.0, 5.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-43.41010665893555, -42.07524871826172, -40.740386962890625, -39.40552520751953, -38.0706672668457, -36.735809326171875, -35.40094757080078, -34.06608581542969, -32.73122787475586, -31.3963680267334, -30.061508178710938, -28.726648330688477, -27.391788482666016, -26.056928634643555, -24.722068786621094, -23.387208938598633, -22.052349090576172, -20.71748924255371, -19.38262939453125, -18.04776954650879, -16.712909698486328, -15.378049850463867, -14.043190002441406, -12.708330154418945, -11.373470306396484, -10.038610458374023, -8.703750610351562, -7.368890762329102, -6.034030914306641, -4.69917106628418, -3.3643112182617188, -2.029451370239258, -0.6945877075195312, 0.6402721405029297, 1.9751319885253906, 3.3099918365478516, 4.6448516845703125, 5.979711532592773, 7.314571380615234, 8.649431228637695, 9.984291076660156, 11.319150924682617, 12.654010772705078, 13.988870620727539, 15.32373046875, 16.65859031677246, 17.993450164794922, 19.328310012817383, 20.663169860839844, 21.998029708862305, 23.332889556884766, 24.667749404907227, 26.002609252929688, 27.33746910095215, 28.67232894897461, 30.00718879699707, 31.34204864501953, 32.676910400390625, 34.01176834106445, 35.34662628173828, 36.681488037109375, 38.01634979248047, 39.3512077331543, 40.686065673828125, 42.02092742919922]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 4.0, 6.0, 7.0, 8.0, 7.0, 6.0, 8.0, 17.0, 10.0, 16.0, 5.0, 32.0, 18.0, 26.0, 28.0, 30.0, 36.0, 35.0, 41.0, 56.0, 36.0, 31.0, 43.0, 41.0, 49.0, 39.0, 29.0, 36.0, 41.0, 31.0, 32.0, 27.0, 27.0, 26.0, 14.0, 17.0, 9.0, 9.0, 20.0, 14.0, 5.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.5546875, -5.37420654296875, -5.1937255859375, -5.01324462890625, -4.832763671875, -4.65228271484375, -4.4718017578125, -4.29132080078125, -4.11083984375, -3.93035888671875, -3.7498779296875, -3.56939697265625, -3.388916015625, -3.20843505859375, -3.0279541015625, -2.84747314453125, -2.6669921875, -2.48651123046875, -2.3060302734375, -2.12554931640625, -1.945068359375, -1.76458740234375, -1.5841064453125, -1.40362548828125, -1.22314453125, -1.04266357421875, -0.8621826171875, -0.68170166015625, -0.501220703125, -0.32073974609375, -0.1402587890625, 0.04022216796875, 0.220703125, 0.40118408203125, 0.5816650390625, 0.76214599609375, 0.942626953125, 1.12310791015625, 1.3035888671875, 1.48406982421875, 1.66455078125, 1.84503173828125, 2.0255126953125, 2.20599365234375, 2.386474609375, 2.56695556640625, 2.7474365234375, 2.92791748046875, 3.1083984375, 3.28887939453125, 3.4693603515625, 3.64984130859375, 3.830322265625, 4.01080322265625, 4.1912841796875, 4.37176513671875, 4.55224609375, 4.73272705078125, 4.9132080078125, 5.09368896484375, 5.274169921875, 5.45465087890625, 5.6351318359375, 5.81561279296875, 5.99609375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 15.0, 11.0, 22.0, 20.0, 17.0, 25.0, 33.0, 40.0, 61.0, 83.0, 173.0, 239.0, 444.0, 957.0, 2286.0, 6496.0, 29746.0, 301516.0, 2311742.0, 1391874.0, 125159.0, 15855.0, 4208.0, 1595.0, 716.0, 343.0, 178.0, 113.0, 65.0, 48.0, 36.0, 24.0, 27.0, 21.0, 14.0, 13.0, 8.0, 8.0, 10.0, 9.0, 3.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-12.3984375, -12.0089111328125, -11.619384765625, -11.2298583984375, -10.84033203125, -10.4508056640625, -10.061279296875, -9.6717529296875, -9.2822265625, -8.8927001953125, -8.503173828125, -8.1136474609375, -7.72412109375, -7.3345947265625, -6.945068359375, -6.5555419921875, -6.166015625, -5.7764892578125, -5.386962890625, -4.9974365234375, -4.60791015625, -4.2183837890625, -3.828857421875, -3.4393310546875, -3.0498046875, -2.6602783203125, -2.270751953125, -1.8812255859375, -1.49169921875, -1.1021728515625, -0.712646484375, -0.3231201171875, 0.06640625, 0.4559326171875, 0.845458984375, 1.2349853515625, 1.62451171875, 2.0140380859375, 2.403564453125, 2.7930908203125, 3.1826171875, 3.5721435546875, 3.961669921875, 4.3511962890625, 4.74072265625, 5.1302490234375, 5.519775390625, 5.9093017578125, 6.298828125, 6.6883544921875, 7.077880859375, 7.4674072265625, 7.85693359375, 8.2464599609375, 8.635986328125, 9.0255126953125, 9.4150390625, 9.8045654296875, 10.194091796875, 10.5836181640625, 10.97314453125, 11.3626708984375, 11.752197265625, 12.1417236328125, 12.53125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 10.0, 17.0, 43.0, 90.0, 187.0, 427.0, 750.0, 1106.0, 686.0, 385.0, 211.0, 91.0, 43.0, 16.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.5625, -21.797607421875, -21.03271484375, -20.267822265625, -19.5029296875, -18.738037109375, -17.97314453125, -17.208251953125, -16.443359375, -15.678466796875, -14.91357421875, -14.148681640625, -13.3837890625, -12.618896484375, -11.85400390625, -11.089111328125, -10.32421875, -9.559326171875, -8.79443359375, -8.029541015625, -7.2646484375, -6.499755859375, -5.73486328125, -4.969970703125, -4.205078125, -3.440185546875, -2.67529296875, -1.910400390625, -1.1455078125, -0.380615234375, 0.38427734375, 1.149169921875, 1.9140625, 2.678955078125, 3.44384765625, 4.208740234375, 4.9736328125, 5.738525390625, 6.50341796875, 7.268310546875, 8.033203125, 8.798095703125, 9.56298828125, 10.327880859375, 11.0927734375, 11.857666015625, 12.62255859375, 13.387451171875, 14.15234375, 14.917236328125, 15.68212890625, 16.447021484375, 17.2119140625, 17.976806640625, 18.74169921875, 19.506591796875, 20.271484375, 21.036376953125, 21.80126953125, 22.566162109375, 23.3310546875, 24.095947265625, 24.86083984375, 25.625732421875, 26.390625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 12.0, 9.0, 19.0, 31.0, 65.0, 135.0, 377.0, 1011.0, 3629.0, 497735.0, 3683045.0, 6097.0, 1308.0, 474.0, 174.0, 76.0, 39.0, 13.0, 10.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.90625, -52.37158203125, -50.8369140625, -49.30224609375, -47.767578125, -46.23291015625, -44.6982421875, -43.16357421875, -41.62890625, -40.09423828125, -38.5595703125, -37.02490234375, -35.490234375, -33.95556640625, -32.4208984375, -30.88623046875, -29.3515625, -27.81689453125, -26.2822265625, -24.74755859375, -23.212890625, -21.67822265625, -20.1435546875, -18.60888671875, -17.07421875, -15.53955078125, -14.0048828125, -12.47021484375, -10.935546875, -9.40087890625, -7.8662109375, -6.33154296875, -4.796875, -3.26220703125, -1.7275390625, -0.19287109375, 1.341796875, 2.87646484375, 4.4111328125, 5.94580078125, 7.48046875, 9.01513671875, 10.5498046875, 12.08447265625, 13.619140625, 15.15380859375, 16.6884765625, 18.22314453125, 19.7578125, 21.29248046875, 22.8271484375, 24.36181640625, 25.896484375, 27.43115234375, 28.9658203125, 30.50048828125, 32.03515625, 33.56982421875, 35.1044921875, 36.63916015625, 38.173828125, 39.70849609375, 41.2431640625, 42.77783203125, 44.3125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 132.0, 449.0, 348.0, 62.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.23599243164062, -200.54342651367188, -195.85084533691406, -191.1582794189453, -186.4656982421875, -181.77313232421875, -177.08056640625, -172.3879852294922, -167.69541931152344, -163.0028533935547, -158.31027221679688, -153.61770629882812, -148.9251251220703, -144.23255920410156, -139.53997802734375, -134.847412109375, -130.15484619140625, -125.46227264404297, -120.76969909667969, -116.07713317871094, -111.38455963134766, -106.69198608398438, -101.9994125366211, -97.30683898925781, -92.6142578125, -87.92168426513672, -83.22911071777344, -78.53654479980469, -73.8439712524414, -69.15139770507812, -64.45882415771484, -59.76625442504883, -55.07367706298828, -50.381103515625, -45.688533782958984, -40.9959602355957, -36.30339050292969, -31.610816955566406, -26.918243408203125, -22.22567367553711, -17.533100128173828, -12.84052848815918, -8.147955894470215, -3.45538330078125, 1.2371883392333984, 5.929759979248047, 10.622333526611328, 15.314903259277344, 20.007476806640625, 24.700048446655273, 29.392620086669922, 34.0851936340332, 38.77776336669922, 43.4703369140625, 48.16291046142578, 52.8554801940918, 57.54805374145508, 62.24062728881836, 66.93319702148438, 71.62577056884766, 76.31834411621094, 81.01091003417969, 85.7034912109375, 90.39605712890625, 95.08863067626953]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 5.0, 12.0, 8.0, 14.0, 11.0, 13.0, 16.0, 17.0, 24.0, 25.0, 28.0, 26.0, 23.0, 39.0, 22.0, 24.0, 39.0, 29.0, 45.0, 26.0, 42.0, 47.0, 38.0, 29.0, 39.0, 42.0, 32.0, 35.0, 29.0, 31.0, 31.0, 19.0, 20.0, 12.0, 18.0, 17.0, 6.0, 11.0, 11.0, 5.0, 3.0, 4.0, 5.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0], "bins": [-40.54632568359375, -39.32184600830078, -38.09736633300781, -36.872886657714844, -35.648406982421875, -34.423927307128906, -33.19944763183594, -31.974964141845703, -30.750484466552734, -29.526004791259766, -28.301525115966797, -27.077045440673828, -25.852563858032227, -24.628084182739258, -23.40360450744629, -22.179122924804688, -20.95464515686035, -19.730165481567383, -18.505685806274414, -17.281204223632812, -16.056724548339844, -14.832244873046875, -13.607765197753906, -12.383284568786621, -11.158804893493652, -9.934325218200684, -8.709844589233398, -7.48536491394043, -6.260884761810303, -5.036404609680176, -3.811924934387207, -2.587444305419922, -1.3629646301269531, -0.13848459720611572, 1.0859954357147217, 2.3104753494262695, 3.5349555015563965, 4.759435653686523, 5.983915328979492, 7.208395957946777, 8.432875633239746, 9.657355308532715, 10.8818359375, 12.106315612792969, 13.330795288085938, 14.555275917053223, 15.779755592346191, 17.004236221313477, 18.228715896606445, 19.453195571899414, 20.677675247192383, 21.902156829833984, 23.126636505126953, 24.351116180419922, 25.57559585571289, 26.80007553100586, 28.024555206298828, 29.249034881591797, 30.473514556884766, 31.697994232177734, 32.9224739074707, 34.14695739746094, 35.371437072753906, 36.595916748046875, 37.820396423339844]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 4.0, 10.0, 14.0, 11.0, 23.0, 21.0, 28.0, 28.0, 33.0, 35.0, 26.0, 43.0, 47.0, 54.0, 47.0, 61.0, 40.0, 64.0, 53.0, 42.0, 33.0, 30.0, 48.0, 28.0, 23.0, 25.0, 24.0, 20.0, 20.0, 13.0, 15.0, 8.0, 3.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8828125, -5.7059326171875, -5.529052734375, -5.3521728515625, -5.17529296875, -4.9984130859375, -4.821533203125, -4.6446533203125, -4.4677734375, -4.2908935546875, -4.114013671875, -3.9371337890625, -3.76025390625, -3.5833740234375, -3.406494140625, -3.2296142578125, -3.052734375, -2.8758544921875, -2.698974609375, -2.5220947265625, -2.34521484375, -2.1683349609375, -1.991455078125, -1.8145751953125, -1.6376953125, -1.4608154296875, -1.283935546875, -1.1070556640625, -0.93017578125, -0.7532958984375, -0.576416015625, -0.3995361328125, -0.22265625, -0.0457763671875, 0.131103515625, 0.3079833984375, 0.48486328125, 0.6617431640625, 0.838623046875, 1.0155029296875, 1.1923828125, 1.3692626953125, 1.546142578125, 1.7230224609375, 1.89990234375, 2.0767822265625, 2.253662109375, 2.4305419921875, 2.607421875, 2.7843017578125, 2.961181640625, 3.1380615234375, 3.31494140625, 3.4918212890625, 3.668701171875, 3.8455810546875, 4.0224609375, 4.1993408203125, 4.376220703125, 4.5531005859375, 4.72998046875, 4.9068603515625, 5.083740234375, 5.2606201171875, 5.4375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 18.0, 25.0, 36.0, 41.0, 70.0, 131.0, 152.0, 306.0, 474.0, 737.0, 1189.0, 2026.0, 3363.0, 5930.0, 9814.0, 17221.0, 29763.0, 52600.0, 100635.0, 295068.0, 302427.0, 101671.0, 52959.0, 29995.0, 17270.0, 10093.0, 5857.0, 3400.0, 2078.0, 1204.0, 724.0, 467.0, 285.0, 179.0, 110.0, 65.0, 55.0, 36.0, 20.0, 13.0, 12.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.37109375, -1.326873779296875, -1.28265380859375, -1.238433837890625, -1.1942138671875, -1.149993896484375, -1.10577392578125, -1.061553955078125, -1.017333984375, -0.973114013671875, -0.92889404296875, -0.884674072265625, -0.8404541015625, -0.796234130859375, -0.75201416015625, -0.707794189453125, -0.66357421875, -0.619354248046875, -0.57513427734375, -0.530914306640625, -0.4866943359375, -0.442474365234375, -0.39825439453125, -0.354034423828125, -0.309814453125, -0.265594482421875, -0.22137451171875, -0.177154541015625, -0.1329345703125, -0.088714599609375, -0.04449462890625, -0.000274658203125, 0.0439453125, 0.088165283203125, 0.13238525390625, 0.176605224609375, 0.2208251953125, 0.265045166015625, 0.30926513671875, 0.353485107421875, 0.397705078125, 0.441925048828125, 0.48614501953125, 0.530364990234375, 0.5745849609375, 0.618804931640625, 0.66302490234375, 0.707244873046875, 0.75146484375, 0.795684814453125, 0.83990478515625, 0.884124755859375, 0.9283447265625, 0.972564697265625, 1.01678466796875, 1.061004638671875, 1.105224609375, 1.149444580078125, 1.19366455078125, 1.237884521484375, 1.2821044921875, 1.326324462890625, 1.37054443359375, 1.414764404296875, 1.458984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 19.0, 19.0, 24.0, 21.0, 24.0, 24.0, 23.0, 25.0, 26.0, 39.0, 38.0, 38.0, 35.0, 42.0, 30.0, 31.0, 1057.0, 38.0, 29.0, 32.0, 51.0, 34.0, 35.0, 34.0, 26.0, 27.0, 24.0, 19.0, 29.0, 27.0, 16.0, 13.0, 11.0, 9.0, 10.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.724609375, -2.634552001953125, -2.54449462890625, -2.454437255859375, -2.3643798828125, -2.274322509765625, -2.18426513671875, -2.094207763671875, -2.004150390625, -1.914093017578125, -1.82403564453125, -1.733978271484375, -1.6439208984375, -1.553863525390625, -1.46380615234375, -1.373748779296875, -1.28369140625, -1.193634033203125, -1.10357666015625, -1.013519287109375, -0.9234619140625, -0.833404541015625, -0.74334716796875, -0.653289794921875, -0.563232421875, -0.473175048828125, -0.38311767578125, -0.293060302734375, -0.2030029296875, -0.112945556640625, -0.02288818359375, 0.067169189453125, 0.1572265625, 0.247283935546875, 0.33734130859375, 0.427398681640625, 0.5174560546875, 0.607513427734375, 0.69757080078125, 0.787628173828125, 0.877685546875, 0.967742919921875, 1.05780029296875, 1.147857666015625, 1.2379150390625, 1.327972412109375, 1.41802978515625, 1.508087158203125, 1.59814453125, 1.688201904296875, 1.77825927734375, 1.868316650390625, 1.9583740234375, 2.048431396484375, 2.13848876953125, 2.228546142578125, 2.318603515625, 2.408660888671875, 2.49871826171875, 2.588775634765625, 2.6788330078125, 2.768890380859375, 2.85894775390625, 2.949005126953125, 3.0390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 17.0, 13.0, 19.0, 31.0, 52.0, 70.0, 93.0, 150.0, 239.0, 345.0, 558.0, 778.0, 1212.0, 1990.0, 3228.0, 5474.0, 8968.0, 15079.0, 25405.0, 43650.0, 78100.0, 149334.0, 1393670.0, 167007.0, 85568.0, 47351.0, 27490.0, 16121.0, 9693.0, 5818.0, 3574.0, 2199.0, 1337.0, 892.0, 573.0, 344.0, 241.0, 135.0, 103.0, 70.0, 33.0, 36.0, 24.0, 13.0, 15.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.2294921875, -1.19287109375, -1.15625, -1.11962890625, -1.0830078125, -1.04638671875, -1.009765625, -0.97314453125, -0.9365234375, -0.89990234375, -0.86328125, -0.82666015625, -0.7900390625, -0.75341796875, -0.716796875, -0.68017578125, -0.6435546875, -0.60693359375, -0.5703125, -0.53369140625, -0.4970703125, -0.46044921875, -0.423828125, -0.38720703125, -0.3505859375, -0.31396484375, -0.27734375, -0.24072265625, -0.2041015625, -0.16748046875, -0.130859375, -0.09423828125, -0.0576171875, -0.02099609375, 0.015625, 0.05224609375, 0.0888671875, 0.12548828125, 0.162109375, 0.19873046875, 0.2353515625, 0.27197265625, 0.30859375, 0.34521484375, 0.3818359375, 0.41845703125, 0.455078125, 0.49169921875, 0.5283203125, 0.56494140625, 0.6015625, 0.63818359375, 0.6748046875, 0.71142578125, 0.748046875, 0.78466796875, 0.8212890625, 0.85791015625, 0.89453125, 0.93115234375, 0.9677734375, 1.00439453125, 1.041015625, 1.07763671875, 1.1142578125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 12.0, 9.0, 10.0, 16.0, 19.0, 23.0, 31.0, 37.0, 66.0, 87.0, 147.0, 146.0, 112.0, 78.0, 46.0, 31.0, 27.0, 26.0, 12.0, 9.0, 13.0, 4.0, 3.0, 5.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006079673767089844, -0.0005829855799674988, -0.0005580037832260132, -0.0005330219864845276, -0.000508040189743042, -0.0004830583930015564, -0.0004580765962600708, -0.0004330947995185852, -0.0004081130027770996, -0.000383131206035614, -0.0003581494092941284, -0.0003331676125526428, -0.0003081858158111572, -0.00028320401906967163, -0.00025822222232818604, -0.00023324042558670044, -0.00020825862884521484, -0.00018327683210372925, -0.00015829503536224365, -0.00013331323862075806, -0.00010833144187927246, -8.334964513778687e-05, -5.836784839630127e-05, -3.3386051654815674e-05, -8.404254913330078e-06, 1.6577541828155518e-05, 4.155933856964111e-05, 6.654113531112671e-05, 9.15229320526123e-05, 0.0001165047287940979, 0.0001414865255355835, 0.0001664683222770691, 0.0001914501190185547, 0.00021643191576004028, 0.00024141371250152588, 0.0002663955092430115, 0.00029137730598449707, 0.00031635910272598267, 0.00034134089946746826, 0.00036632269620895386, 0.00039130449295043945, 0.00041628628969192505, 0.00044126808643341064, 0.00046624988317489624, 0.0004912316799163818, 0.0005162134766578674, 0.000541195273399353, 0.0005661770701408386, 0.0005911588668823242, 0.0006161406636238098, 0.0006411224603652954, 0.000666104257106781, 0.0006910860538482666, 0.0007160678505897522, 0.0007410496473312378, 0.0007660314440727234, 0.000791013240814209, 0.0008159950375556946, 0.0008409768342971802, 0.0008659586310386658, 0.0008909404277801514, 0.000915922224521637, 0.0009409040212631226, 0.0009658858180046082, 0.0009908676147460938]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 7.0, 12.0, 16.0, 29.0, 26.0, 31.0, 50.0, 87.0, 104.0, 191.0, 295.0, 679.0, 2711.0, 1034795.0, 7598.0, 824.0, 376.0, 225.0, 150.0, 95.0, 45.0, 51.0, 36.0, 16.0, 18.0, 11.0, 8.0, 9.0, 11.0, 5.0, 8.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.018463134765625, -0.017984867095947266, -0.01750659942626953, -0.017028331756591797, -0.016550064086914062, -0.016071796417236328, -0.015593528747558594, -0.01511526107788086, -0.014636993408203125, -0.01415872573852539, -0.013680458068847656, -0.013202190399169922, -0.012723922729492188, -0.012245655059814453, -0.011767387390136719, -0.011289119720458984, -0.01081085205078125, -0.010332584381103516, -0.009854316711425781, -0.009376049041748047, -0.008897781372070312, -0.008419513702392578, -0.007941246032714844, -0.007462978363037109, -0.006984710693359375, -0.006506443023681641, -0.006028175354003906, -0.005549907684326172, -0.0050716400146484375, -0.004593372344970703, -0.004115104675292969, -0.0036368370056152344, -0.0031585693359375, -0.0026803016662597656, -0.0022020339965820312, -0.0017237663269042969, -0.0012454986572265625, -0.0007672309875488281, -0.00028896331787109375, 0.00018930435180664062, 0.000667572021484375, 0.0011458396911621094, 0.0016241073608398438, 0.002102375030517578, 0.0025806427001953125, 0.003058910369873047, 0.0035371780395507812, 0.004015445709228516, 0.00449371337890625, 0.004971981048583984, 0.005450248718261719, 0.005928516387939453, 0.0064067840576171875, 0.006885051727294922, 0.007363319396972656, 0.00784158706665039, 0.008319854736328125, 0.00879812240600586, 0.009276390075683594, 0.009754657745361328, 0.010232925415039062, 0.010711193084716797, 0.011189460754394531, 0.011667728424072266, 0.01214599609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 30.0, 129.0, 296.0, 368.0, 140.0, 37.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006605072994716465, -0.0006318026571534574, -0.0006030980148352683, -0.0005743933725170791, -0.0005456887884065509, -0.0005169841460883617, -0.0004882795037701726, -0.00045957486145198345, -0.0004308702191337943, -0.00040216557681560516, -0.000373460934497416, -0.00034475632128305733, -0.0003160516789648682, -0.00028734703664667904, -0.00025864242343232036, -0.0002299377811141312, -0.00020123313879594207, -0.00017252849647775292, -0.000143823868711479, -0.00011511923366924748, -8.641459862701595e-05, -5.7709956308826804e-05, -2.900532854255289e-05, -3.007007762789726e-07, 2.840394154191017e-05, 5.71085765841417e-05, 8.581321162637323e-05, 0.00011451784666860476, 0.0001432224817108363, 0.00017192712402902544, 0.00020063175179529935, 0.00022933637956157327, 0.0002580409636721015, 0.00028674560599029064, 0.0003154502483084798, 0.0003441548615228385, 0.0003728595038410276, 0.00040156414615921676, 0.00043026875937357545, 0.0004589734016917646, 0.00048767804400995374, 0.0005163826863281429, 0.000545087328646332, 0.0005737919709645212, 0.0006024965550750494, 0.0006312011973932385, 0.0006599058397114277, 0.0006886104820296168, 0.000717315124347806, 0.0007460197666659951, 0.0007747244089841843, 0.0008034290513023734, 0.0008321336936205626, 0.0008608383359387517, 0.0008895429200492799, 0.0009182475623674691, 0.0009469522046856582, 0.0009756568470038474, 0.0010043614311143756, 0.0010330660734325647, 0.0010617707157507539, 0.001090475358068943, 0.0011191800003871322, 0.0011478846427053213, 0.0011765892850235105]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 11.0, 14.0, 6.0, 11.0, 15.0, 20.0, 12.0, 9.0, 12.0, 24.0, 29.0, 36.0, 36.0, 27.0, 28.0, 27.0, 33.0, 45.0, 44.0, 36.0, 38.0, 41.0, 35.0, 28.0, 32.0, 31.0, 29.0, 33.0, 36.0, 19.0, 18.0, 27.0, 26.0, 17.0, 26.0, 10.0, 10.0, 13.0, 16.0, 4.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.00029647350311279297, -0.0002877218648791313, -0.00027897022664546967, -0.000270218588411808, -0.00026146695017814636, -0.0002527153119444847, -0.00024396367371082306, -0.0002352120354771614, -0.00022646039724349976, -0.0002177087590098381, -0.00020895712077617645, -0.0002002054825425148, -0.00019145384430885315, -0.0001827022060751915, -0.00017395056784152985, -0.0001651989296078682, -0.00015644729137420654, -0.0001476956531405449, -0.00013894401490688324, -0.0001301923766732216, -0.00012144073843955994, -0.00011268910020589828, -0.00010393746197223663, -9.518582373857498e-05, -8.643418550491333e-05, -7.768254727125168e-05, -6.893090903759003e-05, -6.0179270803928375e-05, -5.1427632570266724e-05, -4.267599433660507e-05, -3.392435610294342e-05, -2.517271786928177e-05, -1.6421079635620117e-05, -7.669441401958466e-06, 1.082196831703186e-06, 9.833835065364838e-06, 1.858547329902649e-05, 2.733711153268814e-05, 3.608874976634979e-05, 4.4840388000011444e-05, 5.3592026233673096e-05, 6.234366446733475e-05, 7.10953027009964e-05, 7.984694093465805e-05, 8.85985791683197e-05, 9.735021740198135e-05, 0.000106101855635643, 0.00011485349386930466, 0.0001236051321029663, 0.00013235677033662796, 0.0001411084085702896, 0.00014986004680395126, 0.00015861168503761292, 0.00016736332327127457, 0.00017611496150493622, 0.00018486659973859787, 0.00019361823797225952, 0.00020236987620592117, 0.00021112151443958282, 0.00021987315267324448, 0.00022862479090690613, 0.00023737642914056778, 0.00024612806737422943, 0.0002548797056078911, 0.00026363134384155273]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 4.0, 10.0, 14.0, 11.0, 23.0, 21.0, 28.0, 28.0, 33.0, 35.0, 26.0, 43.0, 47.0, 54.0, 47.0, 61.0, 40.0, 64.0, 53.0, 42.0, 33.0, 30.0, 48.0, 27.0, 24.0, 25.0, 24.0, 20.0, 20.0, 13.0, 15.0, 8.0, 3.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8828125, -5.7059326171875, -5.529052734375, -5.3521728515625, -5.17529296875, -4.9984130859375, -4.821533203125, -4.6446533203125, -4.4677734375, -4.2908935546875, -4.114013671875, -3.9371337890625, -3.76025390625, -3.5833740234375, -3.406494140625, -3.2296142578125, -3.052734375, -2.8758544921875, -2.698974609375, -2.5220947265625, -2.34521484375, -2.1683349609375, -1.991455078125, -1.8145751953125, -1.6376953125, -1.4608154296875, -1.283935546875, -1.1070556640625, -0.93017578125, -0.7532958984375, -0.576416015625, -0.3995361328125, -0.22265625, -0.0457763671875, 0.131103515625, 0.3079833984375, 0.48486328125, 0.6617431640625, 0.838623046875, 1.0155029296875, 1.1923828125, 1.3692626953125, 1.546142578125, 1.7230224609375, 1.89990234375, 2.0767822265625, 2.253662109375, 2.4305419921875, 2.607421875, 2.7843017578125, 2.961181640625, 3.1380615234375, 3.31494140625, 3.4918212890625, 3.668701171875, 3.8455810546875, 4.0224609375, 4.1993408203125, 4.376220703125, 4.5531005859375, 4.72998046875, 4.9068603515625, 5.083740234375, 5.2606201171875, 5.4375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 14.0, 16.0, 22.0, 41.0, 49.0, 64.0, 87.0, 119.0, 161.0, 219.0, 312.0, 429.0, 642.0, 1074.0, 2028.0, 4172.0, 10842.0, 41189.0, 276733.0, 586309.0, 92021.0, 19034.0, 6249.0, 2652.0, 1397.0, 832.0, 549.0, 360.0, 252.0, 169.0, 136.0, 95.0, 81.0, 52.0, 38.0, 33.0, 17.0, 18.0, 13.0, 8.0, 10.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.4530029296875, -8.163818359375, -7.8746337890625, -7.58544921875, -7.2962646484375, -7.007080078125, -6.7178955078125, -6.4287109375, -6.1395263671875, -5.850341796875, -5.5611572265625, -5.27197265625, -4.9827880859375, -4.693603515625, -4.4044189453125, -4.115234375, -3.8260498046875, -3.536865234375, -3.2476806640625, -2.95849609375, -2.6693115234375, -2.380126953125, -2.0909423828125, -1.8017578125, -1.5125732421875, -1.223388671875, -0.9342041015625, -0.64501953125, -0.3558349609375, -0.066650390625, 0.2225341796875, 0.51171875, 0.8009033203125, 1.090087890625, 1.3792724609375, 1.66845703125, 1.9576416015625, 2.246826171875, 2.5360107421875, 2.8251953125, 3.1143798828125, 3.403564453125, 3.6927490234375, 3.98193359375, 4.2711181640625, 4.560302734375, 4.8494873046875, 5.138671875, 5.4278564453125, 5.717041015625, 6.0062255859375, 6.29541015625, 6.5845947265625, 6.873779296875, 7.1629638671875, 7.4521484375, 7.7413330078125, 8.030517578125, 8.3197021484375, 8.60888671875, 8.8980712890625, 9.187255859375, 9.4764404296875, 9.765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 7.0, 20.0, 17.0, 16.0, 25.0, 36.0, 47.0, 51.0, 49.0, 69.0, 112.0, 404.0, 1651.0, 124.0, 83.0, 77.0, 53.0, 30.0, 34.0, 28.0, 28.0, 10.0, 4.0, 12.0, 11.0, 8.0, 7.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.953125, -19.351806640625, -18.75048828125, -18.149169921875, -17.5478515625, -16.946533203125, -16.34521484375, -15.743896484375, -15.142578125, -14.541259765625, -13.93994140625, -13.338623046875, -12.7373046875, -12.135986328125, -11.53466796875, -10.933349609375, -10.33203125, -9.730712890625, -9.12939453125, -8.528076171875, -7.9267578125, -7.325439453125, -6.72412109375, -6.122802734375, -5.521484375, -4.920166015625, -4.31884765625, -3.717529296875, -3.1162109375, -2.514892578125, -1.91357421875, -1.312255859375, -0.7109375, -0.109619140625, 0.49169921875, 1.093017578125, 1.6943359375, 2.295654296875, 2.89697265625, 3.498291015625, 4.099609375, 4.700927734375, 5.30224609375, 5.903564453125, 6.5048828125, 7.106201171875, 7.70751953125, 8.308837890625, 8.91015625, 9.511474609375, 10.11279296875, 10.714111328125, 11.3154296875, 11.916748046875, 12.51806640625, 13.119384765625, 13.720703125, 14.322021484375, 14.92333984375, 15.524658203125, 16.1259765625, 16.727294921875, 17.32861328125, 17.929931640625, 18.53125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 8.0, 4.0, 14.0, 6.0, 16.0, 25.0, 33.0, 55.0, 95.0, 113.0, 174.0, 339.0, 766.0, 5458.0, 3131864.0, 4998.0, 819.0, 336.0, 225.0, 115.0, 78.0, 51.0, 36.0, 28.0, 13.0, 15.0, 8.0, 5.0, 5.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.09814453125, -45.6025390625, -44.10693359375, -42.611328125, -41.11572265625, -39.6201171875, -38.12451171875, -36.62890625, -35.13330078125, -33.6376953125, -32.14208984375, -30.646484375, -29.15087890625, -27.6552734375, -26.15966796875, -24.6640625, -23.16845703125, -21.6728515625, -20.17724609375, -18.681640625, -17.18603515625, -15.6904296875, -14.19482421875, -12.69921875, -11.20361328125, -9.7080078125, -8.21240234375, -6.716796875, -5.22119140625, -3.7255859375, -2.22998046875, -0.734375, 0.76123046875, 2.2568359375, 3.75244140625, 5.248046875, 6.74365234375, 8.2392578125, 9.73486328125, 11.23046875, 12.72607421875, 14.2216796875, 15.71728515625, 17.212890625, 18.70849609375, 20.2041015625, 21.69970703125, 23.1953125, 24.69091796875, 26.1865234375, 27.68212890625, 29.177734375, 30.67333984375, 32.1689453125, 33.66455078125, 35.16015625, 36.65576171875, 38.1513671875, 39.64697265625, 41.142578125, 42.63818359375, 44.1337890625, 45.62939453125, 47.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 245.0, 734.0, 33.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.6597900390625, -97.63075256347656, -93.60172271728516, -89.57269287109375, -85.54365539550781, -81.51461791992188, -77.48558807373047, -73.45655822753906, -69.42752075195312, -65.39848327636719, -61.36945343017578, -57.34041976928711, -53.31138610839844, -49.282352447509766, -45.253318786621094, -41.22428512573242, -37.19525146484375, -33.16621780395508, -29.137184143066406, -25.108150482177734, -21.079116821289062, -17.05008316040039, -13.021049499511719, -8.992015838623047, -4.962982177734375, -0.9339485168457031, 3.0950851440429688, 7.124118804931641, 11.153152465820312, 15.182186126708984, 19.211219787597656, 23.240253448486328, 27.269302368164062, 31.298336029052734, 35.327369689941406, 39.35640335083008, 43.38543701171875, 47.41447067260742, 51.443504333496094, 55.472537994384766, 59.50157165527344, 63.53060531616211, 67.55963897705078, 71.58866882324219, 75.61770629882812, 79.64674377441406, 83.67577362060547, 87.70480346679688, 91.73384094238281, 95.76287841796875, 99.79190826416016, 103.82093811035156, 107.8499755859375, 111.87901306152344, 115.90804290771484, 119.93707275390625, 123.96611022949219, 127.99514770507812, 132.024169921875, 136.05320739746094, 140.08224487304688, 144.1112823486328, 148.14031982421875, 152.16934204101562, 156.19837951660156]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 3.0, 10.0, 16.0, 8.0, 15.0, 19.0, 19.0, 19.0, 18.0, 14.0, 26.0, 31.0, 36.0, 31.0, 27.0, 45.0, 37.0, 44.0, 56.0, 42.0, 54.0, 38.0, 35.0, 40.0, 40.0, 37.0, 20.0, 36.0, 22.0, 28.0, 19.0, 23.0, 19.0, 16.0, 16.0, 10.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-35.77206039428711, -34.684051513671875, -33.59604263305664, -32.508033752441406, -31.420026779174805, -30.33201789855957, -29.24401092529297, -28.156002044677734, -27.0679931640625, -25.979984283447266, -24.89197540283203, -23.80396842956543, -22.715959548950195, -21.62795066833496, -20.53994369506836, -19.451934814453125, -18.36392593383789, -17.275917053222656, -16.187908172607422, -15.09990119934082, -14.011892318725586, -12.923883438110352, -11.835875511169434, -10.747867584228516, -9.659858703613281, -8.571849822998047, -7.483841896057129, -6.395833492279053, -5.307825088500977, -4.2198166847229, -3.131808280944824, -2.043799877166748, -0.9557952880859375, 0.13221311569213867, 1.2202215194702148, 2.308229923248291, 3.396238327026367, 4.484246730804443, 5.5722551345825195, 6.660263538360596, 7.748271942138672, 8.836280822753906, 9.924288749694824, 11.012296676635742, 12.100305557250977, 13.188314437866211, 14.276322364807129, 15.364330291748047, 16.45233917236328, 17.540348052978516, 18.62835693359375, 19.71636390686035, 20.804372787475586, 21.89238166809082, 22.980388641357422, 24.068397521972656, 25.15640640258789, 26.244415283203125, 27.33242416381836, 28.42043113708496, 29.508440017700195, 30.59644889831543, 31.68445587158203, 32.772464752197266, 33.8604736328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 12.0, 8.0, 7.0, 10.0, 15.0, 12.0, 20.0, 27.0, 28.0, 38.0, 32.0, 41.0, 38.0, 32.0, 36.0, 33.0, 41.0, 31.0, 48.0, 29.0, 45.0, 45.0, 40.0, 33.0, 28.0, 43.0, 25.0, 31.0, 21.0, 23.0, 8.0, 20.0, 16.0, 15.0, 10.0, 12.0, 4.0, 12.0, 5.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.49609375, -5.31622314453125, -5.1363525390625, -4.95648193359375, -4.776611328125, -4.59674072265625, -4.4168701171875, -4.23699951171875, -4.05712890625, -3.87725830078125, -3.6973876953125, -3.51751708984375, -3.337646484375, -3.15777587890625, -2.9779052734375, -2.79803466796875, -2.6181640625, -2.43829345703125, -2.2584228515625, -2.07855224609375, -1.898681640625, -1.71881103515625, -1.5389404296875, -1.35906982421875, -1.17919921875, -0.99932861328125, -0.8194580078125, -0.63958740234375, -0.459716796875, -0.27984619140625, -0.0999755859375, 0.07989501953125, 0.259765625, 0.43963623046875, 0.6195068359375, 0.79937744140625, 0.979248046875, 1.15911865234375, 1.3389892578125, 1.51885986328125, 1.69873046875, 1.87860107421875, 2.0584716796875, 2.23834228515625, 2.418212890625, 2.59808349609375, 2.7779541015625, 2.95782470703125, 3.1376953125, 3.31756591796875, 3.4974365234375, 3.67730712890625, 3.857177734375, 4.03704833984375, 4.2169189453125, 4.39678955078125, 4.57666015625, 4.75653076171875, 4.9364013671875, 5.11627197265625, 5.296142578125, 5.47601318359375, 5.6558837890625, 5.83575439453125, 6.015625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 6.0, 12.0, 23.0, 25.0, 28.0, 47.0, 37.0, 56.0, 79.0, 98.0, 135.0, 157.0, 244.0, 321.0, 527.0, 803.0, 1399.0, 5190.0, 543685.0, 3604393.0, 31283.0, 2525.0, 1024.0, 626.0, 404.0, 263.0, 210.0, 178.0, 102.0, 86.0, 70.0, 47.0, 46.0, 29.0, 29.0, 21.0, 12.0, 11.0, 12.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.84375, -28.82421875, -27.8046875, -26.78515625, -25.765625, -24.74609375, -23.7265625, -22.70703125, -21.6875, -20.66796875, -19.6484375, -18.62890625, -17.609375, -16.58984375, -15.5703125, -14.55078125, -13.53125, -12.51171875, -11.4921875, -10.47265625, -9.453125, -8.43359375, -7.4140625, -6.39453125, -5.375, -4.35546875, -3.3359375, -2.31640625, -1.296875, -0.27734375, 0.7421875, 1.76171875, 2.78125, 3.80078125, 4.8203125, 5.83984375, 6.859375, 7.87890625, 8.8984375, 9.91796875, 10.9375, 11.95703125, 12.9765625, 13.99609375, 15.015625, 16.03515625, 17.0546875, 18.07421875, 19.09375, 20.11328125, 21.1328125, 22.15234375, 23.171875, 24.19140625, 25.2109375, 26.23046875, 27.25, 28.26953125, 29.2890625, 30.30859375, 31.328125, 32.34765625, 33.3671875, 34.38671875, 35.40625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 18.0, 19.0, 24.0, 40.0, 98.0, 160.0, 335.0, 590.0, 853.0, 806.0, 519.0, 290.0, 140.0, 66.0, 42.0, 23.0, 21.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.234375, -15.782958984375, -15.33154296875, -14.880126953125, -14.4287109375, -13.977294921875, -13.52587890625, -13.074462890625, -12.623046875, -12.171630859375, -11.72021484375, -11.268798828125, -10.8173828125, -10.365966796875, -9.91455078125, -9.463134765625, -9.01171875, -8.560302734375, -8.10888671875, -7.657470703125, -7.2060546875, -6.754638671875, -6.30322265625, -5.851806640625, -5.400390625, -4.948974609375, -4.49755859375, -4.046142578125, -3.5947265625, -3.143310546875, -2.69189453125, -2.240478515625, -1.7890625, -1.337646484375, -0.88623046875, -0.434814453125, 0.0166015625, 0.468017578125, 0.91943359375, 1.370849609375, 1.822265625, 2.273681640625, 2.72509765625, 3.176513671875, 3.6279296875, 4.079345703125, 4.53076171875, 4.982177734375, 5.43359375, 5.885009765625, 6.33642578125, 6.787841796875, 7.2392578125, 7.690673828125, 8.14208984375, 8.593505859375, 9.044921875, 9.496337890625, 9.94775390625, 10.399169921875, 10.8505859375, 11.302001953125, 11.75341796875, 12.204833984375, 12.65625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 8.0, 18.0, 27.0, 47.0, 101.0, 234.0, 522.0, 1296.0, 4476.0, 29440.0, 1028206.0, 3041436.0, 77940.0, 7320.0, 1904.0, 728.0, 299.0, 123.0, 49.0, 29.0, 20.0, 15.0, 10.0, 2.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.457763671875, -12.96240234375, -12.467041015625, -11.9716796875, -11.476318359375, -10.98095703125, -10.485595703125, -9.990234375, -9.494873046875, -8.99951171875, -8.504150390625, -8.0087890625, -7.513427734375, -7.01806640625, -6.522705078125, -6.02734375, -5.531982421875, -5.03662109375, -4.541259765625, -4.0458984375, -3.550537109375, -3.05517578125, -2.559814453125, -2.064453125, -1.569091796875, -1.07373046875, -0.578369140625, -0.0830078125, 0.412353515625, 0.90771484375, 1.403076171875, 1.8984375, 2.393798828125, 2.88916015625, 3.384521484375, 3.8798828125, 4.375244140625, 4.87060546875, 5.365966796875, 5.861328125, 6.356689453125, 6.85205078125, 7.347412109375, 7.8427734375, 8.338134765625, 8.83349609375, 9.328857421875, 9.82421875, 10.319580078125, 10.81494140625, 11.310302734375, 11.8056640625, 12.301025390625, 12.79638671875, 13.291748046875, 13.787109375, 14.282470703125, 14.77783203125, 15.273193359375, 15.7685546875, 16.263916015625, 16.75927734375, 17.254638671875, 17.75]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 14.0, 23.0, 49.0, 84.0, 106.0, 154.0, 145.0, 158.0, 97.0, 69.0, 42.0, 30.0, 12.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.885250091552734, -51.268924713134766, -48.65260314941406, -46.036277770996094, -43.419952392578125, -40.803627014160156, -38.18730545043945, -35.570980072021484, -32.95465850830078, -30.338335037231445, -27.722009658813477, -25.10568618774414, -22.489360809326172, -19.873037338256836, -17.2567138671875, -14.640388488769531, -12.024063110351562, -9.40773868560791, -6.791414737701416, -4.175090789794922, -1.5587663650512695, 1.0575580596923828, 3.6738815307617188, 6.2902069091796875, 8.906530380249023, 11.522854804992676, 14.139179229736328, 16.755502700805664, 19.371826171875, 21.98815155029297, 24.604475021362305, 27.220800399780273, 29.837127685546875, 32.453453063964844, 35.06977462768555, 37.686100006103516, 40.302425384521484, 42.91874694824219, 45.535072326660156, 48.151397705078125, 50.767723083496094, 53.38404846191406, 56.000370025634766, 58.616695404052734, 61.2330207824707, 63.849342346191406, 66.46566772460938, 69.08199310302734, 71.69831848144531, 74.31464385986328, 76.93096923828125, 79.54728698730469, 82.16361236572266, 84.77993774414062, 87.3962631225586, 90.01258850097656, 92.62890625, 95.24523162841797, 97.86155700683594, 100.47787475585938, 103.09420013427734, 105.71052551269531, 108.32685089111328, 110.94317626953125, 113.55950164794922]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 11.0, 15.0, 12.0, 10.0, 12.0, 20.0, 12.0, 25.0, 38.0, 31.0, 27.0, 40.0, 28.0, 38.0, 42.0, 39.0, 48.0, 41.0, 47.0, 27.0, 43.0, 43.0, 45.0, 53.0, 32.0, 29.0, 35.0, 20.0, 19.0, 18.0, 10.0, 23.0, 12.0, 8.0, 7.0, 8.0, 6.0, 4.0, 5.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.498497009277344, -31.512523651123047, -30.52655029296875, -29.540576934814453, -28.55460548400879, -27.568632125854492, -26.582658767700195, -25.5966854095459, -24.610713958740234, -23.624740600585938, -22.63876724243164, -21.652793884277344, -20.66682243347168, -19.680849075317383, -18.694875717163086, -17.70890235900879, -16.722929000854492, -15.736955642700195, -14.750983238220215, -13.765009880065918, -12.779037475585938, -11.79306411743164, -10.807090759277344, -9.821117401123047, -8.835144996643066, -7.849172115325928, -6.863199234008789, -5.877225875854492, -4.8912529945373535, -3.905280113220215, -2.919306755065918, -1.9333338737487793, -0.9473609924316406, 0.0386120080947876, 1.0245850086212158, 2.0105581283569336, 2.9965310096740723, 3.982503890991211, 4.968477249145508, 5.9544501304626465, 6.940423011779785, 7.926395893096924, 8.912368774414062, 9.89834213256836, 10.884315490722656, 11.870287895202637, 12.856261253356934, 13.842233657836914, 14.828207015991211, 15.814180374145508, 16.800153732299805, 17.78612518310547, 18.772098541259766, 19.758071899414062, 20.74404525756836, 21.730018615722656, 22.715991973876953, 23.70196533203125, 24.687938690185547, 25.673912048339844, 26.659883499145508, 27.645856857299805, 28.6318302154541, 29.6178035736084, 30.603775024414062]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 8.0, 9.0, 12.0, 13.0, 16.0, 15.0, 21.0, 22.0, 25.0, 35.0, 30.0, 46.0, 31.0, 41.0, 34.0, 42.0, 50.0, 49.0, 27.0, 45.0, 53.0, 51.0, 38.0, 26.0, 37.0, 41.0, 23.0, 24.0, 25.0, 13.0, 20.0, 9.0, 9.0, 11.0, 5.0, 8.0, 4.0, 2.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-58.78125, -57.125, -55.46875, -53.8125, -52.15625, -50.5, -48.84375, -47.1875, -45.53125, -43.875, -42.21875, -40.5625, -38.90625, -37.25, -35.59375, -33.9375, -32.28125, -30.625, -28.96875, -27.3125, -25.65625, -24.0, -22.34375, -20.6875, -19.03125, -17.375, -15.71875, -14.0625, -12.40625, -10.75, -9.09375, -7.4375, -5.78125, -4.125, -2.46875, -0.8125, 0.84375, 2.5, 4.15625, 5.8125, 7.46875, 9.125, 10.78125, 12.4375, 14.09375, 15.75, 17.40625, 19.0625, 20.71875, 22.375, 24.03125, 25.6875, 27.34375, 29.0, 30.65625, 32.3125, 33.96875, 35.625, 37.28125, 38.9375, 40.59375, 42.25, 43.90625, 45.5625, 47.21875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 19.0, 23.0, 30.0, 57.0, 88.0, 105.0, 160.0, 277.0, 429.0, 631.0, 981.0, 1503.0, 2290.0, 3632.0, 5645.0, 9074.0, 14748.0, 24521.0, 41020.0, 71545.0, 138227.0, 359680.0, 170974.0, 83221.0, 46981.0, 27783.0, 16878.0, 10342.0, 6330.0, 3998.0, 2521.0, 1677.0, 1083.0, 692.0, 470.0, 311.0, 202.0, 134.0, 83.0, 69.0, 34.0, 27.0, 16.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.1817626953125, -10.816650390625, -10.4515380859375, -10.08642578125, -9.7213134765625, -9.356201171875, -8.9910888671875, -8.6259765625, -8.2608642578125, -7.895751953125, -7.5306396484375, -7.16552734375, -6.8004150390625, -6.435302734375, -6.0701904296875, -5.705078125, -5.3399658203125, -4.974853515625, -4.6097412109375, -4.24462890625, -3.8795166015625, -3.514404296875, -3.1492919921875, -2.7841796875, -2.4190673828125, -2.053955078125, -1.6888427734375, -1.32373046875, -0.9586181640625, -0.593505859375, -0.2283935546875, 0.13671875, 0.5018310546875, 0.866943359375, 1.2320556640625, 1.59716796875, 1.9622802734375, 2.327392578125, 2.6925048828125, 3.0576171875, 3.4227294921875, 3.787841796875, 4.1529541015625, 4.51806640625, 4.8831787109375, 5.248291015625, 5.6134033203125, 5.978515625, 6.3436279296875, 6.708740234375, 7.0738525390625, 7.43896484375, 7.8040771484375, 8.169189453125, 8.5343017578125, 8.8994140625, 9.2645263671875, 9.629638671875, 9.9947509765625, 10.35986328125, 10.7249755859375, 11.090087890625, 11.4552001953125, 11.8203125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 4.0, 7.0, 8.0, 8.0, 12.0, 11.0, 11.0, 16.0, 20.0, 15.0, 21.0, 22.0, 30.0, 24.0, 35.0, 28.0, 36.0, 40.0, 36.0, 44.0, 31.0, 33.0, 1053.0, 30.0, 41.0, 51.0, 32.0, 36.0, 31.0, 26.0, 36.0, 22.0, 31.0, 24.0, 22.0, 25.0, 13.0, 12.0, 9.0, 5.0, 8.0, 3.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.109375, -27.172607421875, -26.23583984375, -25.299072265625, -24.3623046875, -23.425537109375, -22.48876953125, -21.552001953125, -20.615234375, -19.678466796875, -18.74169921875, -17.804931640625, -16.8681640625, -15.931396484375, -14.99462890625, -14.057861328125, -13.12109375, -12.184326171875, -11.24755859375, -10.310791015625, -9.3740234375, -8.437255859375, -7.50048828125, -6.563720703125, -5.626953125, -4.690185546875, -3.75341796875, -2.816650390625, -1.8798828125, -0.943115234375, -0.00634765625, 0.930419921875, 1.8671875, 2.803955078125, 3.74072265625, 4.677490234375, 5.6142578125, 6.551025390625, 7.48779296875, 8.424560546875, 9.361328125, 10.298095703125, 11.23486328125, 12.171630859375, 13.1083984375, 14.045166015625, 14.98193359375, 15.918701171875, 16.85546875, 17.792236328125, 18.72900390625, 19.665771484375, 20.6025390625, 21.539306640625, 22.47607421875, 23.412841796875, 24.349609375, 25.286376953125, 26.22314453125, 27.159912109375, 28.0966796875, 29.033447265625, 29.97021484375, 30.906982421875, 31.84375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 9.0, 4.0, 7.0, 20.0, 21.0, 29.0, 28.0, 46.0, 84.0, 92.0, 137.0, 223.0, 325.0, 486.0, 747.0, 1266.0, 1913.0, 3156.0, 4824.0, 7897.0, 12776.0, 21550.0, 36454.0, 64890.0, 122692.0, 1365933.0, 220241.0, 98654.0, 54378.0, 30995.0, 18198.0, 10855.0, 6677.0, 4074.0, 2488.0, 1651.0, 1156.0, 703.0, 494.0, 313.0, 236.0, 140.0, 87.0, 69.0, 38.0, 29.0, 16.0, 17.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-13.0625, -12.676513671875, -12.29052734375, -11.904541015625, -11.5185546875, -11.132568359375, -10.74658203125, -10.360595703125, -9.974609375, -9.588623046875, -9.20263671875, -8.816650390625, -8.4306640625, -8.044677734375, -7.65869140625, -7.272705078125, -6.88671875, -6.500732421875, -6.11474609375, -5.728759765625, -5.3427734375, -4.956787109375, -4.57080078125, -4.184814453125, -3.798828125, -3.412841796875, -3.02685546875, -2.640869140625, -2.2548828125, -1.868896484375, -1.48291015625, -1.096923828125, -0.7109375, -0.324951171875, 0.06103515625, 0.447021484375, 0.8330078125, 1.218994140625, 1.60498046875, 1.990966796875, 2.376953125, 2.762939453125, 3.14892578125, 3.534912109375, 3.9208984375, 4.306884765625, 4.69287109375, 5.078857421875, 5.46484375, 5.850830078125, 6.23681640625, 6.622802734375, 7.0087890625, 7.394775390625, 7.78076171875, 8.166748046875, 8.552734375, 8.938720703125, 9.32470703125, 9.710693359375, 10.0966796875, 10.482666015625, 10.86865234375, 11.254638671875, 11.640625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 11.0, 15.0, 13.0, 19.0, 24.0, 17.0, 35.0, 44.0, 53.0, 73.0, 141.0, 133.0, 119.0, 87.0, 31.0, 28.0, 26.0, 25.0, 17.0, 13.0, 10.0, 11.0, 6.0, 9.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01409912109375, -0.013649225234985352, -0.013199329376220703, -0.012749433517456055, -0.012299537658691406, -0.011849641799926758, -0.01139974594116211, -0.010949850082397461, -0.010499954223632812, -0.010050058364868164, -0.009600162506103516, -0.009150266647338867, -0.008700370788574219, -0.00825047492980957, -0.007800579071044922, -0.0073506832122802734, -0.006900787353515625, -0.0064508914947509766, -0.006000995635986328, -0.00555109977722168, -0.005101203918457031, -0.004651308059692383, -0.004201412200927734, -0.003751516342163086, -0.0033016204833984375, -0.002851724624633789, -0.0024018287658691406, -0.0019519329071044922, -0.0015020370483398438, -0.0010521411895751953, -0.0006022453308105469, -0.00015234947204589844, 0.00029754638671875, 0.0007474422454833984, 0.0011973381042480469, 0.0016472339630126953, 0.0020971298217773438, 0.002547025680541992, 0.0029969215393066406, 0.003446817398071289, 0.0038967132568359375, 0.004346609115600586, 0.004796504974365234, 0.005246400833129883, 0.005696296691894531, 0.00614619255065918, 0.006596088409423828, 0.0070459842681884766, 0.007495880126953125, 0.007945775985717773, 0.008395671844482422, 0.00884556770324707, 0.009295463562011719, 0.009745359420776367, 0.010195255279541016, 0.010645151138305664, 0.011095046997070312, 0.011544942855834961, 0.01199483871459961, 0.012444734573364258, 0.012894630432128906, 0.013344526290893555, 0.013794422149658203, 0.014244318008422852, 0.0146942138671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 6.0, 14.0, 12.0, 20.0, 36.0, 34.0, 64.0, 60.0, 96.0, 157.0, 225.0, 358.0, 648.0, 1281.0, 3201.0, 10472.0, 45642.0, 390281.0, 521284.0, 55642.0, 12110.0, 3631.0, 1389.0, 701.0, 374.0, 219.0, 168.0, 103.0, 98.0, 40.0, 41.0, 38.0, 22.0, 15.0, 16.0, 13.0, 4.0, 5.0, 9.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0838623046875, -0.08132553100585938, -0.07878875732421875, -0.07625198364257812, -0.0737152099609375, -0.07117843627929688, -0.06864166259765625, -0.06610488891601562, -0.063568115234375, -0.061031341552734375, -0.05849456787109375, -0.055957794189453125, -0.0534210205078125, -0.050884246826171875, -0.04834747314453125, -0.045810699462890625, -0.04327392578125, -0.040737152099609375, -0.03820037841796875, -0.035663604736328125, -0.0331268310546875, -0.030590057373046875, -0.02805328369140625, -0.025516510009765625, -0.022979736328125, -0.020442962646484375, -0.01790618896484375, -0.015369415283203125, -0.0128326416015625, -0.010295867919921875, -0.00775909423828125, -0.005222320556640625, -0.002685546875, -0.000148773193359375, 0.00238800048828125, 0.004924774169921875, 0.0074615478515625, 0.009998321533203125, 0.01253509521484375, 0.015071868896484375, 0.017608642578125, 0.020145416259765625, 0.02268218994140625, 0.025218963623046875, 0.0277557373046875, 0.030292510986328125, 0.03282928466796875, 0.035366058349609375, 0.03790283203125, 0.040439605712890625, 0.04297637939453125, 0.045513153076171875, 0.0480499267578125, 0.050586700439453125, 0.05312347412109375, 0.055660247802734375, 0.058197021484375, 0.060733795166015625, 0.06327056884765625, 0.06580734252929688, 0.0683441162109375, 0.07088088989257812, 0.07341766357421875, 0.07595443725585938, 0.0784912109375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 14.0, 41.0, 58.0, 103.0, 146.0, 193.0, 170.0, 107.0, 67.0, 49.0, 23.0, 5.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01397439930588007, -0.013517401181161404, -0.013060402125120163, -0.012603404000401497, -0.012146404944360256, -0.01168940681964159, -0.01123240776360035, -0.010775409638881683, -0.010318411514163017, -0.009861413389444351, -0.00940441433340311, -0.008947416208684444, -0.008490417152643204, -0.008033419027924538, -0.007576420437544584, -0.007119421847164631, -0.0066624232567846775, -0.006205424666404724, -0.005748426076024771, -0.005291427485644817, -0.004834429360926151, -0.004377430770546198, -0.0039204321801662445, -0.0034634338226169348, -0.0030064352322369814, -0.002549436641857028, -0.0020924382843077183, -0.001635439693927765, -0.0011784412199631333, -0.0007214427459985018, -0.0002644441556185484, 0.00019255420193076134, 0.0006495527923107147, 0.0011065512662753463, 0.0015635497402399778, 0.0020205483306199312, 0.002477546688169241, 0.0029345452785491943, 0.0033915438689291477, 0.0038485422264784575, 0.004305540584027767, 0.0047625391744077206, 0.005219537764787674, 0.00567653588950634, 0.006133534479886293, 0.006590533070266247, 0.0070475316606462, 0.0075045302510261536, 0.00796152837574482, 0.008418526500463486, 0.008875525556504726, 0.009332523681223392, 0.009789522737264633, 0.0102465208619833, 0.010703518986701965, 0.011160518042743206, 0.011617517098784447, 0.012074515223503113, 0.012531514279544353, 0.01298851240426302, 0.01344551146030426, 0.013902509585022926, 0.014359507709741592, 0.014816506765782833, 0.0152735048905015]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 3.0, 4.0, 7.0, 4.0, 10.0, 3.0, 5.0, 7.0, 12.0, 18.0, 22.0, 13.0, 22.0, 29.0, 25.0, 31.0, 35.0, 24.0, 28.0, 32.0, 39.0, 53.0, 50.0, 38.0, 39.0, 44.0, 40.0, 29.0, 42.0, 43.0, 30.0, 22.0, 21.0, 16.0, 27.0, 24.0, 25.0, 16.0, 11.0, 10.0, 15.0, 9.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005554914474487305, -0.00538150779902935, -0.005208101123571396, -0.0050346944481134415, -0.004861287772655487, -0.004687881097197533, -0.004514474421739578, -0.004341067746281624, -0.004167661070823669, -0.003994254395365715, -0.0038208477199077606, -0.003647441044449806, -0.003474034368991852, -0.0033006276935338974, -0.003127221018075943, -0.0029538143426179886, -0.002780407667160034, -0.0026070009917020798, -0.0024335943162441254, -0.002260187640786171, -0.0020867809653282166, -0.0019133742898702621, -0.0017399676144123077, -0.0015665609389543533, -0.001393154263496399, -0.0012197475880384445, -0.0010463409125804901, -0.0008729342371225357, -0.0006995275616645813, -0.0005261208862066269, -0.0003527142107486725, -0.00017930753529071808, -5.900859832763672e-06, 0.00016750581562519073, 0.00034091249108314514, 0.0005143191665410995, 0.000687725841999054, 0.0008611325174570084, 0.0010345391929149628, 0.0012079458683729172, 0.0013813525438308716, 0.001554759219288826, 0.0017281658947467804, 0.0019015725702047348, 0.002074979245662689, 0.0022483859211206436, 0.002421792596578598, 0.0025951992720365524, 0.002768605947494507, 0.0029420126229524612, 0.0031154192984104156, 0.00328882597386837, 0.0034622326493263245, 0.003635639324784279, 0.0038090460002422333, 0.003982452675700188, 0.004155859351158142, 0.0043292660266160965, 0.004502672702074051, 0.004676079377532005, 0.00484948605298996, 0.005022892728447914, 0.0051962994039058685, 0.005369706079363823, 0.005543112754821777]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 8.0, 9.0, 12.0, 13.0, 16.0, 16.0, 20.0, 22.0, 25.0, 35.0, 31.0, 45.0, 31.0, 40.0, 35.0, 42.0, 50.0, 49.0, 26.0, 46.0, 53.0, 51.0, 38.0, 25.0, 38.0, 41.0, 24.0, 23.0, 26.0, 12.0, 19.0, 10.0, 9.0, 12.0, 4.0, 8.0, 4.0, 2.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-58.78125, -57.125, -55.46875, -53.8125, -52.15625, -50.5, -48.84375, -47.1875, -45.53125, -43.875, -42.21875, -40.5625, -38.90625, -37.25, -35.59375, -33.9375, -32.28125, -30.625, -28.96875, -27.3125, -25.65625, -24.0, -22.34375, -20.6875, -19.03125, -17.375, -15.71875, -14.0625, -12.40625, -10.75, -9.09375, -7.4375, -5.78125, -4.125, -2.46875, -0.8125, 0.84375, 2.5, 4.15625, 5.8125, 7.46875, 9.125, 10.78125, 12.4375, 14.09375, 15.75, 17.40625, 19.0625, 20.71875, 22.375, 24.03125, 25.6875, 27.34375, 29.0, 30.65625, 32.3125, 33.96875, 35.625, 37.28125, 38.9375, 40.59375, 42.25, 43.90625, 45.5625, 47.21875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 0.0, 0.0, 11.0, 4.0, 7.0, 10.0, 19.0, 21.0, 32.0, 48.0, 62.0, 86.0, 139.0, 210.0, 365.0, 724.0, 1256.0, 2651.0, 6187.0, 18908.0, 84961.0, 463472.0, 377346.0, 66016.0, 15549.0, 5377.0, 2373.0, 1098.0, 625.0, 357.0, 220.0, 126.0, 97.0, 51.0, 40.0, 26.0, 25.0, 15.0, 13.0, 8.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.375, -11.9991455078125, -11.623291015625, -11.2474365234375, -10.87158203125, -10.4957275390625, -10.119873046875, -9.7440185546875, -9.3681640625, -8.9923095703125, -8.616455078125, -8.2406005859375, -7.86474609375, -7.4888916015625, -7.113037109375, -6.7371826171875, -6.361328125, -5.9854736328125, -5.609619140625, -5.2337646484375, -4.85791015625, -4.4820556640625, -4.106201171875, -3.7303466796875, -3.3544921875, -2.9786376953125, -2.602783203125, -2.2269287109375, -1.85107421875, -1.4752197265625, -1.099365234375, -0.7235107421875, -0.34765625, 0.0281982421875, 0.404052734375, 0.7799072265625, 1.15576171875, 1.5316162109375, 1.907470703125, 2.2833251953125, 2.6591796875, 3.0350341796875, 3.410888671875, 3.7867431640625, 4.16259765625, 4.5384521484375, 4.914306640625, 5.2901611328125, 5.666015625, 6.0418701171875, 6.417724609375, 6.7935791015625, 7.16943359375, 7.5452880859375, 7.921142578125, 8.2969970703125, 8.6728515625, 9.0487060546875, 9.424560546875, 9.8004150390625, 10.17626953125, 10.5521240234375, 10.927978515625, 11.3038330078125, 11.6796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 6.0, 15.0, 29.0, 33.0, 36.0, 58.0, 57.0, 70.0, 69.0, 1781.0, 445.0, 93.0, 69.0, 66.0, 53.0, 49.0, 42.0, 21.0, 14.0, 9.0, 10.0, 6.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.9375, -123.5205078125, -119.103515625, -114.6865234375, -110.26953125, -105.8525390625, -101.435546875, -97.0185546875, -92.6015625, -88.1845703125, -83.767578125, -79.3505859375, -74.93359375, -70.5166015625, -66.099609375, -61.6826171875, -57.265625, -52.8486328125, -48.431640625, -44.0146484375, -39.59765625, -35.1806640625, -30.763671875, -26.3466796875, -21.9296875, -17.5126953125, -13.095703125, -8.6787109375, -4.26171875, 0.1552734375, 4.572265625, 8.9892578125, 13.40625, 17.8232421875, 22.240234375, 26.6572265625, 31.07421875, 35.4912109375, 39.908203125, 44.3251953125, 48.7421875, 53.1591796875, 57.576171875, 61.9931640625, 66.41015625, 70.8271484375, 75.244140625, 79.6611328125, 84.078125, 88.4951171875, 92.912109375, 97.3291015625, 101.74609375, 106.1630859375, 110.580078125, 114.9970703125, 119.4140625, 123.8310546875, 128.248046875, 132.6650390625, 137.08203125, 141.4990234375, 145.916015625, 150.3330078125, 154.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 9.0, 10.0, 18.0, 19.0, 26.0, 42.0, 64.0, 80.0, 111.0, 200.0, 332.0, 498.0, 929.0, 1871.0, 7691.0, 103064.0, 2915671.0, 103053.0, 7723.0, 2004.0, 867.0, 490.0, 328.0, 191.0, 147.0, 77.0, 52.0, 40.0, 26.0, 21.0, 13.0, 4.0, 7.0, 2.0, 5.0, 0.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.78125, -23.111328125, -22.44140625, -21.771484375, -21.1015625, -20.431640625, -19.76171875, -19.091796875, -18.421875, -17.751953125, -17.08203125, -16.412109375, -15.7421875, -15.072265625, -14.40234375, -13.732421875, -13.0625, -12.392578125, -11.72265625, -11.052734375, -10.3828125, -9.712890625, -9.04296875, -8.373046875, -7.703125, -7.033203125, -6.36328125, -5.693359375, -5.0234375, -4.353515625, -3.68359375, -3.013671875, -2.34375, -1.673828125, -1.00390625, -0.333984375, 0.3359375, 1.005859375, 1.67578125, 2.345703125, 3.015625, 3.685546875, 4.35546875, 5.025390625, 5.6953125, 6.365234375, 7.03515625, 7.705078125, 8.375, 9.044921875, 9.71484375, 10.384765625, 11.0546875, 11.724609375, 12.39453125, 13.064453125, 13.734375, 14.404296875, 15.07421875, 15.744140625, 16.4140625, 17.083984375, 17.75390625, 18.423828125, 19.09375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 31.0, 56.0, 177.0, 320.0, 234.0, 107.0, 34.0, 16.0, 9.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.5985107421875, -236.3458251953125, -228.09315490722656, -219.84046936035156, -211.58779907226562, -203.33511352539062, -195.08242797851562, -186.82974243164062, -178.5770721435547, -170.3243865966797, -162.07171630859375, -153.81903076171875, -145.56634521484375, -137.3136749267578, -129.0609893798828, -120.80831146240234, -112.55563354492188, -104.3029556274414, -96.05027770996094, -87.79759216308594, -79.54491424560547, -71.292236328125, -63.039554595947266, -54.78687286376953, -46.53419494628906, -38.281517028808594, -30.02883529663086, -21.776155471801758, -13.523475646972656, -5.2707977294921875, 2.981884002685547, 11.234565734863281, 19.487213134765625, 27.739892959594727, 35.99257278442383, 44.24525451660156, 52.49793243408203, 60.7506103515625, 69.0032958984375, 77.25597381591797, 85.50865173339844, 93.7613296508789, 102.01400756835938, 110.26669311523438, 118.51937103271484, 126.77204895019531, 135.0247344970703, 143.27740478515625, 151.53009033203125, 159.78277587890625, 168.0354461669922, 176.2881317138672, 184.54080200195312, 192.79348754882812, 201.04617309570312, 209.29885864257812, 217.55152893066406, 225.80421447753906, 234.056884765625, 242.3095703125, 250.562255859375, 258.81494140625, 267.0675964355469, 275.3202819824219, 283.5729675292969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 13.0, 16.0, 18.0, 27.0, 41.0, 37.0, 38.0, 38.0, 46.0, 51.0, 59.0, 60.0, 51.0, 56.0, 66.0, 46.0, 48.0, 44.0, 30.0, 35.0, 23.0, 23.0, 19.0, 15.0, 13.0, 16.0, 11.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.2759780883789, -110.3872299194336, -106.49848937988281, -102.6097412109375, -98.72099304199219, -94.83224487304688, -90.94349670410156, -87.05475616455078, -83.16600799560547, -79.27725982666016, -75.38851928710938, -71.49977111816406, -67.61102294921875, -63.72227478027344, -59.83353042602539, -55.944786071777344, -52.05603790283203, -48.16728973388672, -44.27854537963867, -40.389801025390625, -36.50105285644531, -32.6123046875, -28.723560333251953, -24.834814071655273, -20.946067810058594, -17.057321548461914, -13.168575286865234, -9.279829025268555, -5.391082763671875, -1.5023365020751953, 2.3864097595214844, 6.275156021118164, 10.163894653320312, 14.052640914916992, 17.941387176513672, 21.83013343811035, 25.71887969970703, 29.60762596130371, 33.49637222290039, 37.38511657714844, 41.27386474609375, 45.16261291503906, 49.05135726928711, 52.940101623535156, 56.82884979248047, 60.71759796142578, 64.60633850097656, 68.49508666992188, 72.38383483886719, 76.2725830078125, 80.16133117675781, 84.0500717163086, 87.9388198852539, 91.82756805419922, 95.71630859375, 99.60505676269531, 103.49380493164062, 107.38255310058594, 111.27130126953125, 115.16004180908203, 119.04878997802734, 122.93753814697266, 126.82627868652344, 130.71502685546875, 134.60377502441406]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 11.0, 12.0, 18.0, 22.0, 26.0, 42.0, 57.0, 88.0, 116.0, 195.0, 303.0, 452.0, 635.0, 1072.0, 1629.0, 2534.0, 3845.0, 5803.0, 1020115.0, 4063.0, 2544.0, 1664.0, 1132.0, 761.0, 450.0, 284.0, 210.0, 144.0, 86.0, 63.0, 36.0, 36.0, 25.0, 17.0, 9.0, 10.0, 7.0, 10.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-26.637210845947266, -25.898723602294922, -25.160236358642578, -24.421749114990234, -23.68326187133789, -22.944774627685547, -22.206287384033203, -21.46780014038086, -20.729312896728516, -19.990825653076172, -19.252338409423828, -18.513851165771484, -17.77536392211914, -17.036876678466797, -16.298389434814453, -15.55990219116211, -14.821415901184082, -14.082928657531738, -13.344441413879395, -12.60595417022705, -11.867466926574707, -11.128979682922363, -10.390493392944336, -9.652006149291992, -8.913518905639648, -8.175031661987305, -7.436544418334961, -6.698057174682617, -5.959569931030273, -5.22108268737793, -4.482595920562744, -3.7441086769104004, -3.0056209564208984, -2.2671337127685547, -1.5286465883255005, -0.7901594638824463, -0.05167222023010254, 0.6868150234222412, 1.4253020286560059, 2.1637892723083496, 2.9022765159606934, 3.640763759613037, 4.379251003265381, 5.117737770080566, 5.85622501373291, 6.594712257385254, 7.333199501037598, 8.071686744689941, 8.810173988342285, 9.548661231994629, 10.287148475646973, 11.025635719299316, 11.76412296295166, 12.502610206604004, 13.241096496582031, 13.979583740234375, 14.718070983886719, 15.456558227539062, 16.195045471191406, 16.93353271484375, 17.672019958496094, 18.410507202148438, 19.14899444580078, 19.887481689453125, 20.62596893310547]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 10.0, 5.0, 16.0, 44.0, 48.0, 78.0, 355.0, 51462120.0, 231.0, 89.0, 24.0, 21.0, 16.0, 22.0, 20.0, 17.0, 21.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8247.9609375, -7994.0458984375, -7740.13037109375, -7486.21533203125, -7232.2998046875, -6978.384765625, -6724.4697265625, -6470.5546875, -6216.63916015625, -5962.72412109375, -5708.80859375, -5454.8935546875, -5200.978515625, -4947.06298828125, -4693.14794921875, -4439.232421875, -4185.3173828125, -3931.402099609375, -3677.48681640625, -3423.57177734375, -3169.656494140625, -2915.7412109375, -2661.826171875, -2407.910888671875, -2153.99560546875, -1900.080322265625, -1646.1651611328125, -1392.25, -1138.334716796875, -884.41943359375, -630.5042724609375, -376.589111328125, -122.67333984375, 131.24188232421875, 385.1571044921875, 639.0723266601562, 892.987548828125, 1146.90283203125, 1400.8179931640625, 1654.733154296875, 1908.6484375, 2162.563720703125, 2416.47900390625, 2670.39404296875, 2924.309326171875, 3178.224609375, 3432.1396484375, 3686.054931640625, 3939.97021484375, 4193.88525390625, 4447.80078125, 4701.7158203125, 4955.630859375, 5209.54638671875, 5463.46142578125, 5717.376953125, 5971.2919921875, 6225.20703125, 6479.12255859375, 6733.03759765625, 6986.953125, 7240.8681640625, 7494.783203125, 7748.6982421875, 8002.61376953125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 3.0, 12.0, 22.0, 28.0, 34.0, 46.0, 79.0, 117.0, 175.0, 261.0, 344.0, 485.0, 734.0, 1064.0, 1455.0, 2309.0, 3058.0, 4636.0, 6736.0, 9847.0, 14510.0, 22155.0, 32900.0, 50738.0, 78129.0, 127197.0, 215189.0, 440147.0, 3874563.0, 714150.0, 267705.0, 152500.0, 93010.0, 59932.0, 38481.0, 25382.0, 16725.0, 11482.0, 7755.0, 5409.0, 3608.0, 2622.0, 1739.0, 1273.0, 836.0, 598.0, 365.0, 253.0, 251.0, 137.0, 75.0, 65.0, 34.0, 31.0, 25.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0], "bins": [-4.69140625, -4.5433349609375, -4.395263671875, -4.2471923828125, -4.09912109375, -3.9510498046875, -3.802978515625, -3.6549072265625, -3.5068359375, -3.3587646484375, -3.210693359375, -3.0626220703125, -2.91455078125, -2.7664794921875, -2.618408203125, -2.4703369140625, -2.322265625, -2.1741943359375, -2.026123046875, -1.8780517578125, -1.72998046875, -1.5819091796875, -1.433837890625, -1.2857666015625, -1.1376953125, -0.9896240234375, -0.841552734375, -0.6934814453125, -0.54541015625, -0.3973388671875, -0.249267578125, -0.1011962890625, 0.046875, 0.1949462890625, 0.343017578125, 0.4910888671875, 0.63916015625, 0.7872314453125, 0.935302734375, 1.0833740234375, 1.2314453125, 1.3795166015625, 1.527587890625, 1.6756591796875, 1.82373046875, 1.9718017578125, 2.119873046875, 2.2679443359375, 2.416015625, 2.5640869140625, 2.712158203125, 2.8602294921875, 3.00830078125, 3.1563720703125, 3.304443359375, 3.4525146484375, 3.6005859375, 3.7486572265625, 3.896728515625, 4.0447998046875, 4.19287109375, 4.3409423828125, 4.489013671875, 4.6370849609375, 4.78515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 9.0, 7.0, 12.0, 14.0, 8.0, 22.0, 12.0, 17.0, 29.0, 38.0, 25.0, 32.0, 30.0, 39.0, 38.0, 38.0, 51.0, 112.0, 489.0, 420.0, 119.0, 78.0, 50.0, 27.0, 37.0, 28.0, 33.0, 32.0, 34.0, 34.0, 15.0, 21.0, 14.0, 6.0, 13.0, 7.0, 9.0, 5.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4140625, -11.0677490234375, -10.721435546875, -10.3751220703125, -10.02880859375, -9.6824951171875, -9.336181640625, -8.9898681640625, -8.6435546875, -8.2972412109375, -7.950927734375, -7.6046142578125, -7.25830078125, -6.9119873046875, -6.565673828125, -6.2193603515625, -5.873046875, -5.5267333984375, -5.180419921875, -4.8341064453125, -4.48779296875, -4.1414794921875, -3.795166015625, -3.4488525390625, -3.1025390625, -2.7562255859375, -2.409912109375, -2.0635986328125, -1.71728515625, -1.3709716796875, -1.024658203125, -0.6783447265625, -0.33203125, 0.0142822265625, 0.360595703125, 0.7069091796875, 1.05322265625, 1.3995361328125, 1.745849609375, 2.0921630859375, 2.4384765625, 2.7847900390625, 3.131103515625, 3.4774169921875, 3.82373046875, 4.1700439453125, 4.516357421875, 4.8626708984375, 5.208984375, 5.5552978515625, 5.901611328125, 6.2479248046875, 6.59423828125, 6.9405517578125, 7.286865234375, 7.6331787109375, 7.9794921875, 8.3258056640625, 8.672119140625, 9.0184326171875, 9.36474609375, 9.7110595703125, 10.057373046875, 10.4036865234375, 10.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 13.0, 16.0, 5.0, 25.0, 35.0, 55.0, 71.0, 118.0, 220.0, 308.0, 479.0, 666.0, 971.0, 1348.0, 1795.0, 2952.0, 4595.0, 6967.0, 10305.0, 14677.0, 22015.0, 33608.0, 54609.0, 86491.0, 148523.0, 283714.0, 805877.0, 3790786.0, 482128.0, 215769.0, 120129.0, 72001.0, 43642.0, 29207.0, 19466.0, 12282.0, 8026.0, 5714.0, 3957.0, 2626.0, 1869.0, 1104.0, 764.0, 513.0, 346.0, 214.0, 120.0, 78.0, 85.0, 41.0, 29.0, 37.0, 11.0, 18.0, 6.0, 2.0, 3.0, 11.0], "bins": [-5.37109375, -5.2098388671875, -5.048583984375, -4.8873291015625, -4.72607421875, -4.5648193359375, -4.403564453125, -4.2423095703125, -4.0810546875, -3.9197998046875, -3.758544921875, -3.5972900390625, -3.43603515625, -3.2747802734375, -3.113525390625, -2.9522705078125, -2.791015625, -2.6297607421875, -2.468505859375, -2.3072509765625, -2.14599609375, -1.9847412109375, -1.823486328125, -1.6622314453125, -1.5009765625, -1.3397216796875, -1.178466796875, -1.0172119140625, -0.85595703125, -0.6947021484375, -0.533447265625, -0.3721923828125, -0.2109375, -0.0496826171875, 0.111572265625, 0.2728271484375, 0.43408203125, 0.5953369140625, 0.756591796875, 0.9178466796875, 1.0791015625, 1.2403564453125, 1.401611328125, 1.5628662109375, 1.72412109375, 1.8853759765625, 2.046630859375, 2.2078857421875, 2.369140625, 2.5303955078125, 2.691650390625, 2.8529052734375, 3.01416015625, 3.1754150390625, 3.336669921875, 3.4979248046875, 3.6591796875, 3.8204345703125, 3.981689453125, 4.1429443359375, 4.30419921875, 4.4654541015625, 4.626708984375, 4.7879638671875, 4.94921875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 6.0, 8.0, 8.0, 8.0, 12.0, 13.0, 8.0, 8.0, 14.0, 22.0, 26.0, 27.0, 20.0, 37.0, 31.0, 31.0, 43.0, 48.0, 58.0, 89.0, 199.0, 579.0, 195.0, 94.0, 63.0, 39.0, 50.0, 36.0, 42.0, 29.0, 22.0, 21.0, 17.0, 18.0, 19.0, 17.0, 18.0, 9.0, 11.0, 6.0, 7.0, 5.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.0390625, -7.7984619140625, -7.557861328125, -7.3172607421875, -7.07666015625, -6.8360595703125, -6.595458984375, -6.3548583984375, -6.1142578125, -5.8736572265625, -5.633056640625, -5.3924560546875, -5.15185546875, -4.9112548828125, -4.670654296875, -4.4300537109375, -4.189453125, -3.9488525390625, -3.708251953125, -3.4676513671875, -3.22705078125, -2.9864501953125, -2.745849609375, -2.5052490234375, -2.2646484375, -2.0240478515625, -1.783447265625, -1.5428466796875, -1.30224609375, -1.0616455078125, -0.821044921875, -0.5804443359375, -0.33984375, -0.0992431640625, 0.141357421875, 0.3819580078125, 0.62255859375, 0.8631591796875, 1.103759765625, 1.3443603515625, 1.5849609375, 1.8255615234375, 2.066162109375, 2.3067626953125, 2.54736328125, 2.7879638671875, 3.028564453125, 3.2691650390625, 3.509765625, 3.7503662109375, 3.990966796875, 4.2315673828125, 4.47216796875, 4.7127685546875, 4.953369140625, 5.1939697265625, 5.4345703125, 5.6751708984375, 5.915771484375, 6.1563720703125, 6.39697265625, 6.6375732421875, 6.878173828125, 7.1187744140625, 7.359375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 6.0, 3.0, 0.0, 13.0, 21.0, 20.0, 44.0, 35.0, 39.0, 75.0, 62.0, 98.0, 152.0, 206.0, 303.0, 348.0, 416.0, 719.0, 1019.0, 1409.0, 2710.0, 4214.0, 8607.0, 18882.0, 60060.0, 5808777.0, 304903.0, 44994.0, 15539.0, 6999.0, 3710.0, 2218.0, 1505.0, 949.0, 638.0, 474.0, 275.0, 302.0, 202.0, 103.0, 94.0, 74.0, 30.0, 41.0, 36.0, 31.0, 14.0, 16.0, 23.0, 11.0, 6.0, 13.0, 0.0, 0.0, 0.0, 6.0], "bins": [-20.1875, -19.591796875, -18.99609375, -18.400390625, -17.8046875, -17.208984375, -16.61328125, -16.017578125, -15.421875, -14.826171875, -14.23046875, -13.634765625, -13.0390625, -12.443359375, -11.84765625, -11.251953125, -10.65625, -10.060546875, -9.46484375, -8.869140625, -8.2734375, -7.677734375, -7.08203125, -6.486328125, -5.890625, -5.294921875, -4.69921875, -4.103515625, -3.5078125, -2.912109375, -2.31640625, -1.720703125, -1.125, -0.529296875, 0.06640625, 0.662109375, 1.2578125, 1.853515625, 2.44921875, 3.044921875, 3.640625, 4.236328125, 4.83203125, 5.427734375, 6.0234375, 6.619140625, 7.21484375, 7.810546875, 8.40625, 9.001953125, 9.59765625, 10.193359375, 10.7890625, 11.384765625, 11.98046875, 12.576171875, 13.171875, 13.767578125, 14.36328125, 14.958984375, 15.5546875, 16.150390625, 16.74609375, 17.341796875, 17.9375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 13.0, 16.0, 16.0, 20.0, 27.0, 21.0, 36.0, 27.0, 41.0, 46.0, 37.0, 53.0, 75.0, 141.0, 345.0, 397.0, 163.0, 97.0, 66.0, 66.0, 48.0, 40.0, 23.0, 29.0, 14.0, 27.0, 12.0, 17.0, 14.0, 15.0, 11.0, 7.0, 4.0, 7.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-6.97265625, -6.77923583984375, -6.5858154296875, -6.39239501953125, -6.198974609375, -6.00555419921875, -5.8121337890625, -5.61871337890625, -5.42529296875, -5.23187255859375, -5.0384521484375, -4.84503173828125, -4.651611328125, -4.45819091796875, -4.2647705078125, -4.07135009765625, -3.8779296875, -3.68450927734375, -3.4910888671875, -3.29766845703125, -3.104248046875, -2.91082763671875, -2.7174072265625, -2.52398681640625, -2.33056640625, -2.13714599609375, -1.9437255859375, -1.75030517578125, -1.556884765625, -1.36346435546875, -1.1700439453125, -0.97662353515625, -0.783203125, -0.58978271484375, -0.3963623046875, -0.20294189453125, -0.009521484375, 0.18389892578125, 0.3773193359375, 0.57073974609375, 0.76416015625, 0.95758056640625, 1.1510009765625, 1.34442138671875, 1.537841796875, 1.73126220703125, 1.9246826171875, 2.11810302734375, 2.3115234375, 2.50494384765625, 2.6983642578125, 2.89178466796875, 3.085205078125, 3.27862548828125, 3.4720458984375, 3.66546630859375, 3.85888671875, 4.05230712890625, 4.2457275390625, 4.43914794921875, 4.632568359375, 4.82598876953125, 5.0194091796875, 5.21282958984375, 5.40625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 25.0, 57.0, 465.0, 372.0, 55.0, 23.0, 7.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.42376136779785, -16.574420928955078, -14.725079536437988, -12.875739097595215, -11.026397705078125, -9.177057266235352, -7.327716827392578, -5.478375434875488, -3.629034996032715, -1.7796941995620728, 0.06964659690856934, 1.9189872741699219, 3.7683281898498535, 5.617669105529785, 7.467009544372559, 9.316350936889648, 11.165691375732422, 13.015031814575195, 14.864373207092285, 16.713714599609375, 18.56305503845215, 20.412395477294922, 22.261735916137695, 24.11107635498047, 25.960418701171875, 27.80975914001465, 29.659099578857422, 31.508441925048828, 33.35778045654297, 35.207122802734375, 37.05646514892578, 38.90580368041992, 40.75514602661133, 42.604488372802734, 44.453826904296875, 46.30316925048828, 48.15250778198242, 50.00185012817383, 51.85118865966797, 53.700531005859375, 55.54987335205078, 57.39921569824219, 59.24855422973633, 61.097896575927734, 62.947235107421875, 64.79657745361328, 66.64591979980469, 68.4952621459961, 70.34459686279297, 72.19393920898438, 74.04328155517578, 75.89261627197266, 77.74195861816406, 79.59130096435547, 81.44064331054688, 83.28998565673828, 85.13932800292969, 86.9886703491211, 88.8380126953125, 90.68734741210938, 92.53668975830078, 94.38603210449219, 96.2353744506836, 98.084716796875, 99.93405151367188]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 15.0, 3.0, 11.0, 10.0, 11.0, 25.0, 24.0, 19.0, 25.0, 36.0, 27.0, 32.0, 26.0, 46.0, 33.0, 33.0, 50.0, 36.0, 47.0, 36.0, 39.0, 49.0, 39.0, 50.0, 38.0, 25.0, 26.0, 24.0, 25.0, 25.0, 18.0, 12.0, 18.0, 11.0, 3.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-9.475214004516602, -9.20776653289795, -8.940320014953613, -8.672872543334961, -8.405425071716309, -8.137977600097656, -7.87053108215332, -7.603083610534668, -7.335636615753174, -7.06818962097168, -6.800742149353027, -6.533295154571533, -6.265848159790039, -5.998400688171387, -5.730953693389893, -5.463506698608398, -5.196059226989746, -4.928612232208252, -4.6611647605896, -4.3937177658081055, -4.126270294189453, -3.858823299407959, -3.591376304626465, -3.3239290714263916, -3.0564818382263184, -2.789034605026245, -2.521587371826172, -2.2541403770446777, -1.9866931438446045, -1.7192459106445312, -1.4517987966537476, -1.1843516826629639, -0.9169044494628906, -0.6494572758674622, -0.3820101022720337, -0.11456292867660522, 0.15288424491882324, 0.4203314781188965, 0.6877785921096802, 0.9552257061004639, 1.222672939300537, 1.4901201725006104, 1.757567286491394, 2.0250144004821777, 2.292461633682251, 2.559908866882324, 2.8273558616638184, 3.0948030948638916, 3.362250328063965, 3.629697561264038, 3.8971447944641113, 4.1645917892456055, 4.432039260864258, 4.699486255645752, 4.966933250427246, 5.234380722045898, 5.501827716827393, 5.769274711608887, 6.036722183227539, 6.304169178009033, 6.571616172790527, 6.83906364440918, 7.106510639190674, 7.373957633972168, 7.64140510559082]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 10.0, 13.0, 13.0, 11.0, 27.0, 36.0, 44.0, 57.0, 102.0, 170.0, 307.0, 521.0, 1041.0, 2218.0, 5508.0, 19240.0, 4009994.0, 135246.0, 12026.0, 4043.0, 1732.0, 831.0, 445.0, 220.0, 139.0, 78.0, 62.0, 27.0, 25.0, 15.0, 15.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.039398193359375, -0.0381627082824707, -0.036927223205566406, -0.03569173812866211, -0.03445625305175781, -0.033220767974853516, -0.03198528289794922, -0.030749797821044922, -0.029514312744140625, -0.028278827667236328, -0.02704334259033203, -0.025807857513427734, -0.024572372436523438, -0.02333688735961914, -0.022101402282714844, -0.020865917205810547, -0.01963043212890625, -0.018394947052001953, -0.017159461975097656, -0.01592397689819336, -0.014688491821289062, -0.013453006744384766, -0.012217521667480469, -0.010982036590576172, -0.009746551513671875, -0.008511066436767578, -0.007275581359863281, -0.006040096282958984, -0.0048046112060546875, -0.0035691261291503906, -0.0023336410522460938, -0.0010981559753417969, 0.0001373291015625, 0.0013728141784667969, 0.0026082992553710938, 0.0038437843322753906, 0.0050792694091796875, 0.006314754486083984, 0.007550239562988281, 0.008785724639892578, 0.010021209716796875, 0.011256694793701172, 0.012492179870605469, 0.013727664947509766, 0.014963150024414062, 0.01619863510131836, 0.017434120178222656, 0.018669605255126953, 0.01990509033203125, 0.021140575408935547, 0.022376060485839844, 0.02361154556274414, 0.024847030639648438, 0.026082515716552734, 0.02731800079345703, 0.028553485870361328, 0.029788970947265625, 0.031024456024169922, 0.03225994110107422, 0.033495426177978516, 0.03473091125488281, 0.03596639633178711, 0.037201881408691406, 0.0384373664855957, 0.0396728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 6.0, 7.0, 21.0, 14.0, 11.0, 11.0, 20.0, 762.0, 23.0, 14.0, 21.0, 10.0, 12.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004222869873046875, -0.004107028245925903, -0.003991186618804932, -0.00387534499168396, -0.0037595033645629883, -0.0036436617374420166, -0.003527820110321045, -0.0034119784832000732, -0.0032961368560791016, -0.00318029522895813, -0.003064453601837158, -0.0029486119747161865, -0.002832770347595215, -0.002716928720474243, -0.0026010870933532715, -0.0024852454662323, -0.002369403839111328, -0.0022535622119903564, -0.0021377205848693848, -0.002021878957748413, -0.0019060373306274414, -0.0017901957035064697, -0.001674354076385498, -0.0015585124492645264, -0.0014426708221435547, -0.001326829195022583, -0.0012109875679016113, -0.0010951459407806396, -0.000979304313659668, -0.0008634626865386963, -0.0007476210594177246, -0.0006317794322967529, -0.0005159378051757812, -0.00040009617805480957, -0.0002842545509338379, -0.0001684129238128662, -5.257129669189453e-05, 6.327033042907715e-05, 0.00017911195755004883, 0.0002949535846710205, 0.0004107952117919922, 0.0005266368389129639, 0.0006424784660339355, 0.0007583200931549072, 0.0008741617202758789, 0.0009900033473968506, 0.0011058449745178223, 0.001221686601638794, 0.0013375282287597656, 0.0014533698558807373, 0.001569211483001709, 0.0016850531101226807, 0.0018008947372436523, 0.001916736364364624, 0.0020325779914855957, 0.0021484196186065674, 0.002264261245727539, 0.0023801028728485107, 0.0024959444999694824, 0.002611786127090454, 0.0027276277542114258, 0.0028434693813323975, 0.002959311008453369, 0.003075152635574341, 0.0031909942626953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 9.0, 11.0, 15.0, 14.0, 22.0, 37.0, 56.0, 89.0, 137.0, 185.0, 347.0, 556.0, 1114.0, 2370.0, 5879.0, 17850.0, 80682.0, 3492036.0, 524193.0, 47802.0, 12362.0, 4397.0, 1839.0, 946.0, 517.0, 291.0, 170.0, 117.0, 79.0, 52.0, 32.0, 21.0, 16.0, 13.0, 11.0, 10.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031890869140625, -0.03092026710510254, -0.029949665069580078, -0.028979063034057617, -0.028008460998535156, -0.027037858963012695, -0.026067256927490234, -0.025096654891967773, -0.024126052856445312, -0.02315545082092285, -0.02218484878540039, -0.02121424674987793, -0.02024364471435547, -0.019273042678833008, -0.018302440643310547, -0.017331838607788086, -0.016361236572265625, -0.015390634536743164, -0.014420032501220703, -0.013449430465698242, -0.012478828430175781, -0.01150822639465332, -0.01053762435913086, -0.009567022323608398, -0.008596420288085938, -0.0076258182525634766, -0.006655216217041016, -0.005684614181518555, -0.004714012145996094, -0.003743410110473633, -0.002772808074951172, -0.001802206039428711, -0.00083160400390625, 0.00013899803161621094, 0.0011096000671386719, 0.002080202102661133, 0.0030508041381835938, 0.004021406173706055, 0.004992008209228516, 0.0059626102447509766, 0.0069332122802734375, 0.007903814315795898, 0.00887441635131836, 0.00984501838684082, 0.010815620422363281, 0.011786222457885742, 0.012756824493408203, 0.013727426528930664, 0.014698028564453125, 0.015668630599975586, 0.016639232635498047, 0.017609834671020508, 0.01858043670654297, 0.01955103874206543, 0.02052164077758789, 0.02149224281311035, 0.022462844848632812, 0.023433446884155273, 0.024404048919677734, 0.025374650955200195, 0.026345252990722656, 0.027315855026245117, 0.028286457061767578, 0.02925705909729004, 0.0302276611328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 11.0, 10.0, 21.0, 19.0, 31.0, 39.0, 59.0, 65.0, 90.0, 143.0, 203.0, 704.0, 1880.0, 307.0, 140.0, 104.0, 64.0, 46.0, 23.0, 26.0, 24.0, 14.0, 9.0, 11.0, 5.0, 5.0, 1.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00608062744140625, -0.0058858394622802734, -0.005691051483154297, -0.00549626350402832, -0.005301475524902344, -0.005106687545776367, -0.004911899566650391, -0.004717111587524414, -0.0045223236083984375, -0.004327535629272461, -0.004132747650146484, -0.003937959671020508, -0.0037431716918945312, -0.0035483837127685547, -0.003353595733642578, -0.0031588077545166016, -0.002964019775390625, -0.0027692317962646484, -0.002574443817138672, -0.0023796558380126953, -0.0021848678588867188, -0.001990079879760742, -0.0017952919006347656, -0.001600503921508789, -0.0014057159423828125, -0.001210927963256836, -0.0010161399841308594, -0.0008213520050048828, -0.0006265640258789062, -0.0004317760467529297, -0.00023698806762695312, -4.220008850097656e-05, 0.000152587890625, 0.00034737586975097656, 0.0005421638488769531, 0.0007369518280029297, 0.0009317398071289062, 0.0011265277862548828, 0.0013213157653808594, 0.001516103744506836, 0.0017108917236328125, 0.001905679702758789, 0.0021004676818847656, 0.002295255661010742, 0.0024900436401367188, 0.0026848316192626953, 0.002879619598388672, 0.0030744075775146484, 0.003269195556640625, 0.0034639835357666016, 0.003658771514892578, 0.0038535594940185547, 0.004048347473144531, 0.004243135452270508, 0.004437923431396484, 0.004632711410522461, 0.0048274993896484375, 0.005022287368774414, 0.005217075347900391, 0.005411863327026367, 0.005606651306152344, 0.00580143928527832, 0.005996227264404297, 0.0061910152435302734, 0.00638580322265625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 2.0, 9.0, 27.0, 78.0, 303.0, 422.0, 123.0, 26.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1435861587524414, -0.14048056304454803, -0.13737498223781586, -0.13426938652992249, -0.1311637908220291, -0.12805821001529694, -0.12495261430740356, -0.12184701859951019, -0.11874143034219742, -0.11563584208488464, -0.11253024637699127, -0.1094246581196785, -0.10631906986236572, -0.10321347415447235, -0.10010788589715958, -0.0970022976398468, -0.09389670193195343, -0.09079111367464066, -0.08768551796674728, -0.08457992970943451, -0.08147434145212173, -0.07836874574422836, -0.07526315748691559, -0.07215756177902222, -0.06905198097229004, -0.06594639271497726, -0.06284079700708389, -0.05973520874977112, -0.056629616767168045, -0.05352402478456497, -0.0504184365272522, -0.047312844544649124, -0.04420725256204605, -0.04110166057944298, -0.0379960723221302, -0.03489048033952713, -0.03178488835692406, -0.028679298236966133, -0.02557370811700821, -0.022468116134405136, -0.019362526014447212, -0.01625693589448929, -0.013151343911886215, -0.010045753791928291, -0.006940162740647793, -0.0038345716893672943, -0.0007289815694093704, 0.0023766104131937027, 0.005482200533151627, 0.008587791584432125, 0.011693382635712624, 0.014798972755670547, 0.01790456473827362, 0.021010154858231544, 0.02411574497818947, 0.02722133696079254, 0.030326927080750465, 0.03343251720070839, 0.03653810918331146, 0.03964369744062424, 0.04274928942322731, 0.04585488140583038, 0.04896046966314316, 0.05206606537103653, 0.055171653628349304]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 17.0, 14.0, 18.0, 19.0, 24.0, 34.0, 26.0, 40.0, 38.0, 48.0, 44.0, 52.0, 54.0, 63.0, 58.0, 56.0, 53.0, 60.0, 47.0, 37.0, 35.0, 33.0, 35.0, 23.0, 9.0, 13.0, 16.0, 11.0, 4.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017418265342712402, -0.016780920326709747, -0.01614357717335224, -0.015506233088672161, -0.01486888900399208, -0.014231544919312, -0.01359420083463192, -0.01295685674995184, -0.012319512665271759, -0.011682168580591679, -0.011044824495911598, -0.010407480411231518, -0.009770136326551437, -0.009132792241871357, -0.008495448157191277, -0.007858104072511196, -0.007220759987831116, -0.006583415903151035, -0.005946071818470955, -0.0053087277337908745, -0.004671383649110794, -0.004034039564430714, -0.0033966954797506332, -0.002759351395070553, -0.0021220073103904724, -0.001484663225710392, -0.0008473191410303116, -0.00020997505635023117, 0.00042736902832984924, 0.0010647131130099297, 0.00170205719769001, 0.0023394012823700905, 0.002976745367050171, 0.0036140894517302513, 0.004251433536410332, 0.004888777621090412, 0.0055261217057704926, 0.006163465790450573, 0.006800809875130653, 0.007438153959810734, 0.008075498044490814, 0.008712842129170895, 0.009350186213850975, 0.009987530298531055, 0.010624874383211136, 0.011262218467891216, 0.011899562552571297, 0.012536906637251377, 0.013174250721931458, 0.013811594806611538, 0.014448938891291618, 0.015086282975971699, 0.01572362706065178, 0.016360972076654434, 0.01699831523001194, 0.017635658383369446, 0.0182730033993721, 0.018910348415374756, 0.01954769156873226, 0.020185034722089767, 0.020822379738092422, 0.021459724754095078, 0.022097067907452583, 0.02273441106081009, 0.023371756076812744]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 1.0, 4.0, 4.0, 12.0, 7.0, 11.0, 20.0, 19.0, 45.0, 48.0, 75.0, 102.0, 133.0, 215.0, 309.0, 495.0, 717.0, 1243.0, 2069.0, 3611.0, 6892.0, 14739.0, 41398.0, 888360.0, 54608.0, 16114.0, 7499.0, 3946.0, 2176.0, 1317.0, 792.0, 530.0, 334.0, 209.0, 155.0, 104.0, 56.0, 54.0, 33.0, 30.0, 19.0, 17.0, 12.0, 8.0, 1.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0382080078125, -0.03706979751586914, -0.03593158721923828, -0.03479337692260742, -0.03365516662597656, -0.0325169563293457, -0.031378746032714844, -0.030240535736083984, -0.029102325439453125, -0.027964115142822266, -0.026825904846191406, -0.025687694549560547, -0.024549484252929688, -0.023411273956298828, -0.02227306365966797, -0.02113485336303711, -0.01999664306640625, -0.01885843276977539, -0.01772022247314453, -0.016582012176513672, -0.015443801879882812, -0.014305591583251953, -0.013167381286621094, -0.012029170989990234, -0.010890960693359375, -0.009752750396728516, -0.008614540100097656, -0.007476329803466797, -0.0063381195068359375, -0.005199909210205078, -0.004061698913574219, -0.0029234886169433594, -0.0017852783203125, -0.0006470680236816406, 0.0004911422729492188, 0.0016293525695800781, 0.0027675628662109375, 0.003905773162841797, 0.005043983459472656, 0.006182193756103516, 0.007320404052734375, 0.008458614349365234, 0.009596824645996094, 0.010735034942626953, 0.011873245239257812, 0.013011455535888672, 0.014149665832519531, 0.01528787612915039, 0.01642608642578125, 0.01756429672241211, 0.01870250701904297, 0.019840717315673828, 0.020978927612304688, 0.022117137908935547, 0.023255348205566406, 0.024393558502197266, 0.025531768798828125, 0.026669979095458984, 0.027808189392089844, 0.028946399688720703, 0.030084609985351562, 0.031222820281982422, 0.03236103057861328, 0.03349924087524414, 0.034637451171875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 11.0, 16.0, 12.0, 19.0, 46.0, 332.0, 368.0, 69.0, 18.0, 8.0, 16.0, 8.0, 2.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004180908203125, -0.004064470529556274, -0.003948032855987549, -0.0038315951824188232, -0.0037151575088500977, -0.003598719835281372, -0.0034822821617126465, -0.003365844488143921, -0.0032494068145751953, -0.0031329691410064697, -0.003016531467437744, -0.0029000937938690186, -0.002783656120300293, -0.0026672184467315674, -0.002550780773162842, -0.002434343099594116, -0.0023179054260253906, -0.002201467752456665, -0.0020850300788879395, -0.001968592405319214, -0.0018521547317504883, -0.0017357170581817627, -0.0016192793846130371, -0.0015028417110443115, -0.001386404037475586, -0.0012699663639068604, -0.0011535286903381348, -0.0010370910167694092, -0.0009206533432006836, -0.000804215669631958, -0.0006877779960632324, -0.0005713403224945068, -0.00045490264892578125, -0.00033846497535705566, -0.00022202730178833008, -0.00010558962821960449, 1.0848045349121094e-05, 0.00012728571891784668, 0.00024372339248657227, 0.00036016106605529785, 0.00047659873962402344, 0.000593036413192749, 0.0007094740867614746, 0.0008259117603302002, 0.0009423494338989258, 0.0010587871074676514, 0.001175224781036377, 0.0012916624546051025, 0.0014081001281738281, 0.0015245378017425537, 0.0016409754753112793, 0.0017574131488800049, 0.0018738508224487305, 0.001990288496017456, 0.0021067261695861816, 0.0022231638431549072, 0.002339601516723633, 0.0024560391902923584, 0.002572476863861084, 0.0026889145374298096, 0.002805352210998535, 0.0029217898845672607, 0.0030382275581359863, 0.003154665231704712, 0.0032711029052734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 9.0, 29.0, 28.0, 36.0, 43.0, 54.0, 80.0, 140.0, 196.0, 250.0, 360.0, 645.0, 1107.0, 1850.0, 3812.0, 9320.0, 41818.0, 761933.0, 194365.0, 19795.0, 6023.0, 2825.0, 1386.0, 825.0, 512.0, 330.0, 249.0, 153.0, 105.0, 65.0, 46.0, 39.0, 27.0, 21.0, 23.0, 7.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.057708740234375, -0.05613994598388672, -0.05457115173339844, -0.053002357482910156, -0.051433563232421875, -0.049864768981933594, -0.04829597473144531, -0.04672718048095703, -0.04515838623046875, -0.04358959197998047, -0.04202079772949219, -0.040452003479003906, -0.038883209228515625, -0.037314414978027344, -0.03574562072753906, -0.03417682647705078, -0.0326080322265625, -0.03103923797607422, -0.029470443725585938, -0.027901649475097656, -0.026332855224609375, -0.024764060974121094, -0.023195266723632812, -0.02162647247314453, -0.02005767822265625, -0.01848888397216797, -0.016920089721679688, -0.015351295471191406, -0.013782501220703125, -0.012213706970214844, -0.010644912719726562, -0.009076118469238281, -0.00750732421875, -0.005938529968261719, -0.0043697357177734375, -0.0028009414672851562, -0.001232147216796875, 0.00033664703369140625, 0.0019054412841796875, 0.0034742355346679688, 0.00504302978515625, 0.006611824035644531, 0.008180618286132812, 0.009749412536621094, 0.011318206787109375, 0.012887001037597656, 0.014455795288085938, 0.01602458953857422, 0.0175933837890625, 0.01916217803955078, 0.020730972290039062, 0.022299766540527344, 0.023868560791015625, 0.025437355041503906, 0.027006149291992188, 0.02857494354248047, 0.03014373779296875, 0.03171253204345703, 0.03328132629394531, 0.034850120544433594, 0.036418914794921875, 0.037987709045410156, 0.03955650329589844, 0.04112529754638672, 0.042694091796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 16.0, 8.0, 19.0, 21.0, 21.0, 16.0, 29.0, 32.0, 23.0, 33.0, 45.0, 26.0, 41.0, 42.0, 31.0, 47.0, 35.0, 37.0, 32.0, 33.0, 33.0, 39.0, 30.0, 39.0, 31.0, 28.0, 27.0, 19.0, 22.0, 18.0, 15.0, 12.0, 15.0, 11.0, 11.0, 4.0, 9.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0128021240234375, -0.012413501739501953, -0.012024879455566406, -0.01163625717163086, -0.011247634887695312, -0.010859012603759766, -0.010470390319824219, -0.010081768035888672, -0.009693145751953125, -0.009304523468017578, -0.008915901184082031, -0.008527278900146484, -0.008138656616210938, -0.007750034332275391, -0.007361412048339844, -0.006972789764404297, -0.00658416748046875, -0.006195545196533203, -0.005806922912597656, -0.005418300628662109, -0.0050296783447265625, -0.004641056060791016, -0.004252433776855469, -0.003863811492919922, -0.003475189208984375, -0.003086566925048828, -0.0026979446411132812, -0.0023093223571777344, -0.0019207000732421875, -0.0015320777893066406, -0.0011434555053710938, -0.0007548332214355469, -0.0003662109375, 2.2411346435546875e-05, 0.00041103363037109375, 0.0007996559143066406, 0.0011882781982421875, 0.0015769004821777344, 0.0019655227661132812, 0.002354145050048828, 0.002742767333984375, 0.003131389617919922, 0.0035200119018554688, 0.003908634185791016, 0.0042972564697265625, 0.004685878753662109, 0.005074501037597656, 0.005463123321533203, 0.00585174560546875, 0.006240367889404297, 0.006628990173339844, 0.007017612457275391, 0.0074062347412109375, 0.007794857025146484, 0.008183479309082031, 0.008572101593017578, 0.008960723876953125, 0.009349346160888672, 0.009737968444824219, 0.010126590728759766, 0.010515213012695312, 0.01090383529663086, 0.011292457580566406, 0.011681079864501953, 0.0120697021484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 14.0, 15.0, 22.0, 38.0, 55.0, 73.0, 110.0, 206.0, 282.0, 504.0, 1043.0, 2443.0, 8236.0, 82512.0, 920127.0, 24687.0, 4671.0, 1623.0, 725.0, 452.0, 241.0, 149.0, 87.0, 61.0, 47.0, 33.0, 16.0, 23.0, 14.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.07333564758300781, -0.07074356079101562, -0.06815147399902344, -0.06555938720703125, -0.06296730041503906, -0.060375213623046875, -0.05778312683105469, -0.0551910400390625, -0.05259895324707031, -0.050006866455078125, -0.04741477966308594, -0.04482269287109375, -0.04223060607910156, -0.039638519287109375, -0.03704643249511719, -0.034454345703125, -0.03186225891113281, -0.029270172119140625, -0.026678085327148438, -0.02408599853515625, -0.021493911743164062, -0.018901824951171875, -0.016309738159179688, -0.0137176513671875, -0.011125564575195312, -0.008533477783203125, -0.0059413909912109375, -0.00334930419921875, -0.0007572174072265625, 0.001834869384765625, 0.0044269561767578125, 0.00701904296875, 0.009611129760742188, 0.012203216552734375, 0.014795303344726562, 0.01738739013671875, 0.019979476928710938, 0.022571563720703125, 0.025163650512695312, 0.0277557373046875, 0.030347824096679688, 0.032939910888671875, 0.03553199768066406, 0.03812408447265625, 0.04071617126464844, 0.043308258056640625, 0.04590034484863281, 0.048492431640625, 0.05108451843261719, 0.053676605224609375, 0.05626869201660156, 0.05886077880859375, 0.06145286560058594, 0.06404495239257812, 0.06663703918457031, 0.0692291259765625, 0.07182121276855469, 0.07441329956054688, 0.07700538635253906, 0.07959747314453125, 0.08218955993652344, 0.08478164672851562, 0.08737373352050781, 0.0899658203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 12.0, 14.0, 12.0, 22.0, 18.0, 25.0, 47.0, 101.0, 210.0, 192.0, 92.0, 46.0, 35.0, 29.0, 28.0, 12.0, 7.0, 10.0, 15.0, 7.0, 7.0, 7.0, 2.0, 2.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014486312866210938, -0.0014046579599380493, -0.0013606846332550049, -0.0013167113065719604, -0.001272737979888916, -0.0012287646532058716, -0.0011847913265228271, -0.0011408179998397827, -0.0010968446731567383, -0.0010528713464736938, -0.0010088980197906494, -0.000964924693107605, -0.0009209513664245605, -0.0008769780397415161, -0.0008330047130584717, -0.0007890313863754272, -0.0007450580596923828, -0.0007010847330093384, -0.0006571114063262939, -0.0006131380796432495, -0.0005691647529602051, -0.0005251914262771606, -0.0004812180995941162, -0.0004372447729110718, -0.00039327144622802734, -0.0003492981195449829, -0.0003053247928619385, -0.00026135146617889404, -0.0002173781394958496, -0.00017340481281280518, -0.00012943148612976074, -8.545815944671631e-05, -4.1484832763671875e-05, 2.4884939193725586e-06, 4.646182060241699e-05, 9.043514728546143e-05, 0.00013440847396850586, 0.0001783818006515503, 0.00022235512733459473, 0.00026632845401763916, 0.0003103017807006836, 0.00035427510738372803, 0.00039824843406677246, 0.0004422217607498169, 0.00048619508743286133, 0.0005301684141159058, 0.0005741417407989502, 0.0006181150674819946, 0.0006620883941650391, 0.0007060617208480835, 0.0007500350475311279, 0.0007940083742141724, 0.0008379817008972168, 0.0008819550275802612, 0.0009259283542633057, 0.0009699016809463501, 0.0010138750076293945, 0.001057848334312439, 0.0011018216609954834, 0.0011457949876785278, 0.0011897683143615723, 0.0012337416410446167, 0.0012777149677276611, 0.0013216882944107056, 0.00136566162109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 18.0, 13.0, 23.0, 34.0, 42.0, 84.0, 112.0, 186.0, 321.0, 607.0, 1112.0, 2374.0, 5740.0, 17261.0, 80469.0, 839659.0, 73760.0, 16323.0, 5578.0, 2316.0, 1107.0, 579.0, 319.0, 182.0, 108.0, 57.0, 54.0, 38.0, 17.0, 15.0, 6.0, 9.0, 8.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.06418418884277344, -0.062145233154296875, -0.06010627746582031, -0.05806732177734375, -0.05602836608886719, -0.053989410400390625, -0.05195045471191406, -0.0499114990234375, -0.04787254333496094, -0.045833587646484375, -0.04379463195800781, -0.04175567626953125, -0.03971672058105469, -0.037677764892578125, -0.03563880920410156, -0.033599853515625, -0.03156089782714844, -0.029521942138671875, -0.027482986450195312, -0.02544403076171875, -0.023405075073242188, -0.021366119384765625, -0.019327163696289062, -0.0172882080078125, -0.015249252319335938, -0.013210296630859375, -0.011171340942382812, -0.00913238525390625, -0.0070934295654296875, -0.005054473876953125, -0.0030155181884765625, -0.0009765625, 0.0010623931884765625, 0.003101348876953125, 0.0051403045654296875, 0.00717926025390625, 0.009218215942382812, 0.011257171630859375, 0.013296127319335938, 0.0153350830078125, 0.017374038696289062, 0.019412994384765625, 0.021451950073242188, 0.02349090576171875, 0.025529861450195312, 0.027568817138671875, 0.029607772827148438, 0.031646728515625, 0.03368568420410156, 0.035724639892578125, 0.03776359558105469, 0.03980255126953125, 0.04184150695800781, 0.043880462646484375, 0.04591941833496094, 0.0479583740234375, 0.04999732971191406, 0.052036285400390625, 0.05407524108886719, 0.05611419677734375, 0.05815315246582031, 0.060192108154296875, 0.06223106384277344, 0.06427001953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 14.0, 13.0, 10.0, 15.0, 13.0, 28.0, 29.0, 47.0, 69.0, 104.0, 274.0, 107.0, 67.0, 57.0, 27.0, 16.0, 27.0, 13.0, 8.0, 11.0, 8.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041656494140625, -0.040377140045166016, -0.03909778594970703, -0.03781843185424805, -0.03653907775878906, -0.03525972366333008, -0.033980369567871094, -0.03270101547241211, -0.031421661376953125, -0.03014230728149414, -0.028862953186035156, -0.027583599090576172, -0.026304244995117188, -0.025024890899658203, -0.02374553680419922, -0.022466182708740234, -0.02118682861328125, -0.019907474517822266, -0.01862812042236328, -0.017348766326904297, -0.016069412231445312, -0.014790058135986328, -0.013510704040527344, -0.01223134994506836, -0.010951995849609375, -0.00967264175415039, -0.008393287658691406, -0.007113933563232422, -0.0058345794677734375, -0.004555225372314453, -0.0032758712768554688, -0.0019965171813964844, -0.0007171630859375, 0.0005621910095214844, 0.0018415451049804688, 0.003120899200439453, 0.0044002532958984375, 0.005679607391357422, 0.006958961486816406, 0.00823831558227539, 0.009517669677734375, 0.01079702377319336, 0.012076377868652344, 0.013355731964111328, 0.014635086059570312, 0.015914440155029297, 0.01719379425048828, 0.018473148345947266, 0.01975250244140625, 0.021031856536865234, 0.02231121063232422, 0.023590564727783203, 0.024869918823242188, 0.026149272918701172, 0.027428627014160156, 0.02870798110961914, 0.029987335205078125, 0.03126668930053711, 0.032546043395996094, 0.03382539749145508, 0.03510475158691406, 0.03638410568237305, 0.03766345977783203, 0.038942813873291016, 0.04022216796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 29.0, 141.0, 557.0, 169.0, 53.0, 12.0, 10.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0424519777297974, -1.0166871547698975, -0.9909223914146423, -0.9651575684547424, -0.9393928050994873, -0.9136279821395874, -0.8878631591796875, -0.8620983362197876, -0.8363335728645325, -0.8105687499046326, -0.7848039865493774, -0.7590391635894775, -0.7332743406295776, -0.7075095772743225, -0.6817447543144226, -0.6559799909591675, -0.6302151679992676, -0.6044503450393677, -0.5786855816841125, -0.5529207587242126, -0.5271559953689575, -0.5013911724090576, -0.4756263494491577, -0.4498615562915802, -0.4240967631340027, -0.39833196997642517, -0.37256717681884766, -0.34680235385894775, -0.32103756070137024, -0.2952727675437927, -0.2695079445838928, -0.2437431514263153, -0.21797829866409302, -0.1922135055065155, -0.1664486974477768, -0.14068388938903809, -0.11491909623146057, -0.08915430307388306, -0.06338949501514435, -0.03762468695640564, -0.011859893798828125, 0.013904906809329987, 0.0396697074174881, 0.06543450802564621, 0.09119930863380432, 0.11696410179138184, 0.14272890985012054, 0.16849371790885925, 0.19425851106643677, 0.22002330422401428, 0.245788112282753, 0.2715529203414917, 0.2973177134990692, 0.32308250665664673, 0.34884732961654663, 0.37461212277412415, 0.40037691593170166, 0.4261417090892792, 0.4519065022468567, 0.4776713252067566, 0.5034360885620117, 0.5292009115219116, 0.5549657344818115, 0.5807305574417114, 0.6064953207969666]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 7.0, 9.0, 13.0, 8.0, 23.0, 32.0, 54.0, 100.0, 105.0, 128.0, 132.0, 116.0, 77.0, 64.0, 30.0, 21.0, 13.0, 14.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3502047061920166, -0.34066644310951233, -0.33112815022468567, -0.3215898871421814, -0.3120516240596771, -0.30251336097717285, -0.2929750680923462, -0.2834368050098419, -0.27389854192733765, -0.2643602788448334, -0.2548219859600067, -0.24528372287750244, -0.23574545979499817, -0.2262071818113327, -0.21666890382766724, -0.20713064074516296, -0.1975923478603363, -0.18805406987667084, -0.17851580679416656, -0.1689775288105011, -0.15943926572799683, -0.14990098774433136, -0.1403627097606659, -0.13082444667816162, -0.12128616869449615, -0.11174789816141129, -0.10220962762832642, -0.09267134964466095, -0.08313307911157608, -0.07359480857849121, -0.06405653059482574, -0.054518260061740875, -0.044979989528656006, -0.035441718995571136, -0.02590344473719597, -0.01636517234146595, -0.006826899945735931, 0.002711370587348938, 0.012249644845724106, 0.021787919104099274, 0.03132618963718414, 0.04086446017026901, 0.05040273442864418, 0.05994100868701935, 0.06947927922010422, 0.07901754975318909, 0.08855582773685455, 0.09809409826993942, 0.10763236880302429, 0.11717063933610916, 0.12670890986919403, 0.1362471878528595, 0.14578545093536377, 0.15532372891902924, 0.1648620069026947, 0.17440026998519897, 0.18393854796886444, 0.1934768259525299, 0.20301508903503418, 0.21255336701869965, 0.2220916450023651, 0.23162990808486938, 0.24116818606853485, 0.2507064640522003, 0.2602447271347046]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 8.0, 17.0, 18.0, 25.0, 29.0, 58.0, 133.0, 949.0, 27346.0, 4160409.0, 4832.0, 215.0, 63.0, 32.0, 15.0, 24.0, 14.0, 12.0, 5.0, 9.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.49761962890625, -2.4268798828125, -2.35614013671875, -2.285400390625, -2.21466064453125, -2.1439208984375, -2.07318115234375, -2.00244140625, -1.93170166015625, -1.8609619140625, -1.79022216796875, -1.719482421875, -1.64874267578125, -1.5780029296875, -1.50726318359375, -1.4365234375, -1.36578369140625, -1.2950439453125, -1.22430419921875, -1.153564453125, -1.08282470703125, -1.0120849609375, -0.94134521484375, -0.87060546875, -0.79986572265625, -0.7291259765625, -0.65838623046875, -0.587646484375, -0.51690673828125, -0.4461669921875, -0.37542724609375, -0.3046875, -0.23394775390625, -0.1632080078125, -0.09246826171875, -0.021728515625, 0.04901123046875, 0.1197509765625, 0.19049072265625, 0.26123046875, 0.33197021484375, 0.4027099609375, 0.47344970703125, 0.544189453125, 0.61492919921875, 0.6856689453125, 0.75640869140625, 0.8271484375, 0.89788818359375, 0.9686279296875, 1.03936767578125, 1.110107421875, 1.18084716796875, 1.2515869140625, 1.32232666015625, 1.39306640625, 1.46380615234375, 1.5345458984375, 1.60528564453125, 1.676025390625, 1.74676513671875, 1.8175048828125, 1.88824462890625, 1.958984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 11.0, 9.0, 12.0, 12.0, 13.0, 29.0, 58.0, 121.0, 252.0, 198.0, 144.0, 53.0, 27.0, 14.0, 14.0, 6.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.005809783935546875, -0.005685657262802124, -0.005561530590057373, -0.005437403917312622, -0.005313277244567871, -0.00518915057182312, -0.005065023899078369, -0.004940897226333618, -0.004816770553588867, -0.004692643880844116, -0.004568517208099365, -0.004444390535354614, -0.004320263862609863, -0.004196137189865112, -0.004072010517120361, -0.00394788384437561, -0.0038237571716308594, -0.0036996304988861084, -0.0035755038261413574, -0.0034513771533966064, -0.0033272504806518555, -0.0032031238079071045, -0.0030789971351623535, -0.0029548704624176025, -0.0028307437896728516, -0.0027066171169281006, -0.0025824904441833496, -0.0024583637714385986, -0.0023342370986938477, -0.0022101104259490967, -0.0020859837532043457, -0.0019618570804595947, -0.0018377304077148438, -0.0017136037349700928, -0.0015894770622253418, -0.0014653503894805908, -0.0013412237167358398, -0.0012170970439910889, -0.0010929703712463379, -0.0009688436985015869, -0.0008447170257568359, -0.000720590353012085, -0.000596463680267334, -0.000472337007522583, -0.00034821033477783203, -0.00022408366203308105, -9.995698928833008e-05, 2.41696834564209e-05, 0.00014829635620117188, 0.00027242302894592285, 0.00039654970169067383, 0.0005206763744354248, 0.0006448030471801758, 0.0007689297199249268, 0.0008930563926696777, 0.0010171830654144287, 0.0011413097381591797, 0.0012654364109039307, 0.0013895630836486816, 0.0015136897563934326, 0.0016378164291381836, 0.0017619431018829346, 0.0018860697746276855, 0.0020101964473724365, 0.0021343231201171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 5.0, 5.0, 5.0, 9.0, 21.0, 17.0, 20.0, 29.0, 39.0, 42.0, 57.0, 84.0, 89.0, 142.0, 243.0, 1657.0, 4059588.0, 130466.0, 893.0, 210.0, 118.0, 95.0, 91.0, 84.0, 67.0, 46.0, 42.0, 25.0, 24.0, 11.0, 12.0, 11.0, 7.0, 7.0, 7.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.4951896667480469, -0.48012542724609375, -0.4650611877441406, -0.4499969482421875, -0.4349327087402344, -0.41986846923828125, -0.4048042297363281, -0.389739990234375, -0.3746757507324219, -0.35961151123046875, -0.3445472717285156, -0.3294830322265625, -0.3144187927246094, -0.29935455322265625, -0.2842903137207031, -0.26922607421875, -0.2541618347167969, -0.23909759521484375, -0.22403335571289062, -0.2089691162109375, -0.19390487670898438, -0.17884063720703125, -0.16377639770507812, -0.148712158203125, -0.13364791870117188, -0.11858367919921875, -0.10351943969726562, -0.0884552001953125, -0.07339096069335938, -0.05832672119140625, -0.043262481689453125, -0.0281982421875, -0.013134002685546875, 0.00193023681640625, 0.016994476318359375, 0.0320587158203125, 0.047122955322265625, 0.06218719482421875, 0.07725143432617188, 0.092315673828125, 0.10737991333007812, 0.12244415283203125, 0.13750839233398438, 0.1525726318359375, 0.16763687133789062, 0.18270111083984375, 0.19776535034179688, 0.21282958984375, 0.22789382934570312, 0.24295806884765625, 0.2580223083496094, 0.2730865478515625, 0.2881507873535156, 0.30321502685546875, 0.3182792663574219, 0.333343505859375, 0.3484077453613281, 0.36347198486328125, 0.3785362243652344, 0.3936004638671875, 0.4086647033691406, 0.42372894287109375, 0.4387931823730469, 0.453857421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 12.0, 6.0, 7.0, 13.0, 10.0, 14.0, 25.0, 33.0, 43.0, 54.0, 79.0, 76.0, 138.0, 173.0, 289.0, 520.0, 1288.0, 347.0, 205.0, 163.0, 127.0, 114.0, 68.0, 66.0, 44.0, 29.0, 21.0, 19.0, 18.0, 17.0, 5.0, 12.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0051727294921875, -0.005016624927520752, -0.004860520362854004, -0.004704415798187256, -0.004548311233520508, -0.00439220666885376, -0.004236102104187012, -0.004079997539520264, -0.003923892974853516, -0.0037677884101867676, -0.0036116838455200195, -0.0034555792808532715, -0.0032994747161865234, -0.0031433701515197754, -0.0029872655868530273, -0.0028311610221862793, -0.0026750564575195312, -0.002518951892852783, -0.002362847328186035, -0.002206742763519287, -0.002050638198852539, -0.001894533634185791, -0.001738429069519043, -0.001582324504852295, -0.0014262199401855469, -0.0012701153755187988, -0.0011140108108520508, -0.0009579062461853027, -0.0008018016815185547, -0.0006456971168518066, -0.0004895925521850586, -0.00033348798751831055, -0.0001773834228515625, -2.1278858184814453e-05, 0.0001348257064819336, 0.00029093027114868164, 0.0004470348358154297, 0.0006031394004821777, 0.0007592439651489258, 0.0009153485298156738, 0.0010714530944824219, 0.00122755765914917, 0.001383662223815918, 0.001539766788482666, 0.001695871353149414, 0.0018519759178161621, 0.00200808048248291, 0.002164185047149658, 0.0023202896118164062, 0.0024763941764831543, 0.0026324987411499023, 0.0027886033058166504, 0.0029447078704833984, 0.0031008124351501465, 0.0032569169998168945, 0.0034130215644836426, 0.0035691261291503906, 0.0037252306938171387, 0.0038813352584838867, 0.004037439823150635, 0.004193544387817383, 0.004349648952484131, 0.004505753517150879, 0.004661858081817627, 0.004817962646484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 8.0, 130.0, 810.0, 58.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10178752988576889, -0.08207255601882935, -0.0623575821518898, -0.042642608284950256, -0.02292763441801071, -0.003212660551071167, 0.016502313315868378, 0.036217279732227325, 0.05593226104974747, 0.07564723491668701, 0.09536220878362656, 0.1150771826505661, 0.13479214906692505, 0.1545071303844452, 0.17422211170196533, 0.19393706321716309, 0.21365204453468323, 0.23336702585220337, 0.2530819773674011, 0.27279695868492126, 0.2925119400024414, 0.31222692131996155, 0.3319419026374817, 0.35165685415267944, 0.3713718354701996, 0.3910868167877197, 0.4108017683029175, 0.4305167496204376, 0.45023173093795776, 0.4699467122554779, 0.48966169357299805, 0.5093766450881958, 0.5290915966033936, 0.5488065481185913, 0.5685215592384338, 0.5882365107536316, 0.6079515218734741, 0.6276664733886719, 0.6473814249038696, 0.6670963764190674, 0.6868113875389099, 0.7065263390541077, 0.7262413501739502, 0.745956301689148, 0.7656712532043457, 0.7853862643241882, 0.805101215839386, 0.8248162269592285, 0.8445311784744263, 0.864246129989624, 0.8839611411094666, 0.9036760926246643, 0.9233911037445068, 0.9431060552597046, 0.9628210067749023, 0.9825359582901001, 1.0022509098052979, 1.0219658613204956, 1.0416808128356934, 1.0613958835601807, 1.0811108350753784, 1.1008257865905762, 1.120540738105774, 1.1402556896209717, 1.159970760345459]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 14.0, 20.0, 32.0, 50.0, 51.0, 78.0, 101.0, 112.0, 89.0, 104.0, 96.0, 85.0, 55.0, 41.0, 24.0, 15.0, 13.0, 6.0, 4.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04989194869995117, -0.04710703343153, -0.04432211443781853, -0.041537195444107056, -0.03875228017568588, -0.03596736490726471, -0.03318244591355324, -0.030397528782486916, -0.027612611651420593, -0.02482769452035427, -0.02204277738928795, -0.019257860258221626, -0.016472943127155304, -0.013688025996088982, -0.01090310886502266, -0.008118191733956337, -0.005333274602890015, -0.0025483574718236923, 0.00023655965924263, 0.0030214767903089523, 0.005806393921375275, 0.008591311052441597, 0.01137622818350792, 0.014161145314574242, 0.016946062445640564, 0.019730979576706886, 0.02251589670777321, 0.02530081383883953, 0.028085730969905853, 0.030870648100972176, 0.0336555652320385, 0.03644048422574997, 0.03922539949417114, 0.042010314762592316, 0.04479523375630379, 0.04758015275001526, 0.05036506801843643, 0.053149983286857605, 0.05593490228056908, 0.05871982127428055, 0.06150473654270172, 0.0642896518111229, 0.06707456707954407, 0.06985948979854584, 0.07264440506696701, 0.07542932033538818, 0.07821424305438995, 0.08099915832281113, 0.0837840735912323, 0.08656898885965347, 0.08935390412807465, 0.09213882684707642, 0.09492374211549759, 0.09770865738391876, 0.10049358010292053, 0.1032784953713417, 0.10606341063976288, 0.10884832590818405, 0.11163324117660522, 0.114418163895607, 0.11720307916402817, 0.11998799443244934, 0.12277291715145111, 0.1255578249692917, 0.12834274768829346]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 7.0, 8.0, 8.0, 1.0, 7.0, 10.0, 16.0, 20.0, 19.0, 17.0, 40.0, 54.0, 90.0, 159.0, 324.0, 619.0, 1258.0, 2751.0, 6437.0, 20102.0, 154438.0, 787852.0, 53820.0, 12113.0, 4324.0, 1978.0, 949.0, 472.0, 219.0, 135.0, 69.0, 49.0, 47.0, 26.0, 23.0, 18.0, 16.0, 8.0, 11.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.051788330078125, -0.05018472671508789, -0.04858112335205078, -0.04697751998901367, -0.04537391662597656, -0.04377031326293945, -0.042166709899902344, -0.040563106536865234, -0.038959503173828125, -0.037355899810791016, -0.035752296447753906, -0.0341486930847168, -0.03254508972167969, -0.030941486358642578, -0.02933788299560547, -0.02773427963256836, -0.02613067626953125, -0.02452707290649414, -0.02292346954345703, -0.021319866180419922, -0.019716262817382812, -0.018112659454345703, -0.016509056091308594, -0.014905452728271484, -0.013301849365234375, -0.011698246002197266, -0.010094642639160156, -0.008491039276123047, -0.0068874359130859375, -0.005283832550048828, -0.0036802291870117188, -0.0020766258239746094, -0.0004730224609375, 0.0011305809020996094, 0.0027341842651367188, 0.004337787628173828, 0.0059413909912109375, 0.007544994354248047, 0.009148597717285156, 0.010752201080322266, 0.012355804443359375, 0.013959407806396484, 0.015563011169433594, 0.017166614532470703, 0.018770217895507812, 0.020373821258544922, 0.02197742462158203, 0.02358102798461914, 0.02518463134765625, 0.02678823471069336, 0.02839183807373047, 0.029995441436767578, 0.03159904479980469, 0.0332026481628418, 0.034806251525878906, 0.036409854888916016, 0.038013458251953125, 0.039617061614990234, 0.041220664978027344, 0.04282426834106445, 0.04442787170410156, 0.04603147506713867, 0.04763507843017578, 0.04923868179321289, 0.05084228515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 10.0, 13.0, 15.0, 37.0, 66.0, 185.0, 233.0, 219.0, 115.0, 50.0, 27.0, 14.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00316619873046875, -0.0029876232147216797, -0.0028090476989746094, -0.002630472183227539, -0.0024518966674804688, -0.0022733211517333984, -0.002094745635986328, -0.0019161701202392578, -0.0017375946044921875, -0.0015590190887451172, -0.0013804435729980469, -0.0012018680572509766, -0.0010232925415039062, -0.0008447170257568359, -0.0006661415100097656, -0.0004875659942626953, -0.000308990478515625, -0.0001304149627685547, 4.8160552978515625e-05, 0.00022673606872558594, 0.00040531158447265625, 0.0005838871002197266, 0.0007624626159667969, 0.0009410381317138672, 0.0011196136474609375, 0.0012981891632080078, 0.0014767646789550781, 0.0016553401947021484, 0.0018339157104492188, 0.002012491226196289, 0.0021910667419433594, 0.0023696422576904297, 0.0025482177734375, 0.0027267932891845703, 0.0029053688049316406, 0.003083944320678711, 0.0032625198364257812, 0.0034410953521728516, 0.003619670867919922, 0.003798246383666992, 0.0039768218994140625, 0.004155397415161133, 0.004333972930908203, 0.0045125484466552734, 0.004691123962402344, 0.004869699478149414, 0.005048274993896484, 0.005226850509643555, 0.005405426025390625, 0.005584001541137695, 0.005762577056884766, 0.005941152572631836, 0.006119728088378906, 0.0062983036041259766, 0.006476879119873047, 0.006655454635620117, 0.0068340301513671875, 0.007012605667114258, 0.007191181182861328, 0.0073697566986083984, 0.007548332214355469, 0.007726907730102539, 0.00790548324584961, 0.00808405876159668, 0.00826263427734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 11.0, 13.0, 16.0, 11.0, 17.0, 24.0, 31.0, 27.0, 44.0, 61.0, 142.0, 375.0, 2037.0, 21600.0, 834700.0, 180876.0, 7059.0, 889.0, 237.0, 80.0, 55.0, 33.0, 38.0, 21.0, 13.0, 17.0, 21.0, 11.0, 12.0, 7.0, 11.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0], "bins": [-0.08465576171875, -0.0824732780456543, -0.0802907943725586, -0.07810831069946289, -0.07592582702636719, -0.07374334335327148, -0.07156085968017578, -0.06937837600708008, -0.06719589233398438, -0.06501340866088867, -0.06283092498779297, -0.060648441314697266, -0.05846595764160156, -0.05628347396850586, -0.054100990295410156, -0.05191850662231445, -0.04973602294921875, -0.04755353927612305, -0.045371055603027344, -0.04318857192993164, -0.04100608825683594, -0.038823604583740234, -0.03664112091064453, -0.03445863723754883, -0.032276153564453125, -0.030093669891357422, -0.02791118621826172, -0.025728702545166016, -0.023546218872070312, -0.02136373519897461, -0.019181251525878906, -0.016998767852783203, -0.0148162841796875, -0.012633800506591797, -0.010451316833496094, -0.00826883316040039, -0.0060863494873046875, -0.0039038658142089844, -0.0017213821411132812, 0.0004611015319824219, 0.002643585205078125, 0.004826068878173828, 0.007008552551269531, 0.009191036224365234, 0.011373519897460938, 0.01355600357055664, 0.015738487243652344, 0.017920970916748047, 0.02010345458984375, 0.022285938262939453, 0.024468421936035156, 0.02665090560913086, 0.028833389282226562, 0.031015872955322266, 0.03319835662841797, 0.03538084030151367, 0.037563323974609375, 0.03974580764770508, 0.04192829132080078, 0.044110774993896484, 0.04629325866699219, 0.04847574234008789, 0.050658226013183594, 0.0528407096862793, 0.055023193359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 12.0, 10.0, 9.0, 14.0, 6.0, 12.0, 15.0, 19.0, 28.0, 22.0, 26.0, 28.0, 39.0, 52.0, 32.0, 42.0, 40.0, 49.0, 44.0, 52.0, 43.0, 45.0, 46.0, 45.0, 37.0, 28.0, 26.0, 24.0, 24.0, 21.0, 23.0, 18.0, 9.0, 9.0, 12.0, 7.0, 10.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0099945068359375, -0.00970447063446045, -0.009414434432983398, -0.009124398231506348, -0.008834362030029297, -0.008544325828552246, -0.008254289627075195, -0.007964253425598145, -0.007674217224121094, -0.007384181022644043, -0.007094144821166992, -0.006804108619689941, -0.006514072418212891, -0.00622403621673584, -0.005934000015258789, -0.005643963813781738, -0.0053539276123046875, -0.005063891410827637, -0.004773855209350586, -0.004483819007873535, -0.004193782806396484, -0.0039037466049194336, -0.003613710403442383, -0.003323674201965332, -0.0030336380004882812, -0.0027436017990112305, -0.0024535655975341797, -0.002163529396057129, -0.0018734931945800781, -0.0015834569931030273, -0.0012934207916259766, -0.0010033845901489258, -0.000713348388671875, -0.0004233121871948242, -0.00013327598571777344, 0.00015676021575927734, 0.0004467964172363281, 0.0007368326187133789, 0.0010268688201904297, 0.0013169050216674805, 0.0016069412231445312, 0.001896977424621582, 0.002187013626098633, 0.0024770498275756836, 0.0027670860290527344, 0.003057122230529785, 0.003347158432006836, 0.0036371946334838867, 0.0039272308349609375, 0.004217267036437988, 0.004507303237915039, 0.00479733943939209, 0.005087375640869141, 0.005377411842346191, 0.005667448043823242, 0.005957484245300293, 0.006247520446777344, 0.0065375566482543945, 0.006827592849731445, 0.007117629051208496, 0.007407665252685547, 0.007697701454162598, 0.007987737655639648, 0.0082777738571167, 0.00856781005859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 8.0, 7.0, 6.0, 7.0, 9.0, 13.0, 16.0, 17.0, 37.0, 132.0, 753.0, 17768.0, 1024926.0, 4220.0, 405.0, 100.0, 27.0, 14.0, 16.0, 10.0, 8.0, 6.0, 13.0, 6.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.240966796875, -0.2337360382080078, -0.22650527954101562, -0.21927452087402344, -0.21204376220703125, -0.20481300354003906, -0.19758224487304688, -0.1903514862060547, -0.1831207275390625, -0.1758899688720703, -0.16865921020507812, -0.16142845153808594, -0.15419769287109375, -0.14696693420410156, -0.13973617553710938, -0.1325054168701172, -0.125274658203125, -0.11804389953613281, -0.11081314086914062, -0.10358238220214844, -0.09635162353515625, -0.08912086486816406, -0.08189010620117188, -0.07465934753417969, -0.0674285888671875, -0.06019783020019531, -0.052967071533203125, -0.04573631286621094, -0.03850555419921875, -0.03127479553222656, -0.024044036865234375, -0.016813278198242188, -0.00958251953125, -0.0023517608642578125, 0.004878997802734375, 0.012109756469726562, 0.01934051513671875, 0.026571273803710938, 0.033802032470703125, 0.04103279113769531, 0.0482635498046875, 0.05549430847167969, 0.06272506713867188, 0.06995582580566406, 0.07718658447265625, 0.08441734313964844, 0.09164810180664062, 0.09887886047363281, 0.106109619140625, 0.11334037780761719, 0.12057113647460938, 0.12780189514160156, 0.13503265380859375, 0.14226341247558594, 0.14949417114257812, 0.1567249298095703, 0.1639556884765625, 0.1711864471435547, 0.17841720581054688, 0.18564796447753906, 0.19287872314453125, 0.20010948181152344, 0.20734024047851562, 0.2145709991455078, 0.2218017578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 11.0, 12.0, 8.0, 9.0, 14.0, 25.0, 16.0, 22.0, 25.0, 375.0, 370.0, 22.0, 15.0, 17.0, 7.0, 7.0, 3.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014333724975585938, -0.0013839006423950195, -0.0013344287872314453, -0.001284956932067871, -0.0012354850769042969, -0.0011860132217407227, -0.0011365413665771484, -0.0010870695114135742, -0.00103759765625, -0.0009881258010864258, -0.0009386539459228516, -0.0008891820907592773, -0.0008397102355957031, -0.0007902383804321289, -0.0007407665252685547, -0.0006912946701049805, -0.0006418228149414062, -0.000592350959777832, -0.0005428791046142578, -0.0004934072494506836, -0.0004439353942871094, -0.00039446353912353516, -0.00034499168395996094, -0.0002955198287963867, -0.0002460479736328125, -0.00019657611846923828, -0.00014710426330566406, -9.763240814208984e-05, -4.8160552978515625e-05, 1.3113021850585938e-06, 5.078315734863281e-05, 0.00010025501251220703, 0.00014972686767578125, 0.00019919872283935547, 0.0002486705780029297, 0.0002981424331665039, 0.0003476142883300781, 0.00039708614349365234, 0.00044655799865722656, 0.0004960298538208008, 0.000545501708984375, 0.0005949735641479492, 0.0006444454193115234, 0.0006939172744750977, 0.0007433891296386719, 0.0007928609848022461, 0.0008423328399658203, 0.0008918046951293945, 0.0009412765502929688, 0.000990748405456543, 0.0010402202606201172, 0.0010896921157836914, 0.0011391639709472656, 0.0011886358261108398, 0.001238107681274414, 0.0012875795364379883, 0.0013370513916015625, 0.0013865232467651367, 0.001435995101928711, 0.0014854669570922852, 0.0015349388122558594, 0.0015844106674194336, 0.0016338825225830078, 0.001683354377746582, 0.0017328262329101562]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 11.0, 10.0, 25.0, 52.0, 139.0, 389.0, 1713.0, 40684.0, 995399.0, 8742.0, 916.0, 247.0, 112.0, 45.0, 23.0, 11.0, 12.0, 6.0, 3.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1424560546875, -0.1379070281982422, -0.13335800170898438, -0.12880897521972656, -0.12425994873046875, -0.11971092224121094, -0.11516189575195312, -0.11061286926269531, -0.1060638427734375, -0.10151481628417969, -0.09696578979492188, -0.09241676330566406, -0.08786773681640625, -0.08331871032714844, -0.07876968383789062, -0.07422065734863281, -0.069671630859375, -0.06512260437011719, -0.060573577880859375, -0.05602455139160156, -0.05147552490234375, -0.04692649841308594, -0.042377471923828125, -0.03782844543457031, -0.0332794189453125, -0.028730392456054688, -0.024181365966796875, -0.019632339477539062, -0.01508331298828125, -0.010534286499023438, -0.005985260009765625, -0.0014362335205078125, 0.00311279296875, 0.0076618194580078125, 0.012210845947265625, 0.016759872436523438, 0.02130889892578125, 0.025857925415039062, 0.030406951904296875, 0.03495597839355469, 0.0395050048828125, 0.04405403137207031, 0.048603057861328125, 0.05315208435058594, 0.05770111083984375, 0.06225013732910156, 0.06679916381835938, 0.07134819030761719, 0.075897216796875, 0.08044624328613281, 0.08499526977539062, 0.08954429626464844, 0.09409332275390625, 0.09864234924316406, 0.10319137573242188, 0.10774040222167969, 0.1122894287109375, 0.11683845520019531, 0.12138748168945312, 0.12593650817871094, 0.13048553466796875, 0.13503456115722656, 0.13958358764648438, 0.1441326141357422, 0.148681640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 7.0, 18.0, 22.0, 20.0, 43.0, 53.0, 90.0, 277.0, 197.0, 79.0, 62.0, 41.0, 26.0, 18.0, 13.0, 10.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024139404296875, -0.023126602172851562, -0.022113800048828125, -0.021100997924804688, -0.02008819580078125, -0.019075393676757812, -0.018062591552734375, -0.017049789428710938, -0.0160369873046875, -0.015024185180664062, -0.014011383056640625, -0.012998580932617188, -0.01198577880859375, -0.010972976684570312, -0.009960174560546875, -0.008947372436523438, -0.0079345703125, -0.0069217681884765625, -0.005908966064453125, -0.0048961639404296875, -0.00388336181640625, -0.0028705596923828125, -0.001857757568359375, -0.0008449554443359375, 0.0001678466796875, 0.0011806488037109375, 0.002193450927734375, 0.0032062530517578125, 0.00421905517578125, 0.0052318572998046875, 0.006244659423828125, 0.0072574615478515625, 0.008270263671875, 0.009283065795898438, 0.010295867919921875, 0.011308670043945312, 0.01232147216796875, 0.013334274291992188, 0.014347076416015625, 0.015359878540039062, 0.0163726806640625, 0.017385482788085938, 0.018398284912109375, 0.019411087036132812, 0.02042388916015625, 0.021436691284179688, 0.022449493408203125, 0.023462295532226562, 0.02447509765625, 0.025487899780273438, 0.026500701904296875, 0.027513504028320312, 0.02852630615234375, 0.029539108276367188, 0.030551910400390625, 0.03156471252441406, 0.0325775146484375, 0.03359031677246094, 0.034603118896484375, 0.03561592102050781, 0.03662872314453125, 0.03764152526855469, 0.038654327392578125, 0.03966712951660156, 0.040679931640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 34.0, 401.0, 507.0, 47.0, 12.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6720820069313049, -0.6529055833816528, -0.633729100227356, -0.6145526766777039, -0.595376193523407, -0.5761997699737549, -0.557023286819458, -0.5378468632698059, -0.5186704397201538, -0.4994939863681793, -0.48031753301620483, -0.46114107966423035, -0.44196462631225586, -0.42278820276260376, -0.4036117494106293, -0.3844352960586548, -0.3652588129043579, -0.3460823595523834, -0.32690590620040894, -0.30772945284843445, -0.28855299949645996, -0.26937657594680786, -0.2502001225948334, -0.2310236692428589, -0.2118472158908844, -0.1926707625389099, -0.17349430918693542, -0.15431787073612213, -0.13514141738414764, -0.11596496403217316, -0.09678851813077927, -0.07761207222938538, -0.05843555927276611, -0.039259109646081924, -0.020082660019397736, -0.0009062103927135468, 0.018270239233970642, 0.03744669258594513, 0.05662313848733902, 0.07579958438873291, 0.0949760377407074, 0.11415249109268188, 0.13332894444465637, 0.15250538289546967, 0.17168183624744415, 0.19085828959941864, 0.21003472805023193, 0.22921118140220642, 0.2483876347541809, 0.2675640881061554, 0.2867405414581299, 0.30591699481010437, 0.32509344816207886, 0.34426987171173096, 0.36344632506370544, 0.38262277841567993, 0.4017992317676544, 0.4209756851196289, 0.4401521384716034, 0.4593285918235779, 0.47850501537323, 0.49768149852752686, 0.516857922077179, 0.536034345626831, 0.5552108287811279]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 10.0, 13.0, 15.0, 32.0, 34.0, 51.0, 53.0, 63.0, 82.0, 97.0, 68.0, 89.0, 73.0, 56.0, 53.0, 50.0, 42.0, 22.0, 21.0, 17.0, 13.0, 9.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09995931386947632, -0.09662645310163498, -0.09329359233379364, -0.0899607315659523, -0.08662787079811096, -0.08329501003026962, -0.07996214926242828, -0.07662928849458694, -0.0732964277267456, -0.06996356695890427, -0.06663070619106293, -0.06329784542322159, -0.05996498465538025, -0.05663212388753891, -0.05329926311969757, -0.04996640235185623, -0.04663354158401489, -0.04330068081617355, -0.039967820048332214, -0.036634959280490875, -0.033302098512649536, -0.029969237744808197, -0.026636376976966858, -0.02330351620912552, -0.01997065544128418, -0.01663779467344284, -0.013304933905601501, -0.009972073137760162, -0.006639212369918823, -0.003306351602077484, 2.650916576385498e-05, 0.003359369933605194, 0.006692230701446533, 0.010025091469287872, 0.013357952237129211, 0.01669081300497055, 0.02002367377281189, 0.02335653454065323, 0.026689395308494568, 0.030022256076335907, 0.033355116844177246, 0.036687977612018585, 0.040020838379859924, 0.04335369914770126, 0.0466865599155426, 0.05001942068338394, 0.05335228145122528, 0.05668514221906662, 0.06001800298690796, 0.0633508637547493, 0.06668372452259064, 0.07001658529043198, 0.07334944605827332, 0.07668230682611465, 0.080015167593956, 0.08334802836179733, 0.08668088912963867, 0.09001374989748001, 0.09334661066532135, 0.09667947143316269, 0.10001233220100403, 0.10334519296884537, 0.1066780537366867, 0.11001091450452805, 0.11334377527236938]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 2.0, 4.0, 2.0, 8.0, 10.0, 8.0, 16.0, 8.0, 16.0, 20.0, 12.0, 22.0, 32.0, 39.0, 193.0, 4191515.0, 2010.0, 160.0, 28.0, 28.0, 25.0, 18.0, 20.0, 6.0, 6.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 6.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.6142578125, -1.570343017578125, -1.52642822265625, -1.482513427734375, -1.4385986328125, -1.394683837890625, -1.35076904296875, -1.306854248046875, -1.262939453125, -1.219024658203125, -1.17510986328125, -1.131195068359375, -1.0872802734375, -1.043365478515625, -0.99945068359375, -0.955535888671875, -0.91162109375, -0.867706298828125, -0.82379150390625, -0.779876708984375, -0.7359619140625, -0.692047119140625, -0.64813232421875, -0.604217529296875, -0.560302734375, -0.516387939453125, -0.47247314453125, -0.428558349609375, -0.3846435546875, -0.340728759765625, -0.29681396484375, -0.252899169921875, -0.208984375, -0.165069580078125, -0.12115478515625, -0.077239990234375, -0.0333251953125, 0.010589599609375, 0.05450439453125, 0.098419189453125, 0.142333984375, 0.186248779296875, 0.23016357421875, 0.274078369140625, 0.3179931640625, 0.361907958984375, 0.40582275390625, 0.449737548828125, 0.49365234375, 0.537567138671875, 0.58148193359375, 0.625396728515625, 0.6693115234375, 0.713226318359375, 0.75714111328125, 0.801055908203125, 0.844970703125, 0.888885498046875, 0.93280029296875, 0.976715087890625, 1.0206298828125, 1.064544677734375, 1.10845947265625, 1.152374267578125, 1.1962890625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 13.0, 18.0, 30.0, 62.0, 112.0, 163.0, 176.0, 158.0, 96.0, 79.0, 30.0, 17.0, 17.0, 11.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003265380859375, -0.003126859664916992, -0.0029883384704589844, -0.0028498172760009766, -0.0027112960815429688, -0.002572774887084961, -0.002434253692626953, -0.0022957324981689453, -0.0021572113037109375, -0.0020186901092529297, -0.0018801689147949219, -0.001741647720336914, -0.0016031265258789062, -0.0014646053314208984, -0.0013260841369628906, -0.0011875629425048828, -0.001049041748046875, -0.0009105205535888672, -0.0007719993591308594, -0.0006334781646728516, -0.0004949569702148438, -0.00035643577575683594, -0.00021791458129882812, -7.939338684082031e-05, 5.91278076171875e-05, 0.0001976490020751953, 0.0003361701965332031, 0.00047469139099121094, 0.0006132125854492188, 0.0007517337799072266, 0.0008902549743652344, 0.0010287761688232422, 0.00116729736328125, 0.0013058185577392578, 0.0014443397521972656, 0.0015828609466552734, 0.0017213821411132812, 0.001859903335571289, 0.001998424530029297, 0.0021369457244873047, 0.0022754669189453125, 0.0024139881134033203, 0.002552509307861328, 0.002691030502319336, 0.0028295516967773438, 0.0029680728912353516, 0.0031065940856933594, 0.003245115280151367, 0.003383636474609375, 0.003522157669067383, 0.0036606788635253906, 0.0037992000579833984, 0.003937721252441406, 0.004076242446899414, 0.004214763641357422, 0.00435328483581543, 0.0044918060302734375, 0.004630327224731445, 0.004768848419189453, 0.004907369613647461, 0.005045890808105469, 0.0051844120025634766, 0.005322933197021484, 0.005461454391479492, 0.0055999755859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 9.0, 9.0, 12.0, 21.0, 23.0, 45.0, 81.0, 180.0, 1503.0, 4186945.0, 4973.0, 245.0, 87.0, 68.0, 25.0, 22.0, 9.0, 9.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6930961608886719, -0.6772079467773438, -0.6613197326660156, -0.6454315185546875, -0.6295433044433594, -0.6136550903320312, -0.5977668762207031, -0.581878662109375, -0.5659904479980469, -0.5501022338867188, -0.5342140197753906, -0.5183258056640625, -0.5024375915527344, -0.48654937744140625, -0.4706611633300781, -0.45477294921875, -0.4388847351074219, -0.42299652099609375, -0.4071083068847656, -0.3912200927734375, -0.3753318786621094, -0.35944366455078125, -0.3435554504394531, -0.327667236328125, -0.3117790222167969, -0.29589080810546875, -0.2800025939941406, -0.2641143798828125, -0.24822616577148438, -0.23233795166015625, -0.21644973754882812, -0.2005615234375, -0.18467330932617188, -0.16878509521484375, -0.15289688110351562, -0.1370086669921875, -0.12112045288085938, -0.10523223876953125, -0.08934402465820312, -0.073455810546875, -0.057567596435546875, -0.04167938232421875, -0.025791168212890625, -0.0099029541015625, 0.005985260009765625, 0.02187347412109375, 0.037761688232421875, 0.05364990234375, 0.06953811645507812, 0.08542633056640625, 0.10131454467773438, 0.1172027587890625, 0.13309097290039062, 0.14897918701171875, 0.16486740112304688, 0.180755615234375, 0.19664382934570312, 0.21253204345703125, 0.22842025756835938, 0.2443084716796875, 0.2601966857910156, 0.27608489990234375, 0.2919731140136719, 0.307861328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 12.0, 14.0, 14.0, 30.0, 38.0, 57.0, 139.0, 357.0, 2333.0, 648.0, 189.0, 94.0, 42.0, 27.0, 15.0, 23.0, 7.0, 10.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00911712646484375, -0.008854448795318604, -0.008591771125793457, -0.00832909345626831, -0.008066415786743164, -0.007803738117218018, -0.007541060447692871, -0.007278382778167725, -0.007015705108642578, -0.006753027439117432, -0.006490349769592285, -0.006227672100067139, -0.005964994430541992, -0.005702316761016846, -0.005439639091491699, -0.005176961421966553, -0.004914283752441406, -0.00465160608291626, -0.004388928413391113, -0.004126250743865967, -0.0038635730743408203, -0.003600895404815674, -0.0033382177352905273, -0.003075540065765381, -0.0028128623962402344, -0.002550184726715088, -0.0022875070571899414, -0.002024829387664795, -0.0017621517181396484, -0.001499474048614502, -0.0012367963790893555, -0.000974118709564209, -0.0007114410400390625, -0.000448763370513916, -0.00018608570098876953, 7.659196853637695e-05, 0.00033926963806152344, 0.0006019473075866699, 0.0008646249771118164, 0.0011273026466369629, 0.0013899803161621094, 0.0016526579856872559, 0.0019153356552124023, 0.002178013324737549, 0.0024406909942626953, 0.002703368663787842, 0.0029660463333129883, 0.0032287240028381348, 0.0034914016723632812, 0.0037540793418884277, 0.004016757011413574, 0.004279434680938721, 0.004542112350463867, 0.004804790019989014, 0.00506746768951416, 0.005330145359039307, 0.005592823028564453, 0.0058555006980896, 0.006118178367614746, 0.006380856037139893, 0.006643533706665039, 0.0069062113761901855, 0.007168889045715332, 0.0074315667152404785, 0.007694244384765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1008.0, 7.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7073004245758057, -1.6781212091445923, -1.648941993713379, -1.619762659072876, -1.5905834436416626, -1.5614042282104492, -1.5322248935699463, -1.503045678138733, -1.4738664627075195, -1.4446872472763062, -1.4155080318450928, -1.3863286972045898, -1.3571494817733765, -1.327970266342163, -1.2987909317016602, -1.2696117162704468, -1.2404325008392334, -1.21125328540802, -1.1820740699768066, -1.1528947353363037, -1.1237155199050903, -1.094536304473877, -1.065356969833374, -1.0361777544021606, -1.0069985389709473, -0.9778193235397339, -0.9486400485038757, -0.9194607734680176, -0.8902815580368042, -0.8611023426055908, -0.8319230675697327, -0.8027437925338745, -0.7735645174980164, -0.7443852424621582, -0.7152060270309448, -0.6860268115997314, -0.6568475365638733, -0.6276682615280151, -0.5984890460968018, -0.5693098306655884, -0.5401305556297302, -0.5109512805938721, -0.4817720651626587, -0.4525928199291229, -0.42341357469558716, -0.3942343294620514, -0.3650550842285156, -0.33587583899497986, -0.3066965937614441, -0.2775173485279083, -0.24833810329437256, -0.2191588580608368, -0.18997961282730103, -0.16080036759376526, -0.1316211223602295, -0.10244187712669373, -0.07326263189315796, -0.04408338665962219, -0.014904141426086426, 0.01427510380744934, 0.04345434904098511, 0.07263359427452087, 0.10181283950805664, 0.1309920847415924, 0.16017132997512817]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 11.0, 24.0, 28.0, 48.0, 77.0, 86.0, 122.0, 116.0, 118.0, 121.0, 83.0, 60.0, 37.0, 29.0, 13.0, 9.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0659530758857727, -0.06450649350881577, -0.06305990368127823, -0.06161332130432129, -0.06016673520207405, -0.05872014909982681, -0.05727356672286987, -0.055826980620622635, -0.0543803945183754, -0.05293380841612816, -0.05148722231388092, -0.05004063993692398, -0.04859405383467674, -0.047147467732429504, -0.045700885355472565, -0.04425429925322533, -0.04280771315097809, -0.04136112704873085, -0.03991454094648361, -0.03846795856952667, -0.037021372467279434, -0.035574786365032196, -0.034128203988075256, -0.03268161788582802, -0.03123503178358078, -0.029788445681333542, -0.028341861441731453, -0.026895277202129364, -0.025448691099882126, -0.024002104997634888, -0.0225555207580328, -0.02110893651843071, -0.01966235041618347, -0.018215764313936234, -0.016769180074334145, -0.015322594903409481, -0.013876009732484818, -0.012429424561560154, -0.01098283939063549, -0.009536254219710827, -0.008089669048786163, -0.0066430838778615, -0.005196498706936836, -0.0037499135360121727, -0.002303328365087509, -0.0008567431941628456, 0.0005898419767618179, 0.0020364271476864815, 0.003483012318611145, 0.0049295974895358086, 0.006376182660460472, 0.007822767831385136, 0.0092693530023098, 0.010715938173234463, 0.012162523344159126, 0.01360910851508379, 0.015055693686008453, 0.01650227978825569, 0.01794886402785778, 0.01939544826745987, 0.020842034369707108, 0.022288620471954346, 0.023735204711556435, 0.025181788951158524, 0.02662837505340576]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 7.0, 13.0, 5.0, 11.0, 8.0, 16.0, 21.0, 36.0, 33.0, 49.0, 55.0, 94.0, 308.0, 4936.0, 877870.0, 162880.0, 1689.0, 183.0, 67.0, 57.0, 44.0, 41.0, 24.0, 16.0, 17.0, 12.0, 10.0, 5.0, 6.0, 4.0, 11.0, 2.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11590576171875, -0.112579345703125, -0.1092529296875, -0.105926513671875, -0.10260009765625, -0.099273681640625, -0.095947265625, -0.092620849609375, -0.08929443359375, -0.085968017578125, -0.0826416015625, -0.079315185546875, -0.07598876953125, -0.072662353515625, -0.0693359375, -0.066009521484375, -0.06268310546875, -0.059356689453125, -0.0560302734375, -0.052703857421875, -0.04937744140625, -0.046051025390625, -0.042724609375, -0.039398193359375, -0.03607177734375, -0.032745361328125, -0.0294189453125, -0.026092529296875, -0.02276611328125, -0.019439697265625, -0.01611328125, -0.012786865234375, -0.00946044921875, -0.006134033203125, -0.0028076171875, 0.000518798828125, 0.00384521484375, 0.007171630859375, 0.010498046875, 0.013824462890625, 0.01715087890625, 0.020477294921875, 0.0238037109375, 0.027130126953125, 0.03045654296875, 0.033782958984375, 0.037109375, 0.040435791015625, 0.04376220703125, 0.047088623046875, 0.0504150390625, 0.053741455078125, 0.05706787109375, 0.060394287109375, 0.063720703125, 0.067047119140625, 0.07037353515625, 0.073699951171875, 0.0770263671875, 0.080352783203125, 0.08367919921875, 0.087005615234375, 0.09033203125, 0.093658447265625, 0.09698486328125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 4.0, 6.0, 20.0, 42.0, 58.0, 108.0, 163.0, 168.0, 134.0, 119.0, 83.0, 61.0, 21.0, 11.0, 9.0, 2.0, 1.0, 1.0], "bins": [-0.0087890625, -0.008625015616416931, -0.008460968732833862, -0.008296921849250793, -0.008132874965667725, -0.007968828082084656, -0.007804781198501587, -0.007640734314918518, -0.007476687431335449, -0.00731264054775238, -0.0071485936641693115, -0.006984546780586243, -0.006820499897003174, -0.006656453013420105, -0.006492406129837036, -0.006328359246253967, -0.0061643123626708984, -0.00600026547908783, -0.005836218595504761, -0.005672171711921692, -0.005508124828338623, -0.005344077944755554, -0.005180031061172485, -0.0050159841775894165, -0.004851937294006348, -0.004687890410423279, -0.00452384352684021, -0.004359796643257141, -0.004195749759674072, -0.004031702876091003, -0.0038676559925079346, -0.0037036091089248657, -0.003539562225341797, -0.003375515341758728, -0.003211468458175659, -0.0030474215745925903, -0.0028833746910095215, -0.0027193278074264526, -0.002555280923843384, -0.002391234040260315, -0.002227187156677246, -0.0020631402730941772, -0.0018990933895111084, -0.0017350465059280396, -0.0015709996223449707, -0.0014069527387619019, -0.001242905855178833, -0.0010788589715957642, -0.0009148120880126953, -0.0007507652044296265, -0.0005867183208465576, -0.00042267143726348877, -0.0002586245536804199, -9.457767009735107e-05, 6.946921348571777e-05, 0.00023351609706878662, 0.00039756298065185547, 0.0005616098642349243, 0.0007256567478179932, 0.000889703631401062, 0.0010537505149841309, 0.0012177973985671997, 0.0013818442821502686, 0.0015458911657333374, 0.0017099380493164062]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 14.0, 19.0, 25.0, 37.0, 43.0, 68.0, 109.0, 170.0, 354.0, 865.0, 3749.0, 32256.0, 622783.0, 364585.0, 19291.0, 2639.0, 739.0, 326.0, 159.0, 100.0, 60.0, 47.0, 41.0, 20.0, 11.0, 9.0, 5.0, 12.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05609130859375, -0.054483890533447266, -0.05287647247314453, -0.0512690544128418, -0.04966163635253906, -0.04805421829223633, -0.046446800231933594, -0.04483938217163086, -0.043231964111328125, -0.04162454605102539, -0.040017127990722656, -0.03840970993041992, -0.03680229187011719, -0.03519487380981445, -0.03358745574951172, -0.031980037689208984, -0.03037261962890625, -0.028765201568603516, -0.02715778350830078, -0.025550365447998047, -0.023942947387695312, -0.022335529327392578, -0.020728111267089844, -0.01912069320678711, -0.017513275146484375, -0.01590585708618164, -0.014298439025878906, -0.012691020965576172, -0.011083602905273438, -0.009476184844970703, -0.007868766784667969, -0.006261348724365234, -0.0046539306640625, -0.0030465126037597656, -0.0014390945434570312, 0.00016832351684570312, 0.0017757415771484375, 0.003383159637451172, 0.004990577697753906, 0.006597995758056641, 0.008205413818359375, 0.00981283187866211, 0.011420249938964844, 0.013027667999267578, 0.014635086059570312, 0.016242504119873047, 0.01784992218017578, 0.019457340240478516, 0.02106475830078125, 0.022672176361083984, 0.02427959442138672, 0.025887012481689453, 0.027494430541992188, 0.029101848602294922, 0.030709266662597656, 0.03231668472290039, 0.033924102783203125, 0.03553152084350586, 0.037138938903808594, 0.03874635696411133, 0.04035377502441406, 0.0419611930847168, 0.04356861114501953, 0.045176029205322266, 0.046783447265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 12.0, 10.0, 15.0, 12.0, 23.0, 18.0, 22.0, 29.0, 45.0, 44.0, 51.0, 42.0, 61.0, 60.0, 49.0, 49.0, 54.0, 53.0, 60.0, 41.0, 38.0, 42.0, 37.0, 23.0, 20.0, 18.0, 16.0, 10.0, 12.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01183319091796875, -0.011432647705078125, -0.0110321044921875, -0.010631561279296875, -0.01023101806640625, -0.009830474853515625, -0.009429931640625, -0.009029388427734375, -0.00862884521484375, -0.008228302001953125, -0.0078277587890625, -0.007427215576171875, -0.00702667236328125, -0.006626129150390625, -0.0062255859375, -0.005825042724609375, -0.00542449951171875, -0.005023956298828125, -0.0046234130859375, -0.004222869873046875, -0.00382232666015625, -0.003421783447265625, -0.003021240234375, -0.002620697021484375, -0.00222015380859375, -0.001819610595703125, -0.0014190673828125, -0.001018524169921875, -0.00061798095703125, -0.000217437744140625, 0.00018310546875, 0.000583648681640625, 0.00098419189453125, 0.001384735107421875, 0.0017852783203125, 0.002185821533203125, 0.00258636474609375, 0.002986907958984375, 0.003387451171875, 0.003787994384765625, 0.00418853759765625, 0.004589080810546875, 0.0049896240234375, 0.005390167236328125, 0.00579071044921875, 0.006191253662109375, 0.006591796875, 0.006992340087890625, 0.00739288330078125, 0.007793426513671875, 0.0081939697265625, 0.008594512939453125, 0.00899505615234375, 0.009395599365234375, 0.009796142578125, 0.010196685791015625, 0.01059722900390625, 0.010997772216796875, 0.0113983154296875, 0.011798858642578125, 0.01219940185546875, 0.012599945068359375, 0.01300048828125, 0.013401031494140625, 0.01380157470703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 6.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 2.0, 10.0, 3.0, 14.0, 12.0, 15.0, 32.0, 22.0, 56.0, 49.0, 98.0, 169.0, 422.0, 1398.0, 6717.0, 155580.0, 864845.0, 15430.0, 2303.0, 707.0, 264.0, 118.0, 73.0, 53.0, 34.0, 29.0, 14.0, 11.0, 13.0, 6.0, 6.0, 2.0, 9.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0], "bins": [-0.08447265625, -0.08207225799560547, -0.07967185974121094, -0.0772714614868164, -0.07487106323242188, -0.07247066497802734, -0.07007026672363281, -0.06766986846923828, -0.06526947021484375, -0.06286907196044922, -0.06046867370605469, -0.058068275451660156, -0.055667877197265625, -0.053267478942871094, -0.05086708068847656, -0.04846668243408203, -0.0460662841796875, -0.04366588592529297, -0.04126548767089844, -0.038865089416503906, -0.036464691162109375, -0.034064292907714844, -0.03166389465332031, -0.02926349639892578, -0.02686309814453125, -0.02446269989013672, -0.022062301635742188, -0.019661903381347656, -0.017261505126953125, -0.014861106872558594, -0.012460708618164062, -0.010060310363769531, -0.007659912109375, -0.005259513854980469, -0.0028591156005859375, -0.00045871734619140625, 0.001941680908203125, 0.004342079162597656, 0.0067424774169921875, 0.009142875671386719, 0.01154327392578125, 0.013943672180175781, 0.016344070434570312, 0.018744468688964844, 0.021144866943359375, 0.023545265197753906, 0.025945663452148438, 0.02834606170654297, 0.0307464599609375, 0.03314685821533203, 0.03554725646972656, 0.037947654724121094, 0.040348052978515625, 0.042748451232910156, 0.04514884948730469, 0.04754924774169922, 0.04994964599609375, 0.05235004425048828, 0.05475044250488281, 0.057150840759277344, 0.059551239013671875, 0.061951637268066406, 0.06435203552246094, 0.06675243377685547, 0.06915283203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 7.0, 18.0, 23.0, 46.0, 102.0, 169.0, 261.0, 157.0, 90.0, 40.0, 22.0, 20.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.0002363733947277069, -0.00022860616445541382, -0.00022083893418312073, -0.00021307170391082764, -0.00020530447363853455, -0.00019753724336624146, -0.00018977001309394836, -0.00018200278282165527, -0.00017423555254936218, -0.0001664683222770691, -0.000158701092004776, -0.0001509338617324829, -0.00014316663146018982, -0.00013539940118789673, -0.00012763217091560364, -0.00011986494064331055, -0.00011209771037101746, -0.00010433048009872437, -9.656324982643127e-05, -8.879601955413818e-05, -8.102878928184509e-05, -7.3261559009552e-05, -6.549432873725891e-05, -5.772709846496582e-05, -4.995986819267273e-05, -4.219263792037964e-05, -3.442540764808655e-05, -2.6658177375793457e-05, -1.8890947103500366e-05, -1.1123716831207275e-05, -3.3564865589141846e-06, 4.410743713378906e-06, 1.2177973985671997e-05, 1.9945204257965088e-05, 2.771243453025818e-05, 3.547966480255127e-05, 4.324689507484436e-05, 5.101412534713745e-05, 5.878135561943054e-05, 6.654858589172363e-05, 7.431581616401672e-05, 8.208304643630981e-05, 8.98502767086029e-05, 9.7617506980896e-05, 0.00010538473725318909, 0.00011315196752548218, 0.00012091919779777527, 0.00012868642807006836, 0.00013645365834236145, 0.00014422088861465454, 0.00015198811888694763, 0.00015975534915924072, 0.0001675225794315338, 0.0001752898097038269, 0.00018305703997612, 0.00019082427024841309, 0.00019859150052070618, 0.00020635873079299927, 0.00021412596106529236, 0.00022189319133758545, 0.00022966042160987854, 0.00023742765188217163, 0.0002451948821544647, 0.0002529621124267578]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 15.0, 16.0, 36.0, 86.0, 132.0, 362.0, 1471.0, 17505.0, 1020543.0, 6981.0, 910.0, 245.0, 112.0, 56.0, 23.0, 15.0, 12.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.30277252197265625, -0.2928009033203125, -0.28282928466796875, -0.272857666015625, -0.26288604736328125, -0.2529144287109375, -0.24294281005859375, -0.23297119140625, -0.22299957275390625, -0.2130279541015625, -0.20305633544921875, -0.193084716796875, -0.18311309814453125, -0.1731414794921875, -0.16316986083984375, -0.1531982421875, -0.14322662353515625, -0.1332550048828125, -0.12328338623046875, -0.113311767578125, -0.10334014892578125, -0.0933685302734375, -0.08339691162109375, -0.07342529296875, -0.06345367431640625, -0.0534820556640625, -0.04351043701171875, -0.033538818359375, -0.02356719970703125, -0.0135955810546875, -0.00362396240234375, 0.00634765625, 0.01631927490234375, 0.0262908935546875, 0.03626251220703125, 0.046234130859375, 0.05620574951171875, 0.0661773681640625, 0.07614898681640625, 0.08612060546875, 0.09609222412109375, 0.1060638427734375, 0.11603546142578125, 0.126007080078125, 0.13597869873046875, 0.1459503173828125, 0.15592193603515625, 0.1658935546875, 0.17586517333984375, 0.1858367919921875, 0.19580841064453125, 0.205780029296875, 0.21575164794921875, 0.2257232666015625, 0.23569488525390625, 0.24566650390625, 0.25563812255859375, 0.2656097412109375, 0.27558135986328125, 0.285552978515625, 0.29552459716796875, 0.3054962158203125, 0.31546783447265625, 0.325439453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 47.0, 161.0, 384.0, 236.0, 64.0, 30.0, 13.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.09503173828125, -0.09290504455566406, -0.09077835083007812, -0.08865165710449219, -0.08652496337890625, -0.08439826965332031, -0.08227157592773438, -0.08014488220214844, -0.0780181884765625, -0.07589149475097656, -0.07376480102539062, -0.07163810729980469, -0.06951141357421875, -0.06738471984863281, -0.06525802612304688, -0.06313133239746094, -0.061004638671875, -0.05887794494628906, -0.056751251220703125, -0.05462455749511719, -0.05249786376953125, -0.05037117004394531, -0.048244476318359375, -0.04611778259277344, -0.0439910888671875, -0.04186439514160156, -0.039737701416015625, -0.03761100769042969, -0.03548431396484375, -0.03335762023925781, -0.031230926513671875, -0.029104232788085938, -0.0269775390625, -0.024850845336914062, -0.022724151611328125, -0.020597457885742188, -0.01847076416015625, -0.016344070434570312, -0.014217376708984375, -0.012090682983398438, -0.0099639892578125, -0.007837295532226562, -0.005710601806640625, -0.0035839080810546875, -0.00145721435546875, 0.0006694793701171875, 0.002796173095703125, 0.0049228668212890625, 0.007049560546875, 0.009176254272460938, 0.011302947998046875, 0.013429641723632812, 0.01555633544921875, 0.017683029174804688, 0.019809722900390625, 0.021936416625976562, 0.0240631103515625, 0.026189804077148438, 0.028316497802734375, 0.030443191528320312, 0.03256988525390625, 0.03469657897949219, 0.036823272705078125, 0.03894996643066406, 0.04107666015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 929.0, 57.0, 1.0, 2.0, 2.0], "bins": [-4.054222583770752, -3.986128091812134, -3.9180335998535156, -3.8499391078948975, -3.7818446159362793, -3.713750123977661, -3.645655632019043, -3.577561140060425, -3.5094666481018066, -3.4413721561431885, -3.3732776641845703, -3.305183172225952, -3.237088680267334, -3.168994188308716, -3.1008996963500977, -3.0328052043914795, -2.9647107124328613, -2.896616220474243, -2.828521728515625, -2.760427236557007, -2.6923327445983887, -2.6242382526397705, -2.5561437606811523, -2.488049268722534, -2.419954776763916, -2.351860284805298, -2.2837657928466797, -2.2156713008880615, -2.1475768089294434, -2.079482316970825, -2.011387825012207, -1.9432933330535889, -1.8751989603042603, -1.807104468345642, -1.739009976387024, -1.6709154844284058, -1.6028209924697876, -1.5347265005111694, -1.4666320085525513, -1.398537516593933, -1.330443024635315, -1.2623485326766968, -1.1942540407180786, -1.1261595487594604, -1.0580650568008423, -0.9899705648422241, -0.921876072883606, -0.8537815809249878, -0.7856870889663696, -0.7175925970077515, -0.6494981050491333, -0.5814036130905151, -0.513309121131897, -0.4452146291732788, -0.37712013721466064, -0.3090256452560425, -0.24093115329742432, -0.17283666133880615, -0.10474216938018799, -0.036647677421569824, 0.03144681453704834, 0.0995413064956665, 0.16763579845428467, 0.23573029041290283, 0.303824782371521]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 16.0, 19.0, 30.0, 37.0, 47.0, 67.0, 74.0, 73.0, 89.0, 89.0, 89.0, 83.0, 71.0, 59.0, 51.0, 43.0, 28.0, 17.0, 12.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08917844295501709, -0.08378955721855164, -0.07840067148208618, -0.07301178574562073, -0.06762290000915527, -0.06223401427268982, -0.056845128536224365, -0.05145624279975891, -0.04606735706329346, -0.040678471326828, -0.03528958559036255, -0.029900699853897095, -0.02451181411743164, -0.019122928380966187, -0.013734042644500732, -0.008345156908035278, -0.0029562711715698242, 0.00243261456489563, 0.007821500301361084, 0.013210386037826538, 0.018599271774291992, 0.023988157510757446, 0.0293770432472229, 0.034765928983688354, 0.04015481472015381, 0.04554370045661926, 0.05093258619308472, 0.05632147192955017, 0.061710357666015625, 0.06709924340248108, 0.07248812913894653, 0.07787701487541199, 0.08326590061187744, 0.0886547863483429, 0.09404367208480835, 0.0994325578212738, 0.10482144355773926, 0.11021032929420471, 0.11559921503067017, 0.12098810076713562, 0.12637698650360107, 0.13176587224006653, 0.13715475797653198, 0.14254364371299744, 0.1479325294494629, 0.15332141518592834, 0.1587103009223938, 0.16409918665885925, 0.1694880723953247, 0.17487695813179016, 0.18026584386825562, 0.18565472960472107, 0.19104361534118652, 0.19643250107765198, 0.20182138681411743, 0.20721027255058289, 0.21259915828704834, 0.2179880440235138, 0.22337692975997925, 0.2287658154964447, 0.23415470123291016, 0.2395435869693756, 0.24493247270584106, 0.2503213584423065, 0.255710244178772]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 12.0, 27.0, 33.0, 66.0, 148.0, 220.0, 734.0, 8430.0, 4181380.0, 2854.0, 228.0, 67.0, 40.0, 14.0, 13.0, 7.0, 2.0, 5.0, 2.0], "bins": [-0.56494140625, -0.5543642044067383, -0.5437870025634766, -0.5332098007202148, -0.5226325988769531, -0.5120553970336914, -0.5014781951904297, -0.49090099334716797, -0.48032379150390625, -0.46974658966064453, -0.4591693878173828, -0.4485921859741211, -0.4380149841308594, -0.42743778228759766, -0.41686058044433594, -0.4062833786010742, -0.3957061767578125, -0.3851289749145508, -0.37455177307128906, -0.36397457122802734, -0.3533973693847656, -0.3428201675415039, -0.3322429656982422, -0.32166576385498047, -0.31108856201171875, -0.30051136016845703, -0.2899341583251953, -0.2793569564819336, -0.2687797546386719, -0.25820255279541016, -0.24762535095214844, -0.23704814910888672, -0.226470947265625, -0.21589374542236328, -0.20531654357910156, -0.19473934173583984, -0.18416213989257812, -0.1735849380493164, -0.1630077362060547, -0.15243053436279297, -0.14185333251953125, -0.13127613067626953, -0.12069892883300781, -0.1101217269897461, -0.09954452514648438, -0.08896732330322266, -0.07839012145996094, -0.06781291961669922, -0.0572357177734375, -0.04665851593017578, -0.03608131408691406, -0.025504112243652344, -0.014926910400390625, -0.004349708557128906, 0.0062274932861328125, 0.01680469512939453, 0.02738189697265625, 0.03795909881591797, 0.04853630065917969, 0.059113502502441406, 0.06969070434570312, 0.08026790618896484, 0.09084510803222656, 0.10142230987548828, 0.11199951171875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 10.0, 17.0, 20.0, 43.0, 85.0, 141.0, 162.0, 163.0, 138.0, 95.0, 73.0, 35.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.010498046875, -0.010288476943969727, -0.010078907012939453, -0.00986933708190918, -0.009659767150878906, -0.009450197219848633, -0.00924062728881836, -0.009031057357788086, -0.008821487426757812, -0.008611917495727539, -0.008402347564697266, -0.008192777633666992, -0.007983207702636719, -0.007773637771606445, -0.007564067840576172, -0.0073544979095458984, -0.007144927978515625, -0.0069353580474853516, -0.006725788116455078, -0.006516218185424805, -0.006306648254394531, -0.006097078323364258, -0.005887508392333984, -0.005677938461303711, -0.0054683685302734375, -0.005258798599243164, -0.005049228668212891, -0.004839658737182617, -0.004630088806152344, -0.00442051887512207, -0.004210948944091797, -0.0040013790130615234, -0.00379180908203125, -0.0035822391510009766, -0.003372669219970703, -0.0031630992889404297, -0.0029535293579101562, -0.002743959426879883, -0.0025343894958496094, -0.002324819564819336, -0.0021152496337890625, -0.001905679702758789, -0.0016961097717285156, -0.0014865398406982422, -0.0012769699096679688, -0.0010673999786376953, -0.0008578300476074219, -0.0006482601165771484, -0.000438690185546875, -0.00022912025451660156, -1.9550323486328125e-05, 0.0001900196075439453, 0.00039958953857421875, 0.0006091594696044922, 0.0008187294006347656, 0.001028299331665039, 0.0012378692626953125, 0.001447439193725586, 0.0016570091247558594, 0.0018665790557861328, 0.0020761489868164062, 0.0022857189178466797, 0.002495288848876953, 0.0027048587799072266, 0.0029144287109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 20.0, 36.0, 99.0, 205.0, 396.0, 204232.0, 3988716.0, 379.0, 132.0, 45.0, 20.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.6451034545898438, -1.6085662841796875, -1.5720291137695312, -1.535491943359375, -1.4989547729492188, -1.4624176025390625, -1.4258804321289062, -1.38934326171875, -1.3528060913085938, -1.3162689208984375, -1.2797317504882812, -1.243194580078125, -1.2066574096679688, -1.1701202392578125, -1.1335830688476562, -1.0970458984375, -1.0605087280273438, -1.0239715576171875, -0.9874343872070312, -0.950897216796875, -0.9143600463867188, -0.8778228759765625, -0.8412857055664062, -0.80474853515625, -0.7682113647460938, -0.7316741943359375, -0.6951370239257812, -0.658599853515625, -0.6220626831054688, -0.5855255126953125, -0.5489883422851562, -0.512451171875, -0.47591400146484375, -0.4393768310546875, -0.40283966064453125, -0.366302490234375, -0.32976531982421875, -0.2932281494140625, -0.25669097900390625, -0.22015380859375, -0.18361663818359375, -0.1470794677734375, -0.11054229736328125, -0.074005126953125, -0.03746795654296875, -0.0009307861328125, 0.03560638427734375, 0.0721435546875, 0.10868072509765625, 0.1452178955078125, 0.18175506591796875, 0.218292236328125, 0.25482940673828125, 0.2913665771484375, 0.32790374755859375, 0.36444091796875, 0.40097808837890625, 0.4375152587890625, 0.47405242919921875, 0.510589599609375, 0.5471267700195312, 0.5836639404296875, 0.6202011108398438, 0.65673828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 13.0, 126.0, 3612.0, 282.0, 40.0, 8.0, 5.0], "bins": [-0.16015625, -0.1574711799621582, -0.1547861099243164, -0.1521010398864746, -0.1494159698486328, -0.14673089981079102, -0.14404582977294922, -0.14136075973510742, -0.13867568969726562, -0.13599061965942383, -0.13330554962158203, -0.13062047958374023, -0.12793540954589844, -0.12525033950805664, -0.12256526947021484, -0.11988019943237305, -0.11719512939453125, -0.11451005935668945, -0.11182498931884766, -0.10913991928100586, -0.10645484924316406, -0.10376977920532227, -0.10108470916748047, -0.09839963912963867, -0.09571456909179688, -0.09302949905395508, -0.09034442901611328, -0.08765935897827148, -0.08497428894042969, -0.08228921890258789, -0.0796041488647461, -0.0769190788269043, -0.0742340087890625, -0.0715489387512207, -0.0688638687133789, -0.06617879867553711, -0.06349372863769531, -0.060808658599853516, -0.05812358856201172, -0.05543851852416992, -0.052753448486328125, -0.05006837844848633, -0.04738330841064453, -0.044698238372802734, -0.04201316833496094, -0.03932809829711914, -0.036643028259277344, -0.03395795822143555, -0.03127288818359375, -0.028587818145751953, -0.025902748107910156, -0.02321767807006836, -0.020532608032226562, -0.017847537994384766, -0.015162467956542969, -0.012477397918701172, -0.009792327880859375, -0.007107257843017578, -0.004422187805175781, -0.0017371177673339844, 0.0009479522705078125, 0.0036330223083496094, 0.006318092346191406, 0.009003162384033203, 0.011688232421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 41.0, 778.0, 168.0, 18.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.068528175354004, -2.0320799350738525, -1.9956316947937012, -1.9591833353042603, -1.9227350950241089, -1.8862868547439575, -1.8498386144638062, -1.8133902549743652, -1.7769420146942139, -1.7404937744140625, -1.7040455341339111, -1.6675971746444702, -1.6311489343643188, -1.5947006940841675, -1.5582524538040161, -1.5218040943145752, -1.4853558540344238, -1.4489076137542725, -1.412459373474121, -1.3760110139846802, -1.3395627737045288, -1.3031145334243774, -1.266666293144226, -1.2302179336547852, -1.1937698125839233, -1.157321572303772, -1.1208733320236206, -1.0844249725341797, -1.0479767322540283, -1.011528491973877, -0.9750802516937256, -0.9386319518089294, -0.9021837115287781, -0.8657354712486267, -0.8292871713638306, -0.7928389310836792, -0.7563906311988831, -0.7199423909187317, -0.6834940910339355, -0.6470458507537842, -0.6105976104736328, -0.5741493701934814, -0.5377010703086853, -0.5012528300285339, -0.4648045301437378, -0.4283562898635864, -0.39190801978111267, -0.3554597496986389, -0.3190114498138428, -0.282563179731369, -0.24611490964889526, -0.2096666544675827, -0.17321838438510895, -0.1367701143026352, -0.10032185912132263, -0.06387358903884888, -0.027425318956375122, 0.009022947400808334, 0.04547121375799179, 0.08191947638988495, 0.1183677464723587, 0.15481601655483246, 0.19126427173614502, 0.22771254181861877, 0.26416081190109253]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 16.0, 43.0, 67.0, 90.0, 143.0, 173.0, 148.0, 125.0, 79.0, 55.0, 24.0, 15.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37566179037094116, -0.36347347497940063, -0.3512851595878601, -0.3390968441963196, -0.32690852880477905, -0.3147202134132385, -0.302531898021698, -0.29034358263015747, -0.27815526723861694, -0.2659669518470764, -0.2537786364555359, -0.24159032106399536, -0.22940200567245483, -0.2172136902809143, -0.20502537488937378, -0.19283705949783325, -0.18064874410629272, -0.1684604287147522, -0.15627211332321167, -0.14408379793167114, -0.13189548254013062, -0.11970716714859009, -0.10751885175704956, -0.09533053636550903, -0.0831422209739685, -0.07095390558242798, -0.05876559019088745, -0.046577274799346924, -0.034388959407806396, -0.02220064401626587, -0.010012328624725342, 0.0021759867668151855, 0.014364302158355713, 0.02655261754989624, 0.03874093294143677, 0.050929248332977295, 0.06311756372451782, 0.07530587911605835, 0.08749419450759888, 0.0996825098991394, 0.11187082529067993, 0.12405914068222046, 0.136247456073761, 0.1484357714653015, 0.16062408685684204, 0.17281240224838257, 0.1850007176399231, 0.19718903303146362, 0.20937734842300415, 0.22156566381454468, 0.2337539792060852, 0.24594229459762573, 0.25813060998916626, 0.2703189253807068, 0.2825072407722473, 0.29469555616378784, 0.30688387155532837, 0.3190721869468689, 0.3312605023384094, 0.34344881772994995, 0.3556371331214905, 0.367825448513031, 0.38001376390457153, 0.39220207929611206, 0.4043903946876526]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 7.0, 18.0, 10.0, 11.0, 17.0, 30.0, 31.0, 54.0, 69.0, 98.0, 153.0, 313.0, 597.0, 1481.0, 5232.0, 35094.0, 759141.0, 226690.0, 14293.0, 3030.0, 1074.0, 418.0, 245.0, 120.0, 92.0, 61.0, 43.0, 22.0, 21.0, 20.0, 17.0, 7.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11419677734375, -0.11008930206298828, -0.10598182678222656, -0.10187435150146484, -0.09776687622070312, -0.0936594009399414, -0.08955192565917969, -0.08544445037841797, -0.08133697509765625, -0.07722949981689453, -0.07312202453613281, -0.0690145492553711, -0.06490707397460938, -0.060799598693847656, -0.05669212341308594, -0.05258464813232422, -0.0484771728515625, -0.04436969757080078, -0.04026222229003906, -0.036154747009277344, -0.032047271728515625, -0.027939796447753906, -0.023832321166992188, -0.01972484588623047, -0.01561737060546875, -0.011509895324707031, -0.0074024200439453125, -0.0032949447631835938, 0.000812530517578125, 0.004920005798339844, 0.009027481079101562, 0.013134956359863281, 0.017242431640625, 0.02134990692138672, 0.025457382202148438, 0.029564857482910156, 0.033672332763671875, 0.037779808044433594, 0.04188728332519531, 0.04599475860595703, 0.05010223388671875, 0.05420970916748047, 0.05831718444824219, 0.062424659729003906, 0.06653213500976562, 0.07063961029052734, 0.07474708557128906, 0.07885456085205078, 0.0829620361328125, 0.08706951141357422, 0.09117698669433594, 0.09528446197509766, 0.09939193725585938, 0.1034994125366211, 0.10760688781738281, 0.11171436309814453, 0.11582183837890625, 0.11992931365966797, 0.12403678894042969, 0.1281442642211914, 0.13225173950195312, 0.13635921478271484, 0.14046669006347656, 0.14457416534423828, 0.148681640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 8.0, 10.0, 20.0, 44.0, 56.0, 86.0, 121.0, 148.0, 135.0, 114.0, 98.0, 63.0, 49.0, 30.0, 13.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203704833984375, -0.019753456115722656, -0.019136428833007812, -0.01851940155029297, -0.017902374267578125, -0.01728534698486328, -0.016668319702148438, -0.016051292419433594, -0.01543426513671875, -0.014817237854003906, -0.014200210571289062, -0.013583183288574219, -0.012966156005859375, -0.012349128723144531, -0.011732101440429688, -0.011115074157714844, -0.010498046875, -0.009881019592285156, -0.009263992309570312, -0.008646965026855469, -0.008029937744140625, -0.007412910461425781, -0.0067958831787109375, -0.006178855895996094, -0.00556182861328125, -0.004944801330566406, -0.0043277740478515625, -0.0037107467651367188, -0.003093719482421875, -0.0024766921997070312, -0.0018596649169921875, -0.0012426376342773438, -0.0006256103515625, -8.58306884765625e-06, 0.0006084442138671875, 0.0012254714965820312, 0.001842498779296875, 0.0024595260620117188, 0.0030765533447265625, 0.0036935806274414062, 0.00431060791015625, 0.004927635192871094, 0.0055446624755859375, 0.006161689758300781, 0.006778717041015625, 0.007395744323730469, 0.008012771606445312, 0.008629798889160156, 0.009246826171875, 0.009863853454589844, 0.010480880737304688, 0.011097908020019531, 0.011714935302734375, 0.012331962585449219, 0.012948989868164062, 0.013566017150878906, 0.01418304443359375, 0.014800071716308594, 0.015417098999023438, 0.01603412628173828, 0.016651153564453125, 0.01726818084716797, 0.017885208129882812, 0.018502235412597656, 0.0191192626953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 1.0, 7.0, 10.0, 12.0, 12.0, 11.0, 22.0, 19.0, 42.0, 59.0, 99.0, 185.0, 507.0, 1996.0, 26203.0, 938485.0, 76276.0, 3306.0, 699.0, 265.0, 116.0, 63.0, 47.0, 27.0, 19.0, 14.0, 12.0, 9.0, 13.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11383056640625, -0.10985469818115234, -0.10587882995605469, -0.10190296173095703, -0.09792709350585938, -0.09395122528076172, -0.08997535705566406, -0.0859994888305664, -0.08202362060546875, -0.0780477523803711, -0.07407188415527344, -0.07009601593017578, -0.06612014770507812, -0.06214427947998047, -0.05816841125488281, -0.054192543029785156, -0.0502166748046875, -0.046240806579589844, -0.04226493835449219, -0.03828907012939453, -0.034313201904296875, -0.03033733367919922, -0.026361465454101562, -0.022385597229003906, -0.01840972900390625, -0.014433860778808594, -0.010457992553710938, -0.006482124328613281, -0.002506256103515625, 0.0014696121215820312, 0.0054454803466796875, 0.009421348571777344, 0.013397216796875, 0.017373085021972656, 0.021348953247070312, 0.02532482147216797, 0.029300689697265625, 0.03327655792236328, 0.03725242614746094, 0.041228294372558594, 0.04520416259765625, 0.049180030822753906, 0.05315589904785156, 0.05713176727294922, 0.061107635498046875, 0.06508350372314453, 0.06905937194824219, 0.07303524017333984, 0.0770111083984375, 0.08098697662353516, 0.08496284484863281, 0.08893871307373047, 0.09291458129882812, 0.09689044952392578, 0.10086631774902344, 0.1048421859741211, 0.10881805419921875, 0.1127939224243164, 0.11676979064941406, 0.12074565887451172, 0.12472152709960938, 0.12869739532470703, 0.1326732635498047, 0.13664913177490234, 0.140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 14.0, 15.0, 10.0, 16.0, 24.0, 36.0, 30.0, 36.0, 51.0, 42.0, 39.0, 63.0, 53.0, 67.0, 66.0, 57.0, 62.0, 52.0, 49.0, 50.0, 28.0, 23.0, 29.0, 12.0, 14.0, 10.0, 8.0, 11.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038299560546875, -0.03699636459350586, -0.03569316864013672, -0.03438997268676758, -0.03308677673339844, -0.0317835807800293, -0.030480384826660156, -0.029177188873291016, -0.027873992919921875, -0.026570796966552734, -0.025267601013183594, -0.023964405059814453, -0.022661209106445312, -0.021358013153076172, -0.02005481719970703, -0.01875162124633789, -0.01744842529296875, -0.01614522933959961, -0.014842033386230469, -0.013538837432861328, -0.012235641479492188, -0.010932445526123047, -0.009629249572753906, -0.008326053619384766, -0.007022857666015625, -0.005719661712646484, -0.004416465759277344, -0.003113269805908203, -0.0018100738525390625, -0.0005068778991699219, 0.0007963180541992188, 0.0020995140075683594, 0.0034027099609375, 0.004705905914306641, 0.006009101867675781, 0.007312297821044922, 0.008615493774414062, 0.009918689727783203, 0.011221885681152344, 0.012525081634521484, 0.013828277587890625, 0.015131473541259766, 0.016434669494628906, 0.017737865447998047, 0.019041061401367188, 0.020344257354736328, 0.02164745330810547, 0.02295064926147461, 0.02425384521484375, 0.02555704116821289, 0.02686023712158203, 0.028163433074951172, 0.029466629028320312, 0.030769824981689453, 0.032073020935058594, 0.033376216888427734, 0.034679412841796875, 0.035982608795166016, 0.037285804748535156, 0.0385890007019043, 0.03989219665527344, 0.04119539260864258, 0.04249858856201172, 0.04380178451538086, 0.04510498046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 11.0, 10.0, 24.0, 43.0, 70.0, 167.0, 401.0, 1190.0, 6607.0, 301596.0, 726068.0, 9996.0, 1501.0, 488.0, 177.0, 84.0, 41.0, 28.0, 13.0, 7.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09637451171875, -0.09402894973754883, -0.09168338775634766, -0.08933782577514648, -0.08699226379394531, -0.08464670181274414, -0.08230113983154297, -0.0799555778503418, -0.07761001586914062, -0.07526445388793945, -0.07291889190673828, -0.07057332992553711, -0.06822776794433594, -0.06588220596313477, -0.0635366439819336, -0.06119108200073242, -0.05884552001953125, -0.05649995803833008, -0.054154396057128906, -0.051808834075927734, -0.04946327209472656, -0.04711771011352539, -0.04477214813232422, -0.04242658615112305, -0.040081024169921875, -0.0377354621887207, -0.03538990020751953, -0.03304433822631836, -0.030698776245117188, -0.028353214263916016, -0.026007652282714844, -0.023662090301513672, -0.0213165283203125, -0.018970966339111328, -0.016625404357910156, -0.014279842376708984, -0.011934280395507812, -0.00958871841430664, -0.007243156433105469, -0.004897594451904297, -0.002552032470703125, -0.00020647048950195312, 0.0021390914916992188, 0.004484653472900391, 0.0068302154541015625, 0.009175777435302734, 0.011521339416503906, 0.013866901397705078, 0.01621246337890625, 0.018558025360107422, 0.020903587341308594, 0.023249149322509766, 0.025594711303710938, 0.02794027328491211, 0.03028583526611328, 0.03263139724731445, 0.034976959228515625, 0.0373225212097168, 0.03966808319091797, 0.04201364517211914, 0.04435920715332031, 0.046704769134521484, 0.049050331115722656, 0.05139589309692383, 0.053741455078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 8.0, 8.0, 4.0, 8.0, 5.0, 17.0, 18.0, 17.0, 20.0, 27.0, 57.0, 57.0, 96.0, 109.0, 142.0, 72.0, 59.0, 38.0, 34.0, 24.0, 24.0, 24.0, 21.0, 13.0, 7.0, 13.0, 12.0, 12.0, 3.0, 4.0, 5.0, 6.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00013685226440429688, -0.00013256259262561798, -0.0001282729208469391, -0.0001239832490682602, -0.0001196935772895813, -0.0001154039055109024, -0.00011111423373222351, -0.00010682456195354462, -0.00010253489017486572, -9.824521839618683e-05, -9.395554661750793e-05, -8.966587483882904e-05, -8.537620306015015e-05, -8.108653128147125e-05, -7.679685950279236e-05, -7.250718772411346e-05, -6.821751594543457e-05, -6.392784416675568e-05, -5.963817238807678e-05, -5.534850060939789e-05, -5.1058828830718994e-05, -4.67691570520401e-05, -4.2479485273361206e-05, -3.818981349468231e-05, -3.390014171600342e-05, -2.9610469937324524e-05, -2.532079815864563e-05, -2.1031126379966736e-05, -1.6741454601287842e-05, -1.2451782822608948e-05, -8.162111043930054e-06, -3.87243926525116e-06, 4.172325134277344e-07, 4.706904292106628e-06, 8.996576070785522e-06, 1.3286247849464417e-05, 1.757591962814331e-05, 2.1865591406822205e-05, 2.61552631855011e-05, 3.0444934964179993e-05, 3.473460674285889e-05, 3.902427852153778e-05, 4.3313950300216675e-05, 4.760362207889557e-05, 5.189329385757446e-05, 5.618296563625336e-05, 6.047263741493225e-05, 6.476230919361115e-05, 6.905198097229004e-05, 7.334165275096893e-05, 7.763132452964783e-05, 8.192099630832672e-05, 8.621066808700562e-05, 9.050033986568451e-05, 9.47900116443634e-05, 9.90796834230423e-05, 0.00010336935520172119, 0.00010765902698040009, 0.00011194869875907898, 0.00011623837053775787, 0.00012052804231643677, 0.00012481771409511566, 0.00012910738587379456, 0.00013339705765247345, 0.00013768672943115234]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 19.0, 29.0, 53.0, 95.0, 251.0, 839.0, 3836.0, 304794.0, 731651.0, 5458.0, 958.0, 292.0, 114.0, 63.0, 35.0, 12.0, 14.0, 9.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.12977027893066406, -0.12636184692382812, -0.12295341491699219, -0.11954498291015625, -0.11613655090332031, -0.11272811889648438, -0.10931968688964844, -0.1059112548828125, -0.10250282287597656, -0.09909439086914062, -0.09568595886230469, -0.09227752685546875, -0.08886909484863281, -0.08546066284179688, -0.08205223083496094, -0.078643798828125, -0.07523536682128906, -0.07182693481445312, -0.06841850280761719, -0.06501007080078125, -0.06160163879394531, -0.058193206787109375, -0.05478477478027344, -0.0513763427734375, -0.04796791076660156, -0.044559478759765625, -0.04115104675292969, -0.03774261474609375, -0.03433418273925781, -0.030925750732421875, -0.027517318725585938, -0.02410888671875, -0.020700454711914062, -0.017292022705078125, -0.013883590698242188, -0.01047515869140625, -0.0070667266845703125, -0.003658294677734375, -0.0002498626708984375, 0.0031585693359375, 0.0065670013427734375, 0.009975433349609375, 0.013383865356445312, 0.01679229736328125, 0.020200729370117188, 0.023609161376953125, 0.027017593383789062, 0.030426025390625, 0.03383445739746094, 0.037242889404296875, 0.04065132141113281, 0.04405975341796875, 0.04746818542480469, 0.050876617431640625, 0.05428504943847656, 0.0576934814453125, 0.06110191345214844, 0.06451034545898438, 0.06791877746582031, 0.07132720947265625, 0.07473564147949219, 0.07814407348632812, 0.08155250549316406, 0.0849609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 9.0, 11.0, 13.0, 19.0, 26.0, 45.0, 87.0, 103.0, 121.0, 128.0, 120.0, 99.0, 75.0, 41.0, 40.0, 22.0, 9.0, 6.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036865234375, -0.03573131561279297, -0.03459739685058594, -0.033463478088378906, -0.032329559326171875, -0.031195640563964844, -0.030061721801757812, -0.02892780303955078, -0.02779388427734375, -0.02665996551513672, -0.025526046752929688, -0.024392127990722656, -0.023258209228515625, -0.022124290466308594, -0.020990371704101562, -0.01985645294189453, -0.0187225341796875, -0.01758861541748047, -0.016454696655273438, -0.015320777893066406, -0.014186859130859375, -0.013052940368652344, -0.011919021606445312, -0.010785102844238281, -0.00965118408203125, -0.008517265319824219, -0.0073833465576171875, -0.006249427795410156, -0.005115509033203125, -0.003981590270996094, -0.0028476715087890625, -0.0017137527465820312, -0.000579833984375, 0.0005540847778320312, 0.0016880035400390625, 0.0028219223022460938, 0.003955841064453125, 0.005089759826660156, 0.0062236785888671875, 0.007357597351074219, 0.00849151611328125, 0.009625434875488281, 0.010759353637695312, 0.011893272399902344, 0.013027191162109375, 0.014161109924316406, 0.015295028686523438, 0.01642894744873047, 0.0175628662109375, 0.01869678497314453, 0.019830703735351562, 0.020964622497558594, 0.022098541259765625, 0.023232460021972656, 0.024366378784179688, 0.02550029754638672, 0.02663421630859375, 0.02776813507080078, 0.028902053833007812, 0.030035972595214844, 0.031169891357421875, 0.032303810119628906, 0.03343772888183594, 0.03457164764404297, 0.03570556640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 15.0, 169.0, 725.0, 74.0, 16.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8053152561187744, -1.7635196447372437, -1.721724033355713, -1.6799283027648926, -1.6381326913833618, -1.596337080001831, -1.5545413494110107, -1.51274573802948, -1.4709501266479492, -1.4291545152664185, -1.3873589038848877, -1.3455631732940674, -1.3037675619125366, -1.2619719505310059, -1.2201762199401855, -1.1783806085586548, -1.136584997177124, -1.0947893857955933, -1.0529937744140625, -1.0111980438232422, -0.9694024324417114, -0.9276068210601807, -0.8858111500740051, -0.8440154790878296, -0.8022198677062988, -0.7604242563247681, -0.7186285853385925, -0.676832914352417, -0.6350373029708862, -0.5932416915893555, -0.5514460206031799, -0.5096503496170044, -0.46785473823547363, -0.4260590970516205, -0.38426345586776733, -0.3424678146839142, -0.30067217350006104, -0.2588765323162079, -0.21708089113235474, -0.1752852499485016, -0.13348960876464844, -0.09169396758079529, -0.04989832639694214, -0.00810268521308899, 0.03369295597076416, 0.07548859715461731, 0.11728423833847046, 0.1590798795223236, 0.20087552070617676, 0.2426711618900299, 0.28446680307388306, 0.3262624442577362, 0.36805808544158936, 0.4098537266254425, 0.45164936780929565, 0.4934450089931488, 0.535240650177002, 0.5770362615585327, 0.6188319325447083, 0.6606276035308838, 0.7024232149124146, 0.7442188262939453, 0.7860144972801208, 0.8278101682662964, 0.8696057796478271]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 17.0, 11.0, 10.0, 23.0, 22.0, 29.0, 28.0, 63.0, 68.0, 61.0, 64.0, 76.0, 73.0, 65.0, 78.0, 48.0, 48.0, 34.0, 38.0, 33.0, 28.0, 24.0, 14.0, 7.0, 14.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3083477020263672, -0.2979143559932709, -0.28748100996017456, -0.27704766392707825, -0.26661431789398193, -0.25618094205856323, -0.2457476109266281, -0.2353142499923706, -0.2248809039592743, -0.21444755792617798, -0.20401421189308167, -0.19358086585998535, -0.18314750492572784, -0.17271415889263153, -0.16228081285953522, -0.1518474519252777, -0.1414141207933426, -0.13098077476024628, -0.12054742127656937, -0.11011407524347305, -0.09968072175979614, -0.08924737572669983, -0.07881402969360352, -0.0683806762099266, -0.05794733017683029, -0.04751398041844368, -0.03708063066005707, -0.026647284626960754, -0.016213934868574142, -0.0057805851101875305, 0.004652760922908783, 0.015086114406585693, 0.025519460439682007, 0.03595281019806862, 0.04638615995645523, 0.056819505989551544, 0.06725285947322845, 0.07768620550632477, 0.08811955153942108, 0.09855290502309799, 0.1089862510561943, 0.11941959708929062, 0.12985295057296753, 0.14028629660606384, 0.15071964263916016, 0.16115298867225647, 0.17158633470535278, 0.1820196956396103, 0.1924530416727066, 0.20288638770580292, 0.21331973373889923, 0.22375309467315674, 0.23418644070625305, 0.24461978673934937, 0.2550531327724457, 0.265486478805542, 0.2759198248386383, 0.2863531708717346, 0.29678651690483093, 0.30721986293792725, 0.31765320897102356, 0.3280865550041199, 0.3385199308395386, 0.3489532768726349, 0.3593866229057312]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 3.0, 9.0, 10.0, 11.0, 12.0, 14.0, 28.0, 30.0, 48.0, 64.0, 90.0, 165.0, 269.0, 603.0, 1604.0, 7227.0, 151055.0, 3999899.0, 29125.0, 2980.0, 654.0, 227.0, 71.0, 39.0, 17.0, 13.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.331298828125, -0.3244361877441406, -0.31757354736328125, -0.3107109069824219, -0.3038482666015625, -0.2969856262207031, -0.29012298583984375, -0.2832603454589844, -0.276397705078125, -0.2695350646972656, -0.26267242431640625, -0.2558097839355469, -0.2489471435546875, -0.24208450317382812, -0.23522186279296875, -0.22835922241210938, -0.22149658203125, -0.21463394165039062, -0.20777130126953125, -0.20090866088867188, -0.1940460205078125, -0.18718338012695312, -0.18032073974609375, -0.17345809936523438, -0.166595458984375, -0.15973281860351562, -0.15287017822265625, -0.14600753784179688, -0.1391448974609375, -0.13228225708007812, -0.12541961669921875, -0.11855697631835938, -0.1116943359375, -0.10483169555664062, -0.09796905517578125, -0.09110641479492188, -0.0842437744140625, -0.07738113403320312, -0.07051849365234375, -0.06365585327148438, -0.056793212890625, -0.049930572509765625, -0.04306793212890625, -0.036205291748046875, -0.0293426513671875, -0.022480010986328125, -0.01561737060546875, -0.008754730224609375, -0.00189208984375, 0.004970550537109375, 0.01183319091796875, 0.018695831298828125, 0.0255584716796875, 0.032421112060546875, 0.03928375244140625, 0.046146392822265625, 0.053009033203125, 0.059871673583984375, 0.06673431396484375, 0.07359695434570312, 0.0804595947265625, 0.08732223510742188, 0.09418487548828125, 0.10104751586914062, 0.10791015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 12.0, 16.0, 32.0, 59.0, 74.0, 92.0, 116.0, 124.0, 133.0, 107.0, 81.0, 60.0, 39.0, 21.0, 18.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0240478515625, -0.023456692695617676, -0.02286553382873535, -0.022274374961853027, -0.021683216094970703, -0.02109205722808838, -0.020500898361206055, -0.01990973949432373, -0.019318580627441406, -0.018727421760559082, -0.018136262893676758, -0.017545104026794434, -0.01695394515991211, -0.016362786293029785, -0.01577162742614746, -0.015180468559265137, -0.014589309692382812, -0.013998150825500488, -0.013406991958618164, -0.01281583309173584, -0.012224674224853516, -0.011633515357971191, -0.011042356491088867, -0.010451197624206543, -0.009860038757324219, -0.009268879890441895, -0.00867772102355957, -0.008086562156677246, -0.007495403289794922, -0.006904244422912598, -0.0063130855560302734, -0.005721926689147949, -0.005130767822265625, -0.004539608955383301, -0.0039484500885009766, -0.0033572912216186523, -0.002766132354736328, -0.002174973487854004, -0.0015838146209716797, -0.0009926557540893555, -0.00040149688720703125, 0.00018966197967529297, 0.0007808208465576172, 0.0013719797134399414, 0.0019631385803222656, 0.00255429744720459, 0.003145456314086914, 0.0037366151809692383, 0.0043277740478515625, 0.004918932914733887, 0.005510091781616211, 0.006101250648498535, 0.006692409515380859, 0.007283568382263184, 0.007874727249145508, 0.008465886116027832, 0.009057044982910156, 0.00964820384979248, 0.010239362716674805, 0.010830521583557129, 0.011421680450439453, 0.012012839317321777, 0.012603998184204102, 0.013195157051086426, 0.01378631591796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 26.0, 74.0, 252.0, 1777.0, 4190838.0, 1133.0, 121.0, 34.0, 15.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8851165771484375, -1.845428466796875, -1.8057403564453125, -1.76605224609375, -1.7263641357421875, -1.686676025390625, -1.6469879150390625, -1.6072998046875, -1.5676116943359375, -1.527923583984375, -1.4882354736328125, -1.44854736328125, -1.4088592529296875, -1.369171142578125, -1.3294830322265625, -1.289794921875, -1.2501068115234375, -1.210418701171875, -1.1707305908203125, -1.13104248046875, -1.0913543701171875, -1.051666259765625, -1.0119781494140625, -0.9722900390625, -0.9326019287109375, -0.892913818359375, -0.8532257080078125, -0.81353759765625, -0.7738494873046875, -0.734161376953125, -0.6944732666015625, -0.65478515625, -0.6150970458984375, -0.575408935546875, -0.5357208251953125, -0.49603271484375, -0.4563446044921875, -0.416656494140625, -0.3769683837890625, -0.3372802734375, -0.2975921630859375, -0.257904052734375, -0.2182159423828125, -0.17852783203125, -0.1388397216796875, -0.099151611328125, -0.0594635009765625, -0.019775390625, 0.0199127197265625, 0.059600830078125, 0.0992889404296875, 0.13897705078125, 0.1786651611328125, 0.218353271484375, 0.2580413818359375, 0.2977294921875, 0.3374176025390625, 0.377105712890625, 0.4167938232421875, 0.45648193359375, 0.4961700439453125, 0.535858154296875, 0.5755462646484375, 0.615234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 75.0, 520.0, 3243.0, 177.0, 27.0, 11.0, 6.0, 5.0, 2.0], "bins": [-0.1739501953125, -0.1709139347076416, -0.1678776741027832, -0.1648414134979248, -0.1618051528930664, -0.158768892288208, -0.1557326316833496, -0.1526963710784912, -0.1496601104736328, -0.14662384986877441, -0.14358758926391602, -0.14055132865905762, -0.13751506805419922, -0.13447880744934082, -0.13144254684448242, -0.12840628623962402, -0.12537002563476562, -0.12233376502990723, -0.11929750442504883, -0.11626124382019043, -0.11322498321533203, -0.11018872261047363, -0.10715246200561523, -0.10411620140075684, -0.10107994079589844, -0.09804368019104004, -0.09500741958618164, -0.09197115898132324, -0.08893489837646484, -0.08589863777160645, -0.08286237716674805, -0.07982611656188965, -0.07678985595703125, -0.07375359535217285, -0.07071733474731445, -0.06768107414245605, -0.06464481353759766, -0.06160855293273926, -0.05857229232788086, -0.05553603172302246, -0.05249977111816406, -0.049463510513305664, -0.046427249908447266, -0.04339098930358887, -0.04035472869873047, -0.03731846809387207, -0.03428220748901367, -0.031245946884155273, -0.028209686279296875, -0.025173425674438477, -0.022137165069580078, -0.01910090446472168, -0.01606464385986328, -0.013028383255004883, -0.009992122650146484, -0.006955862045288086, -0.0039196014404296875, -0.0008833408355712891, 0.0021529197692871094, 0.005189180374145508, 0.008225440979003906, 0.011261701583862305, 0.014297962188720703, 0.0173342227935791, 0.0203704833984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 92.0, 733.0, 140.0, 19.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0652590990066528, -1.0414105653762817, -1.0175621509552002, -0.9937136173248291, -0.969865083694458, -0.9460166096687317, -0.9221681356430054, -0.8983196020126343, -0.8744710683822632, -0.8506225943565369, -0.8267740607261658, -0.8029255867004395, -0.7790770530700684, -0.755228579044342, -0.7313801050186157, -0.7075315713882446, -0.6836830973625183, -0.659834623336792, -0.6359860897064209, -0.6121376156806946, -0.5882890820503235, -0.5644406080245972, -0.5405920743942261, -0.5167436003684998, -0.49289509654045105, -0.46904659271240234, -0.44519808888435364, -0.42134958505630493, -0.3975011110305786, -0.3736525774002075, -0.3498041033744812, -0.3259555995464325, -0.3021070957183838, -0.2782585918903351, -0.2544100880622864, -0.23056159913539886, -0.20671309530735016, -0.18286459147930145, -0.15901610255241394, -0.13516759872436523, -0.11131909489631653, -0.08747059106826782, -0.06362209469079971, -0.039773598313331604, -0.015925094485282898, 0.007923409342765808, 0.03177189826965332, 0.055620402097702026, 0.07946890592575073, 0.10331740975379944, 0.12716591358184814, 0.15101440250873566, 0.17486290633678436, 0.19871141016483307, 0.22255989909172058, 0.2464084029197693, 0.270256906747818, 0.2941054105758667, 0.3179539144039154, 0.3418024182319641, 0.36565089225769043, 0.3894994258880615, 0.41334789991378784, 0.43719640374183655, 0.46104490756988525]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 12.0, 16.0, 31.0, 43.0, 82.0, 84.0, 106.0, 132.0, 125.0, 121.0, 73.0, 63.0, 46.0, 25.0, 17.0, 13.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3769615888595581, -0.3662453293800354, -0.3555290699005127, -0.34481281042099, -0.3340965807437897, -0.32338032126426697, -0.31266406178474426, -0.30194780230522156, -0.29123157262802124, -0.28051531314849854, -0.26979905366897583, -0.2590827941894531, -0.2483665645122528, -0.2376503050327301, -0.2269340455532074, -0.2162177860736847, -0.205501526594162, -0.19478526711463928, -0.18406902253627777, -0.17335276305675507, -0.16263651847839355, -0.15192025899887085, -0.14120399951934814, -0.13048774003982544, -0.11977149546146393, -0.10905524343252182, -0.09833899140357971, -0.087622731924057, -0.0769064798951149, -0.06619022786617279, -0.055473968386650085, -0.04475771635770798, -0.03404146432876587, -0.023325210437178612, -0.012608956545591354, -0.0018927007913589478, 0.00882355123758316, 0.01953980326652527, 0.030256062746047974, 0.04097231477499008, 0.05168856680393219, 0.0624048188328743, 0.0731210708618164, 0.08383733034133911, 0.09455358237028122, 0.10526983439922333, 0.11598609387874603, 0.12670233845710754, 0.13741859793663025, 0.14813485741615295, 0.15885110199451447, 0.16956736147403717, 0.18028360605239868, 0.1909998655319214, 0.2017161250114441, 0.2124323844909668, 0.2231486290693283, 0.233864888548851, 0.24458113312721252, 0.25529739260673523, 0.26601365208625793, 0.27672988176345825, 0.28744614124298096, 0.29816240072250366, 0.30887866020202637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 8.0, 23.0, 21.0, 35.0, 47.0, 63.0, 109.0, 155.0, 238.0, 356.0, 754.0, 1685.0, 4975.0, 20497.0, 146978.0, 736978.0, 111053.0, 17023.0, 4320.0, 1461.0, 657.0, 364.0, 193.0, 150.0, 102.0, 77.0, 47.0, 36.0, 36.0, 26.0, 15.0, 12.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 5.0], "bins": [-0.1190185546875, -0.11607551574707031, -0.11313247680664062, -0.11018943786621094, -0.10724639892578125, -0.10430335998535156, -0.10136032104492188, -0.09841728210449219, -0.0954742431640625, -0.09253120422363281, -0.08958816528320312, -0.08664512634277344, -0.08370208740234375, -0.08075904846191406, -0.07781600952148438, -0.07487297058105469, -0.071929931640625, -0.06898689270019531, -0.06604385375976562, -0.06310081481933594, -0.06015777587890625, -0.05721473693847656, -0.054271697998046875, -0.05132865905761719, -0.0483856201171875, -0.04544258117675781, -0.042499542236328125, -0.03955650329589844, -0.03661346435546875, -0.03367042541503906, -0.030727386474609375, -0.027784347534179688, -0.02484130859375, -0.021898269653320312, -0.018955230712890625, -0.016012191772460938, -0.01306915283203125, -0.010126113891601562, -0.007183074951171875, -0.0042400360107421875, -0.0012969970703125, 0.0016460418701171875, 0.004589080810546875, 0.0075321197509765625, 0.01047515869140625, 0.013418197631835938, 0.016361236572265625, 0.019304275512695312, 0.022247314453125, 0.025190353393554688, 0.028133392333984375, 0.031076431274414062, 0.03401947021484375, 0.03696250915527344, 0.039905548095703125, 0.04284858703613281, 0.0457916259765625, 0.04873466491699219, 0.051677703857421875, 0.05462074279785156, 0.05756378173828125, 0.06050682067871094, 0.06344985961914062, 0.06639289855957031, 0.0693359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 17.0, 30.0, 62.0, 64.0, 84.0, 104.0, 135.0, 123.0, 98.0, 88.0, 72.0, 43.0, 32.0, 14.0, 10.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031707763671875, -0.030848264694213867, -0.029988765716552734, -0.0291292667388916, -0.02826976776123047, -0.027410268783569336, -0.026550769805908203, -0.02569127082824707, -0.024831771850585938, -0.023972272872924805, -0.023112773895263672, -0.02225327491760254, -0.021393775939941406, -0.020534276962280273, -0.01967477798461914, -0.018815279006958008, -0.017955780029296875, -0.017096281051635742, -0.01623678207397461, -0.015377283096313477, -0.014517784118652344, -0.013658285140991211, -0.012798786163330078, -0.011939287185668945, -0.011079788208007812, -0.01022028923034668, -0.009360790252685547, -0.008501291275024414, -0.007641792297363281, -0.0067822933197021484, -0.005922794342041016, -0.005063295364379883, -0.00420379638671875, -0.003344297409057617, -0.0024847984313964844, -0.0016252994537353516, -0.0007658004760742188, 9.369850158691406e-05, 0.0009531974792480469, 0.0018126964569091797, 0.0026721954345703125, 0.0035316944122314453, 0.004391193389892578, 0.005250692367553711, 0.006110191345214844, 0.0069696903228759766, 0.00782918930053711, 0.008688688278198242, 0.009548187255859375, 0.010407686233520508, 0.01126718521118164, 0.012126684188842773, 0.012986183166503906, 0.013845682144165039, 0.014705181121826172, 0.015564680099487305, 0.016424179077148438, 0.01728367805480957, 0.018143177032470703, 0.019002676010131836, 0.01986217498779297, 0.0207216739654541, 0.021581172943115234, 0.022440671920776367, 0.0233001708984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 13.0, 8.0, 11.0, 9.0, 12.0, 17.0, 31.0, 50.0, 69.0, 118.0, 238.0, 636.0, 2028.0, 11841.0, 250890.0, 748875.0, 28451.0, 3580.0, 895.0, 323.0, 172.0, 90.0, 54.0, 39.0, 25.0, 21.0, 13.0, 13.0, 5.0, 5.0, 6.0, 1.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09295654296875, -0.08965778350830078, -0.08635902404785156, -0.08306026458740234, -0.07976150512695312, -0.0764627456665039, -0.07316398620605469, -0.06986522674560547, -0.06656646728515625, -0.06326770782470703, -0.05996894836425781, -0.056670188903808594, -0.053371429443359375, -0.050072669982910156, -0.04677391052246094, -0.04347515106201172, -0.0401763916015625, -0.03687763214111328, -0.03357887268066406, -0.030280113220214844, -0.026981353759765625, -0.023682594299316406, -0.020383834838867188, -0.01708507537841797, -0.01378631591796875, -0.010487556457519531, -0.0071887969970703125, -0.0038900375366210938, -0.000591278076171875, 0.0027074813842773438, 0.0060062408447265625, 0.009305000305175781, 0.012603759765625, 0.01590251922607422, 0.019201278686523438, 0.022500038146972656, 0.025798797607421875, 0.029097557067871094, 0.03239631652832031, 0.03569507598876953, 0.03899383544921875, 0.04229259490966797, 0.04559135437011719, 0.048890113830566406, 0.052188873291015625, 0.055487632751464844, 0.05878639221191406, 0.06208515167236328, 0.0653839111328125, 0.06868267059326172, 0.07198143005371094, 0.07528018951416016, 0.07857894897460938, 0.0818777084350586, 0.08517646789550781, 0.08847522735595703, 0.09177398681640625, 0.09507274627685547, 0.09837150573730469, 0.1016702651977539, 0.10496902465820312, 0.10826778411865234, 0.11156654357910156, 0.11486530303955078, 0.1181640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 13.0, 8.0, 5.0, 4.0, 22.0, 25.0, 26.0, 32.0, 34.0, 53.0, 48.0, 78.0, 73.0, 78.0, 60.0, 65.0, 56.0, 42.0, 55.0, 37.0, 37.0, 29.0, 21.0, 18.0, 11.0, 16.0, 9.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0604248046875, -0.058467864990234375, -0.05651092529296875, -0.054553985595703125, -0.0525970458984375, -0.050640106201171875, -0.04868316650390625, -0.046726226806640625, -0.044769287109375, -0.042812347412109375, -0.04085540771484375, -0.038898468017578125, -0.0369415283203125, -0.034984588623046875, -0.03302764892578125, -0.031070709228515625, -0.02911376953125, -0.027156829833984375, -0.02519989013671875, -0.023242950439453125, -0.0212860107421875, -0.019329071044921875, -0.01737213134765625, -0.015415191650390625, -0.013458251953125, -0.011501312255859375, -0.00954437255859375, -0.007587432861328125, -0.0056304931640625, -0.003673553466796875, -0.00171661376953125, 0.000240325927734375, 0.002197265625, 0.004154205322265625, 0.00611114501953125, 0.008068084716796875, 0.0100250244140625, 0.011981964111328125, 0.01393890380859375, 0.015895843505859375, 0.017852783203125, 0.019809722900390625, 0.02176666259765625, 0.023723602294921875, 0.0256805419921875, 0.027637481689453125, 0.02959442138671875, 0.031551361083984375, 0.03350830078125, 0.035465240478515625, 0.03742218017578125, 0.039379119873046875, 0.0413360595703125, 0.043292999267578125, 0.04524993896484375, 0.047206878662109375, 0.049163818359375, 0.051120758056640625, 0.05307769775390625, 0.055034637451171875, 0.0569915771484375, 0.058948516845703125, 0.06090545654296875, 0.06286239624023438, 0.0648193359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 11.0, 9.0, 21.0, 18.0, 32.0, 31.0, 63.0, 113.0, 242.0, 511.0, 1315.0, 3959.0, 19563.0, 437584.0, 554420.0, 23698.0, 4371.0, 1366.0, 584.0, 278.0, 116.0, 66.0, 42.0, 31.0, 26.0, 15.0, 7.0, 5.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.03444337844848633, -0.033333778381347656, -0.032224178314208984, -0.031114578247070312, -0.03000497817993164, -0.02889537811279297, -0.027785778045654297, -0.026676177978515625, -0.025566577911376953, -0.02445697784423828, -0.02334737777709961, -0.022237777709960938, -0.021128177642822266, -0.020018577575683594, -0.018908977508544922, -0.01779937744140625, -0.016689777374267578, -0.015580177307128906, -0.014470577239990234, -0.013360977172851562, -0.01225137710571289, -0.011141777038574219, -0.010032176971435547, -0.008922576904296875, -0.007812976837158203, -0.006703376770019531, -0.005593776702880859, -0.0044841766357421875, -0.0033745765686035156, -0.0022649765014648438, -0.0011553764343261719, -4.57763671875e-05, 0.0010638236999511719, 0.0021734237670898438, 0.0032830238342285156, 0.0043926239013671875, 0.005502223968505859, 0.006611824035644531, 0.007721424102783203, 0.008831024169921875, 0.009940624237060547, 0.011050224304199219, 0.01215982437133789, 0.013269424438476562, 0.014379024505615234, 0.015488624572753906, 0.016598224639892578, 0.01770782470703125, 0.018817424774169922, 0.019927024841308594, 0.021036624908447266, 0.022146224975585938, 0.02325582504272461, 0.02436542510986328, 0.025475025177001953, 0.026584625244140625, 0.027694225311279297, 0.02880382537841797, 0.02991342544555664, 0.031023025512695312, 0.032132625579833984, 0.033242225646972656, 0.03435182571411133, 0.03546142578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 9.0, 5.0, 8.0, 17.0, 21.0, 45.0, 74.0, 153.0, 244.0, 185.0, 119.0, 57.0, 30.0, 11.0, 11.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013363361358642578, -0.0001286473125219345, -0.00012366101145744324, -0.00011867471039295197, -0.0001136884093284607, -0.00010870210826396942, -0.00010371580719947815, -9.872950613498688e-05, -9.37432050704956e-05, -8.875690400600433e-05, -8.377060294151306e-05, -7.878430187702179e-05, -7.379800081253052e-05, -6.881169974803925e-05, -6.382539868354797e-05, -5.88390976190567e-05, -5.385279655456543e-05, -4.886649549007416e-05, -4.3880194425582886e-05, -3.8893893361091614e-05, -3.390759229660034e-05, -2.892129123210907e-05, -2.3934990167617798e-05, -1.8948689103126526e-05, -1.3962388038635254e-05, -8.976086974143982e-06, -3.98978590965271e-06, 9.96515154838562e-07, 5.982816219329834e-06, 1.0969117283821106e-05, 1.5955418348312378e-05, 2.094171941280365e-05, 2.5928020477294922e-05, 3.0914321541786194e-05, 3.5900622606277466e-05, 4.088692367076874e-05, 4.587322473526001e-05, 5.085952579975128e-05, 5.5845826864242554e-05, 6.0832127928733826e-05, 6.58184289932251e-05, 7.080473005771637e-05, 7.579103112220764e-05, 8.077733218669891e-05, 8.576363325119019e-05, 9.074993431568146e-05, 9.573623538017273e-05, 0.000100722536444664, 0.00010570883750915527, 0.00011069513857364655, 0.00011568143963813782, 0.00012066774070262909, 0.00012565404176712036, 0.00013064034283161163, 0.0001356266438961029, 0.00014061294496059418, 0.00014559924602508545, 0.00015058554708957672, 0.000155571848154068, 0.00016055814921855927, 0.00016554445028305054, 0.0001705307513475418, 0.00017551705241203308, 0.00018050335347652435, 0.00018548965454101562]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 8.0, 11.0, 12.0, 26.0, 35.0, 56.0, 89.0, 194.0, 416.0, 1239.0, 8454.0, 302121.0, 717642.0, 15434.0, 1857.0, 489.0, 199.0, 103.0, 50.0, 42.0, 24.0, 16.0, 14.0, 7.0, 2.0, 5.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051422119140625, -0.049820899963378906, -0.04821968078613281, -0.04661846160888672, -0.045017242431640625, -0.04341602325439453, -0.04181480407714844, -0.040213584899902344, -0.03861236572265625, -0.037011146545410156, -0.03540992736816406, -0.03380870819091797, -0.032207489013671875, -0.03060626983642578, -0.029005050659179688, -0.027403831481933594, -0.0258026123046875, -0.024201393127441406, -0.022600173950195312, -0.02099895477294922, -0.019397735595703125, -0.01779651641845703, -0.016195297241210938, -0.014594078063964844, -0.01299285888671875, -0.011391639709472656, -0.009790420532226562, -0.008189201354980469, -0.006587982177734375, -0.004986763000488281, -0.0033855438232421875, -0.0017843246459960938, -0.00018310546875, 0.0014181137084960938, 0.0030193328857421875, 0.004620552062988281, 0.006221771240234375, 0.007822990417480469, 0.009424209594726562, 0.011025428771972656, 0.01262664794921875, 0.014227867126464844, 0.015829086303710938, 0.01743030548095703, 0.019031524658203125, 0.02063274383544922, 0.022233963012695312, 0.023835182189941406, 0.0254364013671875, 0.027037620544433594, 0.028638839721679688, 0.03024005889892578, 0.031841278076171875, 0.03344249725341797, 0.03504371643066406, 0.036644935607910156, 0.03824615478515625, 0.039847373962402344, 0.04144859313964844, 0.04304981231689453, 0.044651031494140625, 0.04625225067138672, 0.04785346984863281, 0.049454689025878906, 0.051055908203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 16.0, 13.0, 21.0, 35.0, 82.0, 80.0, 136.0, 176.0, 179.0, 105.0, 51.0, 32.0, 21.0, 16.0, 10.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037811279296875, -0.036685943603515625, -0.03556060791015625, -0.034435272216796875, -0.0333099365234375, -0.032184600830078125, -0.03105926513671875, -0.029933929443359375, -0.02880859375, -0.027683258056640625, -0.02655792236328125, -0.025432586669921875, -0.0243072509765625, -0.023181915283203125, -0.02205657958984375, -0.020931243896484375, -0.019805908203125, -0.018680572509765625, -0.01755523681640625, -0.016429901123046875, -0.0153045654296875, -0.014179229736328125, -0.01305389404296875, -0.011928558349609375, -0.01080322265625, -0.009677886962890625, -0.00855255126953125, -0.007427215576171875, -0.0063018798828125, -0.005176544189453125, -0.00405120849609375, -0.002925872802734375, -0.001800537109375, -0.000675201416015625, 0.00045013427734375, 0.001575469970703125, 0.0027008056640625, 0.003826141357421875, 0.00495147705078125, 0.006076812744140625, 0.0072021484375, 0.008327484130859375, 0.00945281982421875, 0.010578155517578125, 0.0117034912109375, 0.012828826904296875, 0.01395416259765625, 0.015079498291015625, 0.016204833984375, 0.017330169677734375, 0.01845550537109375, 0.019580841064453125, 0.0207061767578125, 0.021831512451171875, 0.02295684814453125, 0.024082183837890625, 0.02520751953125, 0.026332855224609375, 0.02745819091796875, 0.028583526611328125, 0.0297088623046875, 0.030834197998046875, 0.03195953369140625, 0.033084869384765625, 0.034210205078125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 11.0, 44.0, 244.0, 491.0, 163.0, 32.0, 11.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6486761569976807, -0.6230819225311279, -0.5974876880645752, -0.5718934535980225, -0.5462992191314697, -0.520704984664917, -0.49511075019836426, -0.4695165157318115, -0.4439222812652588, -0.41832804679870605, -0.3927338123321533, -0.3671395778656006, -0.34154534339904785, -0.3159511089324951, -0.2903568744659424, -0.26476263999938965, -0.23916837573051453, -0.2135741412639618, -0.18797990679740906, -0.16238567233085632, -0.1367914378643036, -0.11119718849658966, -0.08560295403003693, -0.06000871956348419, -0.03441448509693146, -0.008820248767733574, 0.01677398756146431, 0.04236822575330734, 0.06796246021986008, 0.09355670213699341, 0.11915093660354614, 0.14474517107009888, 0.1703394055366516, 0.19593364000320435, 0.22152787446975708, 0.24712210893630981, 0.27271634340286255, 0.2983105778694153, 0.323904812335968, 0.34949904680252075, 0.3750932812690735, 0.4006875157356262, 0.42628175020217896, 0.4518759846687317, 0.4774702191352844, 0.5030644536018372, 0.5286586880683899, 0.5542529225349426, 0.5798472166061401, 0.6054414510726929, 0.6310356855392456, 0.6566299200057983, 0.6822241544723511, 0.7078183889389038, 0.7334126234054565, 0.7590068578720093, 0.784601092338562, 0.8101953268051147, 0.8357895612716675, 0.8613837957382202, 0.886978030204773, 0.9125722646713257, 0.9381664991378784, 0.9637607336044312, 0.9893549680709839]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 8.0, 3.0, 10.0, 7.0, 12.0, 18.0, 20.0, 22.0, 21.0, 32.0, 41.0, 50.0, 41.0, 54.0, 56.0, 62.0, 63.0, 62.0, 56.0, 46.0, 36.0, 57.0, 31.0, 39.0, 29.0, 26.0, 20.0, 14.0, 16.0, 12.0, 3.0, 11.0, 8.0, 6.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.36685633659362793, -0.35721081495285034, -0.34756529331207275, -0.33791977167129517, -0.3282742500305176, -0.31862872838974, -0.3089832067489624, -0.2993376553058624, -0.28969213366508484, -0.28004661202430725, -0.27040109038352966, -0.2607555687427521, -0.2511100471019745, -0.2414645105600357, -0.23181898891925812, -0.22217345237731934, -0.21252794563770294, -0.20288242399692535, -0.19323690235614777, -0.18359136581420898, -0.1739458441734314, -0.1643003225326538, -0.15465480089187622, -0.14500927925109863, -0.13536375761032104, -0.12571823596954346, -0.11607270687818527, -0.10642718523740768, -0.0967816561460495, -0.08713613450527191, -0.07749061286449432, -0.06784508377313614, -0.058199554681777954, -0.04855402931571007, -0.03890850394964218, -0.029262982308864594, -0.019617456942796707, -0.00997193157672882, -0.0003264099359512329, 0.009319119155406952, 0.01896464079618454, 0.028610166162252426, 0.03825569152832031, 0.0479012131690979, 0.05754673853516579, 0.06719226390123367, 0.07683778554201126, 0.08648331463336945, 0.09612883627414703, 0.10577435791492462, 0.1154198870062828, 0.125065416097641, 0.13471093773841858, 0.14435645937919617, 0.15400198101997375, 0.16364750266075134, 0.17329302430152893, 0.18293854594230652, 0.1925840675830841, 0.2022295892238617, 0.21187512576580048, 0.22152064740657806, 0.23116616904735565, 0.24081170558929443, 0.250457227230072]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 10.0, 10.0, 19.0, 18.0, 39.0, 56.0, 58.0, 91.0, 132.0, 215.0, 373.0, 706.0, 1682.0, 4847.0, 23899.0, 871070.0, 3250987.0, 32040.0, 5352.0, 1527.0, 570.0, 266.0, 145.0, 58.0, 31.0, 18.0, 11.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1861572265625, -0.1819324493408203, -0.17770767211914062, -0.17348289489746094, -0.16925811767578125, -0.16503334045410156, -0.16080856323242188, -0.1565837860107422, -0.1523590087890625, -0.1481342315673828, -0.14390945434570312, -0.13968467712402344, -0.13545989990234375, -0.13123512268066406, -0.12701034545898438, -0.12278556823730469, -0.118560791015625, -0.11433601379394531, -0.11011123657226562, -0.10588645935058594, -0.10166168212890625, -0.09743690490722656, -0.09321212768554688, -0.08898735046386719, -0.0847625732421875, -0.08053779602050781, -0.07631301879882812, -0.07208824157714844, -0.06786346435546875, -0.06363868713378906, -0.059413909912109375, -0.05518913269042969, -0.05096435546875, -0.04673957824707031, -0.042514801025390625, -0.03829002380371094, -0.03406524658203125, -0.029840469360351562, -0.025615692138671875, -0.021390914916992188, -0.0171661376953125, -0.012941360473632812, -0.008716583251953125, -0.0044918060302734375, -0.00026702880859375, 0.0039577484130859375, 0.008182525634765625, 0.012407302856445312, 0.016632080078125, 0.020856857299804688, 0.025081634521484375, 0.029306411743164062, 0.03353118896484375, 0.03775596618652344, 0.041980743408203125, 0.04620552062988281, 0.0504302978515625, 0.05465507507324219, 0.058879852294921875, 0.06310462951660156, 0.06732940673828125, 0.07155418395996094, 0.07577896118164062, 0.08000373840332031, 0.084228515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 7.0, 9.0, 18.0, 39.0, 43.0, 52.0, 70.0, 105.0, 80.0, 104.0, 103.0, 81.0, 84.0, 66.0, 32.0, 42.0, 24.0, 15.0, 12.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02783203125, -0.027129650115966797, -0.026427268981933594, -0.02572488784790039, -0.025022506713867188, -0.024320125579833984, -0.02361774444580078, -0.022915363311767578, -0.022212982177734375, -0.021510601043701172, -0.02080821990966797, -0.020105838775634766, -0.019403457641601562, -0.01870107650756836, -0.017998695373535156, -0.017296314239501953, -0.01659393310546875, -0.015891551971435547, -0.015189170837402344, -0.01448678970336914, -0.013784408569335938, -0.013082027435302734, -0.012379646301269531, -0.011677265167236328, -0.010974884033203125, -0.010272502899169922, -0.009570121765136719, -0.008867740631103516, -0.008165359497070312, -0.007462978363037109, -0.006760597229003906, -0.006058216094970703, -0.0053558349609375, -0.004653453826904297, -0.003951072692871094, -0.0032486915588378906, -0.0025463104248046875, -0.0018439292907714844, -0.0011415481567382812, -0.0004391670227050781, 0.000263214111328125, 0.0009655952453613281, 0.0016679763793945312, 0.0023703575134277344, 0.0030727386474609375, 0.0037751197814941406, 0.004477500915527344, 0.005179882049560547, 0.00588226318359375, 0.006584644317626953, 0.007287025451660156, 0.00798940658569336, 0.008691787719726562, 0.009394168853759766, 0.010096549987792969, 0.010798931121826172, 0.011501312255859375, 0.012203693389892578, 0.012906074523925781, 0.013608455657958984, 0.014310836791992188, 0.01501321792602539, 0.015715599060058594, 0.016417980194091797, 0.017120361328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 14.0, 24.0, 45.0, 78.0, 195.0, 857.0, 4190736.0, 1761.0, 257.0, 120.0, 78.0, 54.0, 25.0, 22.0, 4.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.48146820068359375, -0.4556121826171875, -0.42975616455078125, -0.403900146484375, -0.37804412841796875, -0.3521881103515625, -0.32633209228515625, -0.30047607421875, -0.27462005615234375, -0.2487640380859375, -0.22290802001953125, -0.197052001953125, -0.17119598388671875, -0.1453399658203125, -0.11948394775390625, -0.0936279296875, -0.06777191162109375, -0.0419158935546875, -0.01605987548828125, 0.009796142578125, 0.03565216064453125, 0.0615081787109375, 0.08736419677734375, 0.11322021484375, 0.13907623291015625, 0.1649322509765625, 0.19078826904296875, 0.216644287109375, 0.24250030517578125, 0.2683563232421875, 0.29421234130859375, 0.320068359375, 0.34592437744140625, 0.3717803955078125, 0.39763641357421875, 0.423492431640625, 0.44934844970703125, 0.4752044677734375, 0.5010604858398438, 0.52691650390625, 0.5527725219726562, 0.5786285400390625, 0.6044845581054688, 0.630340576171875, 0.6561965942382812, 0.6820526123046875, 0.7079086303710938, 0.7337646484375, 0.7596206665039062, 0.7854766845703125, 0.8113327026367188, 0.837188720703125, 0.8630447387695312, 0.8889007568359375, 0.9147567749023438, 0.94061279296875, 0.9664688110351562, 0.9923248291015625, 1.0181808471679688, 1.044036865234375, 1.0698928833007812, 1.0957489013671875, 1.1216049194335938, 1.1474609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 19.0, 377.0, 3581.0, 89.0, 14.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07413005828857422, -0.07007408142089844, -0.06601810455322266, -0.061962127685546875, -0.057906150817871094, -0.05385017395019531, -0.04979419708251953, -0.04573822021484375, -0.04168224334716797, -0.03762626647949219, -0.033570289611816406, -0.029514312744140625, -0.025458335876464844, -0.021402359008789062, -0.01734638214111328, -0.0132904052734375, -0.009234428405761719, -0.0051784515380859375, -0.0011224746704101562, 0.002933502197265625, 0.006989479064941406, 0.011045455932617188, 0.015101432800292969, 0.01915740966796875, 0.02321338653564453, 0.027269363403320312, 0.031325340270996094, 0.035381317138671875, 0.039437294006347656, 0.04349327087402344, 0.04754924774169922, 0.051605224609375, 0.05566120147705078, 0.05971717834472656, 0.06377315521240234, 0.06782913208007812, 0.0718851089477539, 0.07594108581542969, 0.07999706268310547, 0.08405303955078125, 0.08810901641845703, 0.09216499328613281, 0.0962209701538086, 0.10027694702148438, 0.10433292388916016, 0.10838890075683594, 0.11244487762451172, 0.1165008544921875, 0.12055683135986328, 0.12461280822753906, 0.12866878509521484, 0.13272476196289062, 0.1367807388305664, 0.1408367156982422, 0.14489269256591797, 0.14894866943359375, 0.15300464630126953, 0.1570606231689453, 0.1611166000366211, 0.16517257690429688, 0.16922855377197266, 0.17328453063964844, 0.17734050750732422, 0.181396484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 57.0, 930.0, 15.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2481105327606201, -1.2117807865142822, -1.1754511594772339, -1.139121413230896, -1.1027917861938477, -1.0664620399475098, -1.0301324129104614, -0.9938026666641235, -0.9574729800224304, -0.9211432933807373, -0.8848136067390442, -0.8484839200973511, -0.8121541738510132, -0.7758245468139648, -0.739494800567627, -0.7031651139259338, -0.6668354272842407, -0.6305057406425476, -0.5941760540008545, -0.5578463673591614, -0.5215166807174683, -0.48518696427345276, -0.44885724782943726, -0.41252756118774414, -0.376197874546051, -0.3398681879043579, -0.3035385012626648, -0.2672087848186493, -0.23087909817695618, -0.19454941153526306, -0.15821970999240875, -0.12189000844955444, -0.08556032180786133, -0.049230627715587616, -0.012900933623313904, 0.02342876046895981, 0.05975845456123352, 0.09608814120292664, 0.13241784274578094, 0.16874754428863525, 0.20507723093032837, 0.24140691757202148, 0.2777366042137146, 0.3140663206577301, 0.3503960072994232, 0.38672569394111633, 0.42305541038513184, 0.45938509702682495, 0.49571478366851807, 0.5320444703102112, 0.5683741569519043, 0.6047038435935974, 0.6410335302352905, 0.6773632764816284, 0.7136929631233215, 0.7500226497650146, 0.7863523364067078, 0.8226820230484009, 0.859011709690094, 0.8953413963317871, 0.931671142578125, 0.9680007696151733, 1.0043305158615112, 1.0406601428985596, 1.0769898891448975]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 33.0, 55.0, 82.0, 127.0, 186.0, 166.0, 141.0, 103.0, 56.0, 22.0, 9.0, 12.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31947869062423706, -0.31115612387657166, -0.30283358693122864, -0.29451102018356323, -0.2861884534358978, -0.2778659164905548, -0.2695433497428894, -0.261220782995224, -0.252898246049881, -0.24457569420337677, -0.23625312745571136, -0.22793057560920715, -0.21960802376270294, -0.21128547191619873, -0.20296290516853333, -0.1946403533220291, -0.1863177865743637, -0.1779952347278595, -0.1696726679801941, -0.16135011613368988, -0.15302756428718567, -0.14470499753952026, -0.13638244569301605, -0.12805989384651184, -0.11973733454942703, -0.11141477525234222, -0.10309222340583801, -0.0947696641087532, -0.0864471048116684, -0.07812455296516418, -0.06980199366807938, -0.061479438096284866, -0.053156882524490356, -0.04483432695269585, -0.03651177138090134, -0.02818921208381653, -0.01986665651202202, -0.011544100940227509, -0.0032215416431427, 0.00510101392865181, 0.01342356950044632, 0.02174612507224083, 0.03006868250668049, 0.03839123994112015, 0.04671379551291466, 0.05503635108470917, 0.06335891038179398, 0.07168146967887878, 0.080004021525383, 0.0883265808224678, 0.09664913266897202, 0.10497169196605682, 0.11329424381256104, 0.12161680310964584, 0.12993936240673065, 0.13826191425323486, 0.14658448100090027, 0.15490703284740448, 0.16322959959506989, 0.1715521514415741, 0.1798747032880783, 0.18819725513458252, 0.19651982188224792, 0.20484237372875214, 0.21316492557525635]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 5.0, 8.0, 17.0, 16.0, 25.0, 50.0, 57.0, 91.0, 195.0, 353.0, 712.0, 1671.0, 5402.0, 26673.0, 246046.0, 671447.0, 78602.0, 11975.0, 2976.0, 1064.0, 489.0, 267.0, 137.0, 97.0, 66.0, 47.0, 20.0, 12.0, 6.0, 10.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.066650390625, -0.06437301635742188, -0.06209564208984375, -0.059818267822265625, -0.0575408935546875, -0.055263519287109375, -0.05298614501953125, -0.050708770751953125, -0.048431396484375, -0.046154022216796875, -0.04387664794921875, -0.041599273681640625, -0.0393218994140625, -0.037044525146484375, -0.03476715087890625, -0.032489776611328125, -0.03021240234375, -0.027935028076171875, -0.02565765380859375, -0.023380279541015625, -0.0211029052734375, -0.018825531005859375, -0.01654815673828125, -0.014270782470703125, -0.011993408203125, -0.009716033935546875, -0.00743865966796875, -0.005161285400390625, -0.0028839111328125, -0.000606536865234375, 0.00167083740234375, 0.003948211669921875, 0.0062255859375, 0.008502960205078125, 0.01078033447265625, 0.013057708740234375, 0.0153350830078125, 0.017612457275390625, 0.01988983154296875, 0.022167205810546875, 0.024444580078125, 0.026721954345703125, 0.02899932861328125, 0.031276702880859375, 0.0335540771484375, 0.035831451416015625, 0.03810882568359375, 0.040386199951171875, 0.04266357421875, 0.044940948486328125, 0.04721832275390625, 0.049495697021484375, 0.0517730712890625, 0.054050445556640625, 0.05632781982421875, 0.058605194091796875, 0.060882568359375, 0.06315994262695312, 0.06543731689453125, 0.06771469116210938, 0.0699920654296875, 0.07226943969726562, 0.07454681396484375, 0.07682418823242188, 0.0791015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 6.0, 18.0, 22.0, 27.0, 35.0, 41.0, 52.0, 60.0, 81.0, 83.0, 81.0, 79.0, 79.0, 65.0, 62.0, 41.0, 45.0, 36.0, 17.0, 27.0, 14.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0207977294921875, -0.020245790481567383, -0.019693851470947266, -0.01914191246032715, -0.01858997344970703, -0.018038034439086914, -0.017486095428466797, -0.01693415641784668, -0.016382217407226562, -0.015830278396606445, -0.015278339385986328, -0.014726400375366211, -0.014174461364746094, -0.013622522354125977, -0.01307058334350586, -0.012518644332885742, -0.011966705322265625, -0.011414766311645508, -0.01086282730102539, -0.010310888290405273, -0.009758949279785156, -0.009207010269165039, -0.008655071258544922, -0.008103132247924805, -0.0075511932373046875, -0.00699925422668457, -0.006447315216064453, -0.005895376205444336, -0.005343437194824219, -0.0047914981842041016, -0.004239559173583984, -0.003687620162963867, -0.00313568115234375, -0.002583742141723633, -0.0020318031311035156, -0.0014798641204833984, -0.0009279251098632812, -0.00037598609924316406, 0.00017595291137695312, 0.0007278919219970703, 0.0012798309326171875, 0.0018317699432373047, 0.002383708953857422, 0.002935647964477539, 0.0034875869750976562, 0.0040395259857177734, 0.004591464996337891, 0.005143404006958008, 0.005695343017578125, 0.006247282028198242, 0.006799221038818359, 0.0073511600494384766, 0.007903099060058594, 0.008455038070678711, 0.009006977081298828, 0.009558916091918945, 0.010110855102539062, 0.01066279411315918, 0.011214733123779297, 0.011766672134399414, 0.012318611145019531, 0.012870550155639648, 0.013422489166259766, 0.013974428176879883, 0.0145263671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 13.0, 16.0, 18.0, 29.0, 27.0, 57.0, 102.0, 158.0, 361.0, 801.0, 2702.0, 15939.0, 416008.0, 586802.0, 20610.0, 3158.0, 914.0, 358.0, 164.0, 121.0, 63.0, 29.0, 23.0, 17.0, 16.0, 14.0, 1.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.11724853515625, -0.11424636840820312, -0.11124420166015625, -0.10824203491210938, -0.1052398681640625, -0.10223770141601562, -0.09923553466796875, -0.09623336791992188, -0.093231201171875, -0.09022903442382812, -0.08722686767578125, -0.08422470092773438, -0.0812225341796875, -0.07822036743164062, -0.07521820068359375, -0.07221603393554688, -0.0692138671875, -0.06621170043945312, -0.06320953369140625, -0.060207366943359375, -0.0572052001953125, -0.054203033447265625, -0.05120086669921875, -0.048198699951171875, -0.045196533203125, -0.042194366455078125, -0.03919219970703125, -0.036190032958984375, -0.0331878662109375, -0.030185699462890625, -0.02718353271484375, -0.024181365966796875, -0.02117919921875, -0.018177032470703125, -0.01517486572265625, -0.012172698974609375, -0.0091705322265625, -0.006168365478515625, -0.00316619873046875, -0.000164031982421875, 0.002838134765625, 0.005840301513671875, 0.00884246826171875, 0.011844635009765625, 0.0148468017578125, 0.017848968505859375, 0.02085113525390625, 0.023853302001953125, 0.02685546875, 0.029857635498046875, 0.03285980224609375, 0.035861968994140625, 0.0388641357421875, 0.041866302490234375, 0.04486846923828125, 0.047870635986328125, 0.050872802734375, 0.053874969482421875, 0.05687713623046875, 0.059879302978515625, 0.0628814697265625, 0.06588363647460938, 0.06888580322265625, 0.07188796997070312, 0.07489013671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 17.0, 17.0, 19.0, 23.0, 43.0, 56.0, 59.0, 60.0, 87.0, 69.0, 84.0, 73.0, 64.0, 61.0, 60.0, 38.0, 36.0, 27.0, 22.0, 16.0, 8.0, 13.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08001708984375, -0.07781362533569336, -0.07561016082763672, -0.07340669631958008, -0.07120323181152344, -0.0689997673034668, -0.06679630279541016, -0.06459283828735352, -0.062389373779296875, -0.060185909271240234, -0.057982444763183594, -0.05577898025512695, -0.05357551574707031, -0.05137205123901367, -0.04916858673095703, -0.04696512222290039, -0.04476165771484375, -0.04255819320678711, -0.04035472869873047, -0.03815126419067383, -0.03594779968261719, -0.03374433517456055, -0.031540870666503906, -0.029337406158447266, -0.027133941650390625, -0.024930477142333984, -0.022727012634277344, -0.020523548126220703, -0.018320083618164062, -0.016116619110107422, -0.013913154602050781, -0.01170969009399414, -0.0095062255859375, -0.007302761077880859, -0.005099296569824219, -0.002895832061767578, -0.0006923675537109375, 0.0015110969543457031, 0.0037145614624023438, 0.005918025970458984, 0.008121490478515625, 0.010324954986572266, 0.012528419494628906, 0.014731884002685547, 0.016935348510742188, 0.019138813018798828, 0.02134227752685547, 0.02354574203491211, 0.02574920654296875, 0.02795267105102539, 0.03015613555908203, 0.03235960006713867, 0.03456306457519531, 0.03676652908325195, 0.038969993591308594, 0.041173458099365234, 0.043376922607421875, 0.045580387115478516, 0.047783851623535156, 0.0499873161315918, 0.05219078063964844, 0.05439424514770508, 0.05659770965576172, 0.05880117416381836, 0.061004638671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 10.0, 5.0, 4.0, 8.0, 20.0, 30.0, 55.0, 115.0, 229.0, 438.0, 919.0, 2675.0, 12770.0, 220704.0, 757702.0, 44627.0, 5364.0, 1568.0, 659.0, 264.0, 150.0, 100.0, 50.0, 31.0, 17.0, 8.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164642333984375, -0.015651464462280273, -0.014838695526123047, -0.01402592658996582, -0.013213157653808594, -0.012400388717651367, -0.01158761978149414, -0.010774850845336914, -0.009962081909179688, -0.009149312973022461, -0.008336544036865234, -0.007523775100708008, -0.006711006164550781, -0.005898237228393555, -0.005085468292236328, -0.0042726993560791016, -0.003459930419921875, -0.0026471614837646484, -0.0018343925476074219, -0.0010216236114501953, -0.00020885467529296875, 0.0006039142608642578, 0.0014166831970214844, 0.002229452133178711, 0.0030422210693359375, 0.003854990005493164, 0.004667758941650391, 0.005480527877807617, 0.006293296813964844, 0.00710606575012207, 0.007918834686279297, 0.008731603622436523, 0.00954437255859375, 0.010357141494750977, 0.011169910430908203, 0.01198267936706543, 0.012795448303222656, 0.013608217239379883, 0.01442098617553711, 0.015233755111694336, 0.016046524047851562, 0.01685929298400879, 0.017672061920166016, 0.018484830856323242, 0.01929759979248047, 0.020110368728637695, 0.020923137664794922, 0.02173590660095215, 0.022548675537109375, 0.0233614444732666, 0.024174213409423828, 0.024986982345581055, 0.02579975128173828, 0.026612520217895508, 0.027425289154052734, 0.02823805809020996, 0.029050827026367188, 0.029863595962524414, 0.03067636489868164, 0.03148913383483887, 0.032301902770996094, 0.03311467170715332, 0.03392744064331055, 0.03474020957946777, 0.035552978515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 12.0, 3.0, 14.0, 22.0, 25.0, 31.0, 50.0, 64.0, 72.0, 119.0, 121.0, 131.0, 83.0, 74.0, 51.0, 38.0, 27.0, 19.0, 15.0, 10.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-05, -6.787478923797607e-05, -6.541609764099121e-05, -6.295740604400635e-05, -6.0498714447021484e-05, -5.804002285003662e-05, -5.558133125305176e-05, -5.3122639656066895e-05, -5.066394805908203e-05, -4.820525646209717e-05, -4.5746564865112305e-05, -4.328787326812744e-05, -4.082918167114258e-05, -3.8370490074157715e-05, -3.591179847717285e-05, -3.345310688018799e-05, -3.0994415283203125e-05, -2.8535723686218262e-05, -2.60770320892334e-05, -2.3618340492248535e-05, -2.1159648895263672e-05, -1.870095729827881e-05, -1.6242265701293945e-05, -1.3783574104309082e-05, -1.1324882507324219e-05, -8.866190910339355e-06, -6.407499313354492e-06, -3.948807716369629e-06, -1.4901161193847656e-06, 9.685754776000977e-07, 3.427267074584961e-06, 5.885958671569824e-06, 8.344650268554688e-06, 1.080334186553955e-05, 1.3262033462524414e-05, 1.5720725059509277e-05, 1.817941665649414e-05, 2.0638108253479004e-05, 2.3096799850463867e-05, 2.555549144744873e-05, 2.8014183044433594e-05, 3.0472874641418457e-05, 3.293156623840332e-05, 3.5390257835388184e-05, 3.784894943237305e-05, 4.030764102935791e-05, 4.2766332626342773e-05, 4.522502422332764e-05, 4.76837158203125e-05, 5.014240741729736e-05, 5.2601099014282227e-05, 5.505979061126709e-05, 5.751848220825195e-05, 5.9977173805236816e-05, 6.243586540222168e-05, 6.489455699920654e-05, 6.73532485961914e-05, 6.981194019317627e-05, 7.227063179016113e-05, 7.4729323387146e-05, 7.718801498413086e-05, 7.964670658111572e-05, 8.210539817810059e-05, 8.456408977508545e-05, 8.702278137207031e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 14.0, 25.0, 27.0, 50.0, 84.0, 187.0, 377.0, 1164.0, 4819.0, 76620.0, 907482.0, 51875.0, 4114.0, 975.0, 392.0, 160.0, 75.0, 44.0, 25.0, 18.0, 9.0, 4.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039306640625, -0.03822827339172363, -0.037149906158447266, -0.0360715389251709, -0.03499317169189453, -0.033914804458618164, -0.0328364372253418, -0.03175806999206543, -0.030679702758789062, -0.029601335525512695, -0.028522968292236328, -0.02744460105895996, -0.026366233825683594, -0.025287866592407227, -0.02420949935913086, -0.023131132125854492, -0.022052764892578125, -0.020974397659301758, -0.01989603042602539, -0.018817663192749023, -0.017739295959472656, -0.01666092872619629, -0.015582561492919922, -0.014504194259643555, -0.013425827026367188, -0.01234745979309082, -0.011269092559814453, -0.010190725326538086, -0.009112358093261719, -0.008033990859985352, -0.006955623626708984, -0.005877256393432617, -0.00479888916015625, -0.003720521926879883, -0.0026421546936035156, -0.0015637874603271484, -0.00048542022705078125, 0.0005929470062255859, 0.0016713142395019531, 0.0027496814727783203, 0.0038280487060546875, 0.004906415939331055, 0.005984783172607422, 0.007063150405883789, 0.008141517639160156, 0.009219884872436523, 0.01029825210571289, 0.011376619338989258, 0.012454986572265625, 0.013533353805541992, 0.01461172103881836, 0.015690088272094727, 0.016768455505371094, 0.01784682273864746, 0.018925189971923828, 0.020003557205200195, 0.021081924438476562, 0.02216029167175293, 0.023238658905029297, 0.024317026138305664, 0.02539539337158203, 0.0264737606048584, 0.027552127838134766, 0.028630495071411133, 0.0297088623046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 14.0, 18.0, 30.0, 59.0, 97.0, 129.0, 170.0, 151.0, 106.0, 80.0, 44.0, 41.0, 18.0, 16.0, 9.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.029632568359375, -0.02885293960571289, -0.02807331085205078, -0.027293682098388672, -0.026514053344726562, -0.025734424591064453, -0.024954795837402344, -0.024175167083740234, -0.023395538330078125, -0.022615909576416016, -0.021836280822753906, -0.021056652069091797, -0.020277023315429688, -0.019497394561767578, -0.01871776580810547, -0.01793813705444336, -0.01715850830078125, -0.01637887954711914, -0.015599250793457031, -0.014819622039794922, -0.014039993286132812, -0.013260364532470703, -0.012480735778808594, -0.011701107025146484, -0.010921478271484375, -0.010141849517822266, -0.009362220764160156, -0.008582592010498047, -0.0078029632568359375, -0.007023334503173828, -0.006243705749511719, -0.005464076995849609, -0.0046844482421875, -0.0039048194885253906, -0.0031251907348632812, -0.002345561981201172, -0.0015659332275390625, -0.0007863044738769531, -6.67572021484375e-06, 0.0007729530334472656, 0.001552581787109375, 0.0023322105407714844, 0.0031118392944335938, 0.003891468048095703, 0.0046710968017578125, 0.005450725555419922, 0.006230354309082031, 0.007009983062744141, 0.00778961181640625, 0.00856924057006836, 0.009348869323730469, 0.010128498077392578, 0.010908126831054688, 0.011687755584716797, 0.012467384338378906, 0.013247013092041016, 0.014026641845703125, 0.014806270599365234, 0.015585899353027344, 0.016365528106689453, 0.017145156860351562, 0.017924785614013672, 0.01870441436767578, 0.01948404312133789, 0.020263671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 16.0, 36.0, 148.0, 414.0, 279.0, 70.0, 23.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.119673252105713, -1.0980406999588013, -1.0764080286026, -1.0547754764556885, -1.0331428050994873, -1.0115102529525757, -0.9898776412010193, -0.9682450294494629, -0.9466124773025513, -0.9249798655509949, -0.9033472537994385, -0.8817147016525269, -0.8600820899009705, -0.8384494781494141, -0.8168168663978577, -0.7951842546463013, -0.7735516428947449, -0.7519190311431885, -0.7302864193916321, -0.7086538076400757, -0.6870212554931641, -0.6653886437416077, -0.6437560319900513, -0.6221234202384949, -0.6004908084869385, -0.5788581967353821, -0.5572255849838257, -0.5355930328369141, -0.5139604210853577, -0.49232780933380127, -0.4706951975822449, -0.4490625858306885, -0.42743003368377686, -0.40579742193222046, -0.38416483998298645, -0.36253222823143005, -0.34089964628219604, -0.31926703453063965, -0.29763442277908325, -0.27600181102752686, -0.25436922907829285, -0.23273663222789764, -0.21110403537750244, -0.18947142362594604, -0.16783882677555084, -0.14620622992515564, -0.12457361817359924, -0.10294102132320404, -0.08130842447280884, -0.05967582389712334, -0.038043223321437836, -0.016410619020462036, 0.0052219778299331665, 0.02685457468032837, 0.048487186431884766, 0.07011978328227997, 0.09175238013267517, 0.11338497698307037, 0.13501757383346558, 0.15665018558502197, 0.17828278243541718, 0.19991537928581238, 0.22154799103736877, 0.24318058788776398, 0.2648131847381592]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 11.0, 13.0, 8.0, 19.0, 19.0, 22.0, 34.0, 30.0, 31.0, 32.0, 42.0, 48.0, 43.0, 44.0, 48.0, 58.0, 50.0, 45.0, 47.0, 35.0, 42.0, 37.0, 33.0, 25.0, 24.0, 28.0, 23.0, 20.0, 13.0, 15.0, 7.0, 6.0, 10.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2805614471435547, -0.27219751477241516, -0.26383358240127563, -0.2554696500301361, -0.24710571765899658, -0.23874178528785706, -0.23037786781787872, -0.2220139354467392, -0.21365000307559967, -0.20528607070446014, -0.19692213833332062, -0.1885582059621811, -0.18019428849220276, -0.17183035612106323, -0.1634664237499237, -0.15510249137878418, -0.14673855900764465, -0.13837462663650513, -0.1300106942653656, -0.12164676934480667, -0.11328283697366714, -0.10491890460252762, -0.09655497968196869, -0.08819104731082916, -0.07982711493968964, -0.07146318256855011, -0.06309925019741058, -0.054735325276851654, -0.04637139290571213, -0.0380074605345726, -0.029643531888723373, -0.021279603242874146, -0.01291567087173462, -0.004551740363240242, 0.003812190145254135, 0.012176120653748512, 0.02054005116224289, 0.028903983533382416, 0.037267912179231644, 0.04563184082508087, 0.0539957731962204, 0.062359705567359924, 0.07072363793849945, 0.07908756285905838, 0.0874514952301979, 0.09581542760133743, 0.10417935252189636, 0.11254328489303589, 0.12090721726417542, 0.12927114963531494, 0.13763508200645447, 0.145999014377594, 0.15436294674873352, 0.16272687911987305, 0.17109079658985138, 0.1794547289609909, 0.18781866133213043, 0.19618259370326996, 0.20454652607440948, 0.212910458445549, 0.22127437591552734, 0.22963830828666687, 0.2380022406578064, 0.24636617302894592, 0.25473010540008545]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 7.0, 11.0, 18.0, 14.0, 20.0, 32.0, 34.0, 47.0, 91.0, 111.0, 160.0, 292.0, 542.0, 985.0, 1983.0, 4878.0, 16834.0, 113996.0, 3815720.0, 207713.0, 21622.0, 5494.0, 1902.0, 849.0, 426.0, 198.0, 120.0, 59.0, 39.0, 23.0, 13.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12497138977050781, -0.12164688110351562, -0.11832237243652344, -0.11499786376953125, -0.11167335510253906, -0.10834884643554688, -0.10502433776855469, -0.1016998291015625, -0.09837532043457031, -0.09505081176757812, -0.09172630310058594, -0.08840179443359375, -0.08507728576660156, -0.08175277709960938, -0.07842826843261719, -0.075103759765625, -0.07177925109863281, -0.06845474243164062, -0.06513023376464844, -0.06180572509765625, -0.05848121643066406, -0.055156707763671875, -0.05183219909667969, -0.0485076904296875, -0.04518318176269531, -0.041858673095703125, -0.03853416442871094, -0.03520965576171875, -0.03188514709472656, -0.028560638427734375, -0.025236129760742188, -0.02191162109375, -0.018587112426757812, -0.015262603759765625, -0.011938095092773438, -0.00861358642578125, -0.0052890777587890625, -0.001964569091796875, 0.0013599395751953125, 0.0046844482421875, 0.008008956909179688, 0.011333465576171875, 0.014657974243164062, 0.01798248291015625, 0.021306991577148438, 0.024631500244140625, 0.027956008911132812, 0.031280517578125, 0.03460502624511719, 0.037929534912109375, 0.04125404357910156, 0.04457855224609375, 0.04790306091308594, 0.051227569580078125, 0.05455207824707031, 0.0578765869140625, 0.06120109558105469, 0.06452560424804688, 0.06785011291503906, 0.07117462158203125, 0.07449913024902344, 0.07782363891601562, 0.08114814758300781, 0.08447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 6.0, 9.0, 8.0, 17.0, 16.0, 27.0, 39.0, 45.0, 47.0, 62.0, 60.0, 74.0, 88.0, 79.0, 75.0, 70.0, 54.0, 49.0, 36.0, 38.0, 30.0, 25.0, 19.0, 11.0, 4.0, 9.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184783935546875, -0.017963767051696777, -0.017449140548706055, -0.016934514045715332, -0.01641988754272461, -0.015905261039733887, -0.015390634536743164, -0.014876008033752441, -0.014361381530761719, -0.013846755027770996, -0.013332128524780273, -0.01281750202178955, -0.012302875518798828, -0.011788249015808105, -0.011273622512817383, -0.01075899600982666, -0.010244369506835938, -0.009729743003845215, -0.009215116500854492, -0.00870048999786377, -0.008185863494873047, -0.007671236991882324, -0.0071566104888916016, -0.006641983985900879, -0.006127357482910156, -0.005612730979919434, -0.005098104476928711, -0.004583477973937988, -0.004068851470947266, -0.003554224967956543, -0.0030395984649658203, -0.0025249719619750977, -0.002010345458984375, -0.0014957189559936523, -0.0009810924530029297, -0.00046646595001220703, 4.8160552978515625e-05, 0.0005627870559692383, 0.001077413558959961, 0.0015920400619506836, 0.0021066665649414062, 0.002621293067932129, 0.0031359195709228516, 0.0036505460739135742, 0.004165172576904297, 0.0046797990798950195, 0.005194425582885742, 0.005709052085876465, 0.0062236785888671875, 0.00673830509185791, 0.007252931594848633, 0.0077675580978393555, 0.008282184600830078, 0.0087968111038208, 0.009311437606811523, 0.009826064109802246, 0.010340690612792969, 0.010855317115783691, 0.011369943618774414, 0.011884570121765137, 0.01239919662475586, 0.012913823127746582, 0.013428449630737305, 0.013943076133728027, 0.01445770263671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 11.0, 16.0, 13.0, 26.0, 45.0, 52.0, 90.0, 211.0, 448.0, 1044.0, 4115.0, 37933.0, 4111928.0, 32617.0, 4026.0, 982.0, 356.0, 143.0, 89.0, 42.0, 32.0, 19.0, 11.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21630859375, -0.21053695678710938, -0.20476531982421875, -0.19899368286132812, -0.1932220458984375, -0.18745040893554688, -0.18167877197265625, -0.17590713500976562, -0.170135498046875, -0.16436386108398438, -0.15859222412109375, -0.15282058715820312, -0.1470489501953125, -0.14127731323242188, -0.13550567626953125, -0.12973403930664062, -0.12396240234375, -0.11819076538085938, -0.11241912841796875, -0.10664749145507812, -0.1008758544921875, -0.09510421752929688, -0.08933258056640625, -0.08356094360351562, -0.077789306640625, -0.07201766967773438, -0.06624603271484375, -0.060474395751953125, -0.0547027587890625, -0.048931121826171875, -0.04315948486328125, -0.037387847900390625, -0.0316162109375, -0.025844573974609375, -0.02007293701171875, -0.014301300048828125, -0.0085296630859375, -0.002758026123046875, 0.00301361083984375, 0.008785247802734375, 0.014556884765625, 0.020328521728515625, 0.02610015869140625, 0.031871795654296875, 0.0376434326171875, 0.043415069580078125, 0.04918670654296875, 0.054958343505859375, 0.06072998046875, 0.06650161743164062, 0.07227325439453125, 0.07804489135742188, 0.0838165283203125, 0.08958816528320312, 0.09535980224609375, 0.10113143920898438, 0.106903076171875, 0.11267471313476562, 0.11844635009765625, 0.12421798706054688, 0.1299896240234375, 0.13576126098632812, 0.14153289794921875, 0.14730453491210938, 0.153076171875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 6.0, 2.0, 7.0, 7.0, 16.0, 29.0, 55.0, 132.0, 541.0, 2425.0, 583.0, 135.0, 59.0, 24.0, 12.0, 14.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.06911277770996094, -0.06736373901367188, -0.06561470031738281, -0.06386566162109375, -0.06211662292480469, -0.060367584228515625, -0.05861854553222656, -0.0568695068359375, -0.05512046813964844, -0.053371429443359375, -0.05162239074707031, -0.04987335205078125, -0.04812431335449219, -0.046375274658203125, -0.04462623596191406, -0.042877197265625, -0.04112815856933594, -0.039379119873046875, -0.03763008117675781, -0.03588104248046875, -0.03413200378417969, -0.032382965087890625, -0.030633926391601562, -0.0288848876953125, -0.027135848999023438, -0.025386810302734375, -0.023637771606445312, -0.02188873291015625, -0.020139694213867188, -0.018390655517578125, -0.016641616821289062, -0.014892578125, -0.013143539428710938, -0.011394500732421875, -0.009645462036132812, -0.00789642333984375, -0.0061473846435546875, -0.004398345947265625, -0.0026493072509765625, -0.0009002685546875, 0.0008487701416015625, 0.002597808837890625, 0.0043468475341796875, 0.00609588623046875, 0.007844924926757812, 0.009593963623046875, 0.011343002319335938, 0.013092041015625, 0.014841079711914062, 0.016590118408203125, 0.018339157104492188, 0.02008819580078125, 0.021837234497070312, 0.023586273193359375, 0.025335311889648438, 0.0270843505859375, 0.028833389282226562, 0.030582427978515625, 0.03233146667480469, 0.03408050537109375, 0.03582954406738281, 0.037578582763671875, 0.03932762145996094, 0.04107666015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 68.0, 819.0, 107.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0050221681594849, -0.9751108288764954, -0.9451994299888611, -0.9152880907058716, -0.8853766918182373, -0.8554653525352478, -0.8255540132522583, -0.795642614364624, -0.7657312154769897, -0.7358198761940002, -0.705908477306366, -0.6759971380233765, -0.6460857391357422, -0.6161743998527527, -0.5862630605697632, -0.5563516616821289, -0.5264403223991394, -0.4965289533138275, -0.4666175842285156, -0.4367062449455261, -0.40679484605789185, -0.37688350677490234, -0.34697213768959045, -0.31706076860427856, -0.2871493995189667, -0.2572380304336548, -0.2273266613483429, -0.1974153071641922, -0.1675039380788803, -0.13759256899356842, -0.10768121480941772, -0.07776984572410583, -0.047858476638793945, -0.017947111278772354, 0.011964254081249237, 0.04187561571598053, 0.07178698480129242, 0.10169835388660431, 0.131609708070755, 0.1615210771560669, 0.19143244624137878, 0.22134381532669067, 0.25125518441200256, 0.28116655349731445, 0.31107789278030396, 0.34098929166793823, 0.37090063095092773, 0.4008120000362396, 0.4307233691215515, 0.4606347382068634, 0.4905461072921753, 0.5204574465751648, 0.5503688454627991, 0.5802801847457886, 0.6101915836334229, 0.6401029229164124, 0.6700142621994019, 0.6999256014823914, 0.7298370003700256, 0.7597483396530151, 0.7896597385406494, 0.8195710778236389, 0.8494824171066284, 0.8793938159942627, 0.909305214881897]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 24.0, 27.0, 23.0, 37.0, 31.0, 59.0, 60.0, 66.0, 90.0, 77.0, 83.0, 73.0, 60.0, 66.0, 47.0, 33.0, 42.0, 16.0, 17.0, 13.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17158102989196777, -0.16578951478004456, -0.15999801456928253, -0.1542065143585205, -0.1484149992465973, -0.14262348413467407, -0.13683198392391205, -0.13104048371315002, -0.1252489686012268, -0.11945746093988419, -0.11366595327854156, -0.10787444561719894, -0.10208293795585632, -0.0962914302945137, -0.09049992263317108, -0.08470841497182846, -0.07891690731048584, -0.07312539964914322, -0.0673338919878006, -0.06154238432645798, -0.055750876665115356, -0.049959369003772736, -0.044167861342430115, -0.038376353681087494, -0.03258484601974487, -0.026793338358402252, -0.02100183069705963, -0.01521032303571701, -0.00941881537437439, -0.003627307713031769, 0.002164199948310852, 0.007955707609653473, 0.013747215270996094, 0.019538722932338715, 0.025330230593681335, 0.031121738255023956, 0.03691324591636658, 0.0427047535777092, 0.04849626123905182, 0.05428776890039444, 0.06007927656173706, 0.06587078422307968, 0.0716622918844223, 0.07745379954576492, 0.08324530720710754, 0.08903681486845016, 0.09482832252979279, 0.1006198301911354, 0.10641133785247803, 0.11220284551382065, 0.11799435317516327, 0.12378586083650589, 0.1295773684978485, 0.13536888360977173, 0.14116038382053375, 0.14695188403129578, 0.152743399143219, 0.1585349142551422, 0.16432641446590424, 0.17011791467666626, 0.17590942978858948, 0.1817009449005127, 0.18749244511127472, 0.19328394532203674, 0.19907546043395996]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 10.0, 6.0, 11.0, 23.0, 23.0, 34.0, 51.0, 65.0, 135.0, 225.0, 319.0, 659.0, 1363.0, 3774.0, 14374.0, 92521.0, 587744.0, 298142.0, 37174.0, 7410.0, 2306.0, 994.0, 465.0, 273.0, 151.0, 87.0, 62.0, 47.0, 38.0, 14.0, 19.0, 13.0, 9.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05756950378417969, -0.055812835693359375, -0.05405616760253906, -0.05229949951171875, -0.05054283142089844, -0.048786163330078125, -0.04702949523925781, -0.0452728271484375, -0.04351615905761719, -0.041759490966796875, -0.04000282287597656, -0.03824615478515625, -0.03648948669433594, -0.034732818603515625, -0.03297615051269531, -0.031219482421875, -0.029462814331054688, -0.027706146240234375, -0.025949478149414062, -0.02419281005859375, -0.022436141967773438, -0.020679473876953125, -0.018922805786132812, -0.0171661376953125, -0.015409469604492188, -0.013652801513671875, -0.011896133422851562, -0.01013946533203125, -0.008382797241210938, -0.006626129150390625, -0.0048694610595703125, -0.00311279296875, -0.0013561248779296875, 0.000400543212890625, 0.0021572113037109375, 0.00391387939453125, 0.0056705474853515625, 0.007427215576171875, 0.009183883666992188, 0.0109405517578125, 0.012697219848632812, 0.014453887939453125, 0.016210556030273438, 0.01796722412109375, 0.019723892211914062, 0.021480560302734375, 0.023237228393554688, 0.024993896484375, 0.026750564575195312, 0.028507232666015625, 0.030263900756835938, 0.03202056884765625, 0.03377723693847656, 0.035533905029296875, 0.03729057312011719, 0.0390472412109375, 0.04080390930175781, 0.042560577392578125, 0.04431724548339844, 0.04607391357421875, 0.04783058166503906, 0.049587249755859375, 0.05134391784667969, 0.0531005859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 9.0, 18.0, 24.0, 35.0, 59.0, 75.0, 82.0, 111.0, 137.0, 95.0, 112.0, 64.0, 60.0, 45.0, 33.0, 17.0, 15.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027801513671875, -0.027116060256958008, -0.026430606842041016, -0.025745153427124023, -0.02505970001220703, -0.02437424659729004, -0.023688793182373047, -0.023003339767456055, -0.022317886352539062, -0.02163243293762207, -0.020946979522705078, -0.020261526107788086, -0.019576072692871094, -0.0188906192779541, -0.01820516586303711, -0.017519712448120117, -0.016834259033203125, -0.016148805618286133, -0.01546335220336914, -0.014777898788452148, -0.014092445373535156, -0.013406991958618164, -0.012721538543701172, -0.01203608512878418, -0.011350631713867188, -0.010665178298950195, -0.009979724884033203, -0.009294271469116211, -0.008608818054199219, -0.007923364639282227, -0.007237911224365234, -0.006552457809448242, -0.00586700439453125, -0.005181550979614258, -0.004496097564697266, -0.0038106441497802734, -0.0031251907348632812, -0.002439737319946289, -0.0017542839050292969, -0.0010688304901123047, -0.0003833770751953125, 0.0003020763397216797, 0.0009875297546386719, 0.001672983169555664, 0.0023584365844726562, 0.0030438899993896484, 0.0037293434143066406, 0.004414796829223633, 0.005100250244140625, 0.005785703659057617, 0.006471157073974609, 0.0071566104888916016, 0.007842063903808594, 0.008527517318725586, 0.009212970733642578, 0.00989842414855957, 0.010583877563476562, 0.011269330978393555, 0.011954784393310547, 0.012640237808227539, 0.013325691223144531, 0.014011144638061523, 0.014696598052978516, 0.015382051467895508, 0.0160675048828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 14.0, 16.0, 22.0, 37.0, 48.0, 79.0, 103.0, 177.0, 301.0, 707.0, 2123.0, 8722.0, 51212.0, 347532.0, 521447.0, 96278.0, 14499.0, 3252.0, 1008.0, 387.0, 209.0, 121.0, 80.0, 47.0, 32.0, 25.0, 19.0, 13.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03668212890625, -0.035424232482910156, -0.03416633605957031, -0.03290843963623047, -0.031650543212890625, -0.03039264678955078, -0.029134750366210938, -0.027876853942871094, -0.02661895751953125, -0.025361061096191406, -0.024103164672851562, -0.02284526824951172, -0.021587371826171875, -0.02032947540283203, -0.019071578979492188, -0.017813682556152344, -0.0165557861328125, -0.015297889709472656, -0.014039993286132812, -0.012782096862792969, -0.011524200439453125, -0.010266304016113281, -0.009008407592773438, -0.007750511169433594, -0.00649261474609375, -0.005234718322753906, -0.0039768218994140625, -0.0027189254760742188, -0.001461029052734375, -0.00020313262939453125, 0.0010547637939453125, 0.0023126602172851562, 0.003570556640625, 0.004828453063964844, 0.0060863494873046875, 0.007344245910644531, 0.008602142333984375, 0.009860038757324219, 0.011117935180664062, 0.012375831604003906, 0.01363372802734375, 0.014891624450683594, 0.016149520874023438, 0.01740741729736328, 0.018665313720703125, 0.01992321014404297, 0.021181106567382812, 0.022439002990722656, 0.0236968994140625, 0.024954795837402344, 0.026212692260742188, 0.02747058868408203, 0.028728485107421875, 0.02998638153076172, 0.031244277954101562, 0.032502174377441406, 0.03376007080078125, 0.035017967224121094, 0.03627586364746094, 0.03753376007080078, 0.038791656494140625, 0.04004955291748047, 0.04130744934082031, 0.042565345764160156, 0.0438232421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 1.0, 6.0, 11.0, 5.0, 20.0, 12.0, 23.0, 20.0, 36.0, 32.0, 25.0, 41.0, 55.0, 42.0, 51.0, 55.0, 56.0, 44.0, 56.0, 50.0, 41.0, 50.0, 40.0, 36.0, 30.0, 43.0, 22.0, 17.0, 12.0, 13.0, 14.0, 11.0, 9.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.03478431701660156, -0.033496856689453125, -0.03220939636230469, -0.03092193603515625, -0.029634475708007812, -0.028347015380859375, -0.027059555053710938, -0.0257720947265625, -0.024484634399414062, -0.023197174072265625, -0.021909713745117188, -0.02062225341796875, -0.019334793090820312, -0.018047332763671875, -0.016759872436523438, -0.015472412109375, -0.014184951782226562, -0.012897491455078125, -0.011610031127929688, -0.01032257080078125, -0.009035110473632812, -0.007747650146484375, -0.0064601898193359375, -0.0051727294921875, -0.0038852691650390625, -0.002597808837890625, -0.0013103485107421875, -2.288818359375e-05, 0.0012645721435546875, 0.002552032470703125, 0.0038394927978515625, 0.005126953125, 0.0064144134521484375, 0.007701873779296875, 0.008989334106445312, 0.01027679443359375, 0.011564254760742188, 0.012851715087890625, 0.014139175415039062, 0.0154266357421875, 0.016714096069335938, 0.018001556396484375, 0.019289016723632812, 0.02057647705078125, 0.021863937377929688, 0.023151397705078125, 0.024438858032226562, 0.025726318359375, 0.027013778686523438, 0.028301239013671875, 0.029588699340820312, 0.03087615966796875, 0.03216361999511719, 0.033451080322265625, 0.03473854064941406, 0.0360260009765625, 0.03731346130371094, 0.038600921630859375, 0.03988838195800781, 0.04117584228515625, 0.04246330261230469, 0.043750762939453125, 0.04503822326660156, 0.04632568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 15.0, 20.0, 27.0, 43.0, 91.0, 184.0, 360.0, 795.0, 1952.0, 6678.0, 43836.0, 542001.0, 412887.0, 31085.0, 5434.0, 1747.0, 715.0, 321.0, 153.0, 76.0, 45.0, 28.0, 7.0, 10.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0195465087890625, -0.018934249877929688, -0.018321990966796875, -0.017709732055664062, -0.01709747314453125, -0.016485214233398438, -0.015872955322265625, -0.015260696411132812, -0.0146484375, -0.014036178588867188, -0.013423919677734375, -0.012811660766601562, -0.01219940185546875, -0.011587142944335938, -0.010974884033203125, -0.010362625122070312, -0.0097503662109375, -0.009138107299804688, -0.008525848388671875, -0.007913589477539062, -0.00730133056640625, -0.0066890716552734375, -0.006076812744140625, -0.0054645538330078125, -0.004852294921875, -0.0042400360107421875, -0.003627777099609375, -0.0030155181884765625, -0.00240325927734375, -0.0017910003662109375, -0.001178741455078125, -0.0005664825439453125, 4.57763671875e-05, 0.0006580352783203125, 0.001270294189453125, 0.0018825531005859375, 0.00249481201171875, 0.0031070709228515625, 0.003719329833984375, 0.0043315887451171875, 0.00494384765625, 0.0055561065673828125, 0.006168365478515625, 0.0067806243896484375, 0.00739288330078125, 0.008005142211914062, 0.008617401123046875, 0.009229660034179688, 0.0098419189453125, 0.010454177856445312, 0.011066436767578125, 0.011678695678710938, 0.01229095458984375, 0.012903213500976562, 0.013515472412109375, 0.014127731323242188, 0.014739990234375, 0.015352249145507812, 0.015964508056640625, 0.016576766967773438, 0.01718902587890625, 0.017801284790039062, 0.018413543701171875, 0.019025802612304688, 0.0196380615234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [6.0, 7.0, 5.0, 11.0, 19.0, 51.0, 88.0, 154.0, 214.0, 195.0, 128.0, 66.0, 44.0, 16.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.987550735473633e-05, -3.5363249480724335e-05, -3.085099160671234e-05, -2.6338733732700348e-05, -2.1826475858688354e-05, -1.731421798467636e-05, -1.2801960110664368e-05, -8.289702236652374e-06, -3.777444362640381e-06, 7.348135113716125e-07, 5.247071385383606e-06, 9.7593292593956e-06, 1.4271587133407593e-05, 1.8783845007419586e-05, 2.329610288143158e-05, 2.7808360755443573e-05, 3.2320618629455566e-05, 3.683287650346756e-05, 4.134513437747955e-05, 4.585739225149155e-05, 5.036965012550354e-05, 5.4881907999515533e-05, 5.939416587352753e-05, 6.390642374753952e-05, 6.841868162155151e-05, 7.293093949556351e-05, 7.74431973695755e-05, 8.19554552435875e-05, 8.646771311759949e-05, 9.097997099161148e-05, 9.549222886562347e-05, 0.00010000448673963547, 0.00010451674461364746, 0.00010902900248765945, 0.00011354126036167145, 0.00011805351823568344, 0.00012256577610969543, 0.00012707803398370743, 0.00013159029185771942, 0.00013610254973173141, 0.0001406148076057434, 0.0001451270654797554, 0.0001496393233537674, 0.0001541515812277794, 0.00015866383910179138, 0.00016317609697580338, 0.00016768835484981537, 0.00017220061272382736, 0.00017671287059783936, 0.00018122512847185135, 0.00018573738634586334, 0.00019024964421987534, 0.00019476190209388733, 0.00019927415996789932, 0.00020378641784191132, 0.0002082986757159233, 0.0002128109335899353, 0.0002173231914639473, 0.0002218354493379593, 0.00022634770721197128, 0.00023085996508598328, 0.00023537222295999527, 0.00023988448083400726, 0.00024439673870801926, 0.00024890899658203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 7.0, 16.0, 23.0, 47.0, 69.0, 110.0, 233.0, 449.0, 1332.0, 4940.0, 34316.0, 466919.0, 495566.0, 37033.0, 5051.0, 1398.0, 505.0, 238.0, 114.0, 68.0, 40.0, 21.0, 13.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0161895751953125, -0.015567302703857422, -0.014945030212402344, -0.014322757720947266, -0.013700485229492188, -0.01307821273803711, -0.012455940246582031, -0.011833667755126953, -0.011211395263671875, -0.010589122772216797, -0.009966850280761719, -0.00934457778930664, -0.008722305297851562, -0.008100032806396484, -0.007477760314941406, -0.006855487823486328, -0.00623321533203125, -0.005610942840576172, -0.004988670349121094, -0.004366397857666016, -0.0037441253662109375, -0.0031218528747558594, -0.0024995803833007812, -0.0018773078918457031, -0.001255035400390625, -0.0006327629089355469, -1.049041748046875e-05, 0.0006117820739746094, 0.0012340545654296875, 0.0018563270568847656, 0.0024785995483398438, 0.003100872039794922, 0.00372314453125, 0.004345417022705078, 0.004967689514160156, 0.005589962005615234, 0.0062122344970703125, 0.006834506988525391, 0.007456779479980469, 0.008079051971435547, 0.008701324462890625, 0.009323596954345703, 0.009945869445800781, 0.01056814193725586, 0.011190414428710938, 0.011812686920166016, 0.012434959411621094, 0.013057231903076172, 0.01367950439453125, 0.014301776885986328, 0.014924049377441406, 0.015546321868896484, 0.016168594360351562, 0.01679086685180664, 0.01741313934326172, 0.018035411834716797, 0.018657684326171875, 0.019279956817626953, 0.01990222930908203, 0.02052450180053711, 0.021146774291992188, 0.021769046783447266, 0.022391319274902344, 0.023013591766357422, 0.0236358642578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 3.0, 5.0, 3.0, 15.0, 17.0, 16.0, 35.0, 24.0, 39.0, 62.0, 51.0, 82.0, 70.0, 74.0, 76.0, 74.0, 67.0, 63.0, 39.0, 39.0, 34.0, 24.0, 18.0, 12.0, 7.0, 10.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00983428955078125, -0.009452581405639648, -0.009070873260498047, -0.008689165115356445, -0.008307456970214844, -0.007925748825073242, -0.007544040679931641, -0.007162332534790039, -0.0067806243896484375, -0.006398916244506836, -0.006017208099365234, -0.005635499954223633, -0.005253791809082031, -0.00487208366394043, -0.004490375518798828, -0.0041086673736572266, -0.003726959228515625, -0.0033452510833740234, -0.002963542938232422, -0.0025818347930908203, -0.0022001266479492188, -0.0018184185028076172, -0.0014367103576660156, -0.001055002212524414, -0.0006732940673828125, -0.00029158592224121094, 9.012222290039062e-05, 0.0004718303680419922, 0.0008535385131835938, 0.0012352466583251953, 0.0016169548034667969, 0.0019986629486083984, 0.00238037109375, 0.0027620792388916016, 0.003143787384033203, 0.0035254955291748047, 0.003907203674316406, 0.004288911819458008, 0.004670619964599609, 0.005052328109741211, 0.0054340362548828125, 0.005815744400024414, 0.006197452545166016, 0.006579160690307617, 0.006960868835449219, 0.00734257698059082, 0.007724285125732422, 0.008105993270874023, 0.008487701416015625, 0.008869409561157227, 0.009251117706298828, 0.00963282585144043, 0.010014533996582031, 0.010396242141723633, 0.010777950286865234, 0.011159658432006836, 0.011541366577148438, 0.011923074722290039, 0.01230478286743164, 0.012686491012573242, 0.013068199157714844, 0.013449907302856445, 0.013831615447998047, 0.014213323593139648, 0.01459503173828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 18.0, 54.0, 136.0, 233.0, 261.0, 172.0, 69.0, 30.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18249693512916565, -0.1712089478969574, -0.15992097556591034, -0.1486329883337021, -0.13734501600265503, -0.12605702877044678, -0.11476904153823853, -0.10348106175661087, -0.09219308197498322, -0.08090510219335556, -0.0696171224117279, -0.05832913517951965, -0.047041155397892, -0.03575317561626434, -0.02446518838405609, -0.013177208602428436, -0.0018892288208007812, 0.009398752823472023, 0.020686734467744827, 0.03197471797466278, 0.043262697756290436, 0.05455067753791809, 0.06583866477012634, 0.077126644551754, 0.08841462433338165, 0.09970260411500931, 0.11099058389663696, 0.12227857112884521, 0.13356655836105347, 0.14485453069210052, 0.15614251792430878, 0.16743049025535583, 0.1787184476852417, 0.19000643491744995, 0.201294407248497, 0.21258239448070526, 0.22387036681175232, 0.23515835404396057, 0.24644634127616882, 0.2577343285083771, 0.26902228593826294, 0.2803102731704712, 0.29159826040267944, 0.3028862476348877, 0.31417420506477356, 0.3254621922969818, 0.33675017952919006, 0.3480381667613983, 0.35932615399360657, 0.3706141412258148, 0.38190212845802307, 0.39319008588790894, 0.4044780731201172, 0.41576606035232544, 0.4270540475845337, 0.43834203481674194, 0.4496300220489502, 0.46091800928115845, 0.4722059965133667, 0.48349398374557495, 0.4947819411754608, 0.5060698986053467, 0.5173579454421997, 0.5286458730697632, 0.5399338603019714]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 8.0, 16.0, 14.0, 21.0, 20.0, 21.0, 31.0, 29.0, 36.0, 41.0, 52.0, 39.0, 38.0, 41.0, 46.0, 39.0, 47.0, 39.0, 39.0, 37.0, 28.0, 31.0, 29.0, 36.0, 24.0, 27.0, 24.0, 21.0, 18.0, 18.0, 17.0, 3.0, 8.0, 8.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.2228478193283081, -0.21688516438007355, -0.210922509431839, -0.20495986938476562, -0.19899721443653107, -0.1930345594882965, -0.18707191944122314, -0.1811092644929886, -0.17514660954475403, -0.16918395459651947, -0.1632212996482849, -0.15725865960121155, -0.151296004652977, -0.14533334970474243, -0.13937070965766907, -0.1334080547094345, -0.12744539976119995, -0.1214827448129654, -0.11552009731531143, -0.10955744981765747, -0.10359479486942291, -0.09763213992118835, -0.0916694924235344, -0.08570684492588043, -0.07974418997764587, -0.07378153502941132, -0.06781888753175735, -0.061856236308813095, -0.055893585085868835, -0.049930933862924576, -0.043968282639980316, -0.038005631417036057, -0.0320429801940918, -0.026080328971147537, -0.020117677748203278, -0.014155026525259018, -0.008192375302314758, -0.0022297240793704987, 0.003732927143573761, 0.00969557836651802, 0.01565822958946228, 0.02162088081240654, 0.0275835320353508, 0.03354618325829506, 0.03950883448123932, 0.04547148570418358, 0.05143413692712784, 0.0573967881500721, 0.06335943937301636, 0.06932209432125092, 0.07528474181890488, 0.08124738931655884, 0.0872100442647934, 0.09317269921302795, 0.09913534671068192, 0.10509799420833588, 0.11106064915657043, 0.11702330410480499, 0.12298595160245895, 0.12894859910011292, 0.13491125404834747, 0.14087390899658203, 0.1468365490436554, 0.15279920399188995, 0.1587618589401245]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 8.0, 5.0, 11.0, 12.0, 10.0, 19.0, 22.0, 30.0, 54.0, 74.0, 134.0, 177.0, 345.0, 575.0, 1264.0, 3487.0, 12039.0, 79652.0, 3858660.0, 211215.0, 19168.0, 4540.0, 1574.0, 623.0, 277.0, 140.0, 70.0, 38.0, 17.0, 11.0, 6.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.074951171875, -0.07284879684448242, -0.07074642181396484, -0.06864404678344727, -0.06654167175292969, -0.06443929672241211, -0.06233692169189453, -0.06023454666137695, -0.058132171630859375, -0.0560297966003418, -0.05392742156982422, -0.05182504653930664, -0.04972267150878906, -0.047620296478271484, -0.045517921447753906, -0.04341554641723633, -0.04131317138671875, -0.03921079635620117, -0.037108421325683594, -0.035006046295166016, -0.03290367126464844, -0.03080129623413086, -0.02869892120361328, -0.026596546173095703, -0.024494171142578125, -0.022391796112060547, -0.02028942108154297, -0.01818704605102539, -0.016084671020507812, -0.013982295989990234, -0.011879920959472656, -0.009777545928955078, -0.0076751708984375, -0.005572795867919922, -0.0034704208374023438, -0.0013680458068847656, 0.0007343292236328125, 0.0028367042541503906, 0.004939079284667969, 0.007041454315185547, 0.009143829345703125, 0.011246204376220703, 0.013348579406738281, 0.01545095443725586, 0.017553329467773438, 0.019655704498291016, 0.021758079528808594, 0.023860454559326172, 0.02596282958984375, 0.028065204620361328, 0.030167579650878906, 0.032269954681396484, 0.03437232971191406, 0.03647470474243164, 0.03857707977294922, 0.0406794548034668, 0.042781829833984375, 0.04488420486450195, 0.04698657989501953, 0.04908895492553711, 0.05119132995605469, 0.053293704986572266, 0.055396080017089844, 0.05749845504760742, 0.059600830078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 11.0, 19.0, 17.0, 18.0, 34.0, 62.0, 78.0, 92.0, 83.0, 95.0, 99.0, 105.0, 89.0, 64.0, 56.0, 26.0, 18.0, 15.0, 12.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0268096923828125, -0.026166677474975586, -0.025523662567138672, -0.024880647659301758, -0.024237632751464844, -0.02359461784362793, -0.022951602935791016, -0.0223085880279541, -0.021665573120117188, -0.021022558212280273, -0.02037954330444336, -0.019736528396606445, -0.01909351348876953, -0.018450498580932617, -0.017807483673095703, -0.01716446876525879, -0.016521453857421875, -0.01587843894958496, -0.015235424041748047, -0.014592409133911133, -0.013949394226074219, -0.013306379318237305, -0.01266336441040039, -0.012020349502563477, -0.011377334594726562, -0.010734319686889648, -0.010091304779052734, -0.00944828987121582, -0.008805274963378906, -0.008162260055541992, -0.007519245147705078, -0.006876230239868164, -0.00623321533203125, -0.005590200424194336, -0.004947185516357422, -0.004304170608520508, -0.0036611557006835938, -0.0030181407928466797, -0.0023751258850097656, -0.0017321109771728516, -0.0010890960693359375, -0.00044608116149902344, 0.00019693374633789062, 0.0008399486541748047, 0.0014829635620117188, 0.002125978469848633, 0.002768993377685547, 0.003412008285522461, 0.004055023193359375, 0.004698038101196289, 0.005341053009033203, 0.005984067916870117, 0.006627082824707031, 0.007270097732543945, 0.00791311264038086, 0.008556127548217773, 0.009199142456054688, 0.009842157363891602, 0.010485172271728516, 0.01112818717956543, 0.011771202087402344, 0.012414216995239258, 0.013057231903076172, 0.013700246810913086, 0.01434326171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 13.0, 15.0, 31.0, 50.0, 134.0, 271.0, 820.0, 5748.0, 357925.0, 3814488.0, 12574.0, 1440.0, 372.0, 193.0, 95.0, 53.0, 24.0, 17.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0872802734375, -0.08447742462158203, -0.08167457580566406, -0.0788717269897461, -0.07606887817382812, -0.07326602935791016, -0.07046318054199219, -0.06766033172607422, -0.06485748291015625, -0.06205463409423828, -0.05925178527832031, -0.056448936462402344, -0.053646087646484375, -0.050843238830566406, -0.04804039001464844, -0.04523754119873047, -0.0424346923828125, -0.03963184356689453, -0.03682899475097656, -0.034026145935058594, -0.031223297119140625, -0.028420448303222656, -0.025617599487304688, -0.02281475067138672, -0.02001190185546875, -0.01720905303955078, -0.014406204223632812, -0.011603355407714844, -0.008800506591796875, -0.005997657775878906, -0.0031948089599609375, -0.00039196014404296875, 0.002410888671875, 0.005213737487792969, 0.008016586303710938, 0.010819435119628906, 0.013622283935546875, 0.016425132751464844, 0.019227981567382812, 0.02203083038330078, 0.02483367919921875, 0.02763652801513672, 0.030439376831054688, 0.033242225646972656, 0.036045074462890625, 0.038847923278808594, 0.04165077209472656, 0.04445362091064453, 0.0472564697265625, 0.05005931854248047, 0.05286216735839844, 0.055665016174316406, 0.058467864990234375, 0.061270713806152344, 0.06407356262207031, 0.06687641143798828, 0.06967926025390625, 0.07248210906982422, 0.07528495788574219, 0.07808780670166016, 0.08089065551757812, 0.0836935043334961, 0.08649635314941406, 0.08929920196533203, 0.09210205078125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 15.0, 16.0, 39.0, 110.0, 366.0, 2135.0, 1006.0, 219.0, 69.0, 33.0, 22.0, 9.0, 9.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0215606689453125, -0.020723581314086914, -0.019886493682861328, -0.019049406051635742, -0.018212318420410156, -0.01737523078918457, -0.016538143157958984, -0.0157010555267334, -0.014863967895507812, -0.014026880264282227, -0.01318979263305664, -0.012352705001831055, -0.011515617370605469, -0.010678529739379883, -0.009841442108154297, -0.009004354476928711, -0.008167266845703125, -0.007330179214477539, -0.006493091583251953, -0.005656003952026367, -0.004818916320800781, -0.003981828689575195, -0.0031447410583496094, -0.0023076534271240234, -0.0014705657958984375, -0.0006334781646728516, 0.00020360946655273438, 0.0010406970977783203, 0.0018777847290039062, 0.002714872360229492, 0.003551959991455078, 0.004389047622680664, 0.00522613525390625, 0.006063222885131836, 0.006900310516357422, 0.007737398147583008, 0.008574485778808594, 0.00941157341003418, 0.010248661041259766, 0.011085748672485352, 0.011922836303710938, 0.012759923934936523, 0.01359701156616211, 0.014434099197387695, 0.015271186828613281, 0.016108274459838867, 0.016945362091064453, 0.01778244972229004, 0.018619537353515625, 0.01945662498474121, 0.020293712615966797, 0.021130800247192383, 0.02196788787841797, 0.022804975509643555, 0.02364206314086914, 0.024479150772094727, 0.025316238403320312, 0.0261533260345459, 0.026990413665771484, 0.02782750129699707, 0.028664588928222656, 0.029501676559448242, 0.030338764190673828, 0.031175851821899414, 0.032012939453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 30.0, 667.0, 300.0, 10.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46417441964149475, -0.4495387673377991, -0.4349031150341034, -0.4202674627304077, -0.4056318402290344, -0.39099618792533875, -0.37636053562164307, -0.3617248833179474, -0.3470892310142517, -0.33245357871055603, -0.31781792640686035, -0.30318230390548706, -0.2885466516017914, -0.2739109992980957, -0.2592753469944, -0.24463969469070435, -0.23000407218933105, -0.21536841988563538, -0.2007327824831009, -0.1860971301794052, -0.17146149277687073, -0.15682584047317505, -0.14219018816947937, -0.1275545358657837, -0.1129188984632492, -0.09828325361013412, -0.08364760875701904, -0.06901195645332336, -0.05437631160020828, -0.0397406667470932, -0.025105014443397522, -0.01046936959028244, 0.004166305065155029, 0.01880195178091526, 0.03343759849667549, 0.04807324707508087, 0.06270889192819595, 0.07734453678131104, 0.09198018908500671, 0.1066158339381218, 0.12125147879123688, 0.13588713109493256, 0.15052276849746704, 0.16515842080116272, 0.1797940731048584, 0.19442971050739288, 0.20906536281108856, 0.22370100021362305, 0.23833665251731873, 0.2529723048210144, 0.2676079571247101, 0.28224360942840576, 0.29687923192977905, 0.31151488423347473, 0.3261505365371704, 0.3407861888408661, 0.35542184114456177, 0.37005749344825745, 0.3846931457519531, 0.3993287682533264, 0.4139644205570221, 0.4286000728607178, 0.44323572516441345, 0.45787137746810913, 0.4725069999694824]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 11.0, 14.0, 15.0, 31.0, 46.0, 51.0, 70.0, 81.0, 104.0, 93.0, 87.0, 95.0, 72.0, 70.0, 55.0, 44.0, 27.0, 12.0, 7.0, 9.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08634567260742188, -0.08315745741128922, -0.07996924221515656, -0.0767810270190239, -0.07359281182289124, -0.07040458917617798, -0.06721637398004532, -0.06402815878391266, -0.06083994358778, -0.05765172839164734, -0.05446351319551468, -0.05127529427409172, -0.04808707907795906, -0.0448988638818264, -0.04171064496040344, -0.03852242976427078, -0.03533421456813812, -0.03214599937200546, -0.028957782313227654, -0.025769565254449844, -0.022581350058317184, -0.019393134862184525, -0.016204917803406715, -0.013016700744628906, -0.009828485548496246, -0.006640269421041012, -0.0034520532935857773, -0.00026383716613054276, 0.0029243789613246918, 0.006112594157457352, 0.00930081121623516, 0.01248902827501297, 0.01567724347114563, 0.01886545866727829, 0.0220536757260561, 0.025241892784833908, 0.028430107980966568, 0.03161832317709923, 0.034806542098522186, 0.037994757294654846, 0.041182972490787506, 0.044371187686920166, 0.047559402883052826, 0.050747621804475784, 0.053935837000608444, 0.057124052196741104, 0.06031227111816406, 0.06350048631429672, 0.06668870151042938, 0.06987691670656204, 0.0730651319026947, 0.07625334709882736, 0.07944156229496002, 0.08262978494167328, 0.08581800013780594, 0.0890062153339386, 0.09219443053007126, 0.09538264572620392, 0.09857086092233658, 0.10175907611846924, 0.1049472987651825, 0.10813550651073456, 0.11132372915744781, 0.11451194435358047, 0.11770015954971313]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 15.0, 16.0, 31.0, 35.0, 67.0, 105.0, 153.0, 310.0, 533.0, 1157.0, 2861.0, 9740.0, 51933.0, 376177.0, 506541.0, 79104.0, 13284.0, 3642.0, 1408.0, 605.0, 344.0, 174.0, 110.0, 65.0, 49.0, 30.0, 16.0, 14.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0357666015625, -0.03439664840698242, -0.033026695251464844, -0.031656742095947266, -0.030286788940429688, -0.02891683578491211, -0.02754688262939453, -0.026176929473876953, -0.024806976318359375, -0.023437023162841797, -0.02206707000732422, -0.02069711685180664, -0.019327163696289062, -0.017957210540771484, -0.016587257385253906, -0.015217304229736328, -0.01384735107421875, -0.012477397918701172, -0.011107444763183594, -0.009737491607666016, -0.008367538452148438, -0.006997585296630859, -0.005627632141113281, -0.004257678985595703, -0.002887725830078125, -0.0015177726745605469, -0.00014781951904296875, 0.0012221336364746094, 0.0025920867919921875, 0.003962039947509766, 0.005331993103027344, 0.006701946258544922, 0.0080718994140625, 0.009441852569580078, 0.010811805725097656, 0.012181758880615234, 0.013551712036132812, 0.01492166519165039, 0.01629161834716797, 0.017661571502685547, 0.019031524658203125, 0.020401477813720703, 0.02177143096923828, 0.02314138412475586, 0.024511337280273438, 0.025881290435791016, 0.027251243591308594, 0.028621196746826172, 0.02999114990234375, 0.03136110305786133, 0.032731056213378906, 0.034101009368896484, 0.03547096252441406, 0.03684091567993164, 0.03821086883544922, 0.0395808219909668, 0.040950775146484375, 0.04232072830200195, 0.04369068145751953, 0.04506063461303711, 0.04643058776855469, 0.047800540924072266, 0.049170494079589844, 0.05054044723510742, 0.051910400390625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 8.0, 14.0, 17.0, 19.0, 22.0, 35.0, 57.0, 49.0, 91.0, 74.0, 92.0, 82.0, 89.0, 71.0, 75.0, 63.0, 44.0, 31.0, 20.0, 11.0, 12.0, 8.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208587646484375, -0.020325183868408203, -0.019791603088378906, -0.01925802230834961, -0.018724441528320312, -0.018190860748291016, -0.01765727996826172, -0.017123699188232422, -0.016590118408203125, -0.016056537628173828, -0.015522956848144531, -0.014989376068115234, -0.014455795288085938, -0.01392221450805664, -0.013388633728027344, -0.012855052947998047, -0.01232147216796875, -0.011787891387939453, -0.011254310607910156, -0.01072072982788086, -0.010187149047851562, -0.009653568267822266, -0.009119987487792969, -0.008586406707763672, -0.008052825927734375, -0.007519245147705078, -0.006985664367675781, -0.006452083587646484, -0.0059185028076171875, -0.005384922027587891, -0.004851341247558594, -0.004317760467529297, -0.0037841796875, -0.003250598907470703, -0.0027170181274414062, -0.0021834373474121094, -0.0016498565673828125, -0.0011162757873535156, -0.0005826950073242188, -4.9114227294921875e-05, 0.000484466552734375, 0.0010180473327636719, 0.0015516281127929688, 0.0020852088928222656, 0.0026187896728515625, 0.0031523704528808594, 0.0036859512329101562, 0.004219532012939453, 0.00475311279296875, 0.005286693572998047, 0.005820274353027344, 0.006353855133056641, 0.0068874359130859375, 0.007421016693115234, 0.007954597473144531, 0.008488178253173828, 0.009021759033203125, 0.009555339813232422, 0.010088920593261719, 0.010622501373291016, 0.011156082153320312, 0.01168966293334961, 0.012223243713378906, 0.012756824493408203, 0.0132904052734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 32.0, 31.0, 37.0, 51.0, 63.0, 80.0, 140.0, 220.0, 366.0, 753.0, 1737.0, 4649.0, 15486.0, 64106.0, 281224.0, 471811.0, 157409.0, 35269.0, 9356.0, 3078.0, 1145.0, 527.0, 290.0, 186.0, 115.0, 87.0, 59.0, 54.0, 42.0, 20.0, 11.0, 25.0, 13.0, 8.0, 7.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0274505615234375, -0.02660059928894043, -0.02575063705444336, -0.02490067481994629, -0.02405071258544922, -0.02320075035095215, -0.022350788116455078, -0.021500825881958008, -0.020650863647460938, -0.019800901412963867, -0.018950939178466797, -0.018100976943969727, -0.017251014709472656, -0.016401052474975586, -0.015551090240478516, -0.014701128005981445, -0.013851165771484375, -0.013001203536987305, -0.012151241302490234, -0.011301279067993164, -0.010451316833496094, -0.009601354598999023, -0.008751392364501953, -0.007901430130004883, -0.0070514678955078125, -0.006201505661010742, -0.005351543426513672, -0.0045015811920166016, -0.0036516189575195312, -0.002801656723022461, -0.0019516944885253906, -0.0011017322540283203, -0.00025177001953125, 0.0005981922149658203, 0.0014481544494628906, 0.002298116683959961, 0.0031480789184570312, 0.0039980411529541016, 0.004848003387451172, 0.005697965621948242, 0.0065479278564453125, 0.007397890090942383, 0.008247852325439453, 0.009097814559936523, 0.009947776794433594, 0.010797739028930664, 0.011647701263427734, 0.012497663497924805, 0.013347625732421875, 0.014197587966918945, 0.015047550201416016, 0.015897512435913086, 0.016747474670410156, 0.017597436904907227, 0.018447399139404297, 0.019297361373901367, 0.020147323608398438, 0.020997285842895508, 0.021847248077392578, 0.02269721031188965, 0.02354717254638672, 0.02439713478088379, 0.02524709701538086, 0.02609705924987793, 0.026947021484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 8.0, 9.0, 13.0, 12.0, 11.0, 23.0, 25.0, 9.0, 27.0, 24.0, 19.0, 31.0, 29.0, 24.0, 38.0, 36.0, 43.0, 45.0, 43.0, 41.0, 47.0, 48.0, 28.0, 39.0, 36.0, 33.0, 25.0, 30.0, 24.0, 28.0, 23.0, 20.0, 16.0, 12.0, 14.0, 12.0, 7.0, 9.0, 5.0, 4.0, 4.0, 7.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.027587890625, -0.026635169982910156, -0.025682449340820312, -0.02472972869873047, -0.023777008056640625, -0.02282428741455078, -0.021871566772460938, -0.020918846130371094, -0.01996612548828125, -0.019013404846191406, -0.018060684204101562, -0.01710796356201172, -0.016155242919921875, -0.015202522277832031, -0.014249801635742188, -0.013297080993652344, -0.0123443603515625, -0.011391639709472656, -0.010438919067382812, -0.009486198425292969, -0.008533477783203125, -0.007580757141113281, -0.0066280364990234375, -0.005675315856933594, -0.00472259521484375, -0.0037698745727539062, -0.0028171539306640625, -0.0018644332885742188, -0.000911712646484375, 4.100799560546875e-05, 0.0009937286376953125, 0.0019464492797851562, 0.002899169921875, 0.0038518905639648438, 0.0048046112060546875, 0.005757331848144531, 0.006710052490234375, 0.007662773132324219, 0.008615493774414062, 0.009568214416503906, 0.01052093505859375, 0.011473655700683594, 0.012426376342773438, 0.013379096984863281, 0.014331817626953125, 0.015284538269042969, 0.016237258911132812, 0.017189979553222656, 0.0181427001953125, 0.019095420837402344, 0.020048141479492188, 0.02100086212158203, 0.021953582763671875, 0.02290630340576172, 0.023859024047851562, 0.024811744689941406, 0.02576446533203125, 0.026717185974121094, 0.027669906616210938, 0.02862262725830078, 0.029575347900390625, 0.03052806854248047, 0.03148078918457031, 0.032433509826660156, 0.03338623046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 9.0, 10.0, 17.0, 15.0, 34.0, 58.0, 79.0, 145.0, 226.0, 369.0, 793.0, 1712.0, 4839.0, 19252.0, 131142.0, 572529.0, 268290.0, 36875.0, 7437.0, 2441.0, 1036.0, 476.0, 303.0, 164.0, 101.0, 58.0, 38.0, 26.0, 14.0, 10.0, 11.0, 7.0, 7.0, 4.0, 7.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01129150390625, -0.010911107063293457, -0.010530710220336914, -0.010150313377380371, -0.009769916534423828, -0.009389519691467285, -0.009009122848510742, -0.0086287260055542, -0.008248329162597656, -0.007867932319641113, -0.00748753547668457, -0.007107138633728027, -0.006726741790771484, -0.006346344947814941, -0.0059659481048583984, -0.0055855512619018555, -0.0052051544189453125, -0.0048247575759887695, -0.0044443607330322266, -0.004063963890075684, -0.0036835670471191406, -0.0033031702041625977, -0.0029227733612060547, -0.0025423765182495117, -0.0021619796752929688, -0.0017815828323364258, -0.0014011859893798828, -0.0010207891464233398, -0.0006403923034667969, -0.0002599954605102539, 0.00012040138244628906, 0.000500798225402832, 0.000881195068359375, 0.001261591911315918, 0.001641988754272461, 0.002022385597229004, 0.002402782440185547, 0.00278317928314209, 0.003163576126098633, 0.0035439729690551758, 0.003924369812011719, 0.004304766654968262, 0.004685163497924805, 0.005065560340881348, 0.005445957183837891, 0.005826354026794434, 0.0062067508697509766, 0.0065871477127075195, 0.0069675445556640625, 0.0073479413986206055, 0.0077283382415771484, 0.008108735084533691, 0.008489131927490234, 0.008869528770446777, 0.00924992561340332, 0.009630322456359863, 0.010010719299316406, 0.01039111614227295, 0.010771512985229492, 0.011151909828186035, 0.011532306671142578, 0.011912703514099121, 0.012293100357055664, 0.012673497200012207, 0.01305389404296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 14.0, 25.0, 28.0, 40.0, 61.0, 90.0, 159.0, 166.0, 126.0, 90.0, 63.0, 45.0, 34.0, 18.0, 19.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00015103816986083984, -0.00014770496636629105, -0.00014437176287174225, -0.00014103855937719345, -0.00013770535588264465, -0.00013437215238809586, -0.00013103894889354706, -0.00012770574539899826, -0.00012437254190444946, -0.00012103933840990067, -0.00011770613491535187, -0.00011437293142080307, -0.00011103972792625427, -0.00010770652443170547, -0.00010437332093715668, -0.00010104011744260788, -9.770691394805908e-05, -9.437371045351028e-05, -9.104050695896149e-05, -8.770730346441269e-05, -8.437409996986389e-05, -8.10408964753151e-05, -7.77076929807663e-05, -7.43744894862175e-05, -7.10412859916687e-05, -6.77080824971199e-05, -6.43748790025711e-05, -6.104167550802231e-05, -5.770847201347351e-05, -5.437526851892471e-05, -5.1042065024375916e-05, -4.770886152982712e-05, -4.437565803527832e-05, -4.104245454072952e-05, -3.7709251046180725e-05, -3.437604755163193e-05, -3.104284405708313e-05, -2.7709640562534332e-05, -2.4376437067985535e-05, -2.1043233573436737e-05, -1.771003007888794e-05, -1.4376826584339142e-05, -1.1043623089790344e-05, -7.710419595241547e-06, -4.377216100692749e-06, -1.0440126061439514e-06, 2.289190888404846e-06, 5.622394382953644e-06, 8.955597877502441e-06, 1.2288801372051239e-05, 1.5622004866600037e-05, 1.8955208361148834e-05, 2.2288411855697632e-05, 2.562161535024643e-05, 2.8954818844795227e-05, 3.2288022339344025e-05, 3.562122583389282e-05, 3.895442932844162e-05, 4.228763282299042e-05, 4.5620836317539215e-05, 4.895403981208801e-05, 5.228724330663681e-05, 5.562044680118561e-05, 5.8953650295734406e-05, 6.22868537902832e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 15.0, 6.0, 17.0, 19.0, 35.0, 59.0, 133.0, 241.0, 524.0, 1393.0, 5384.0, 52852.0, 640553.0, 322552.0, 19947.0, 3098.0, 938.0, 386.0, 188.0, 92.0, 55.0, 23.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0232086181640625, -0.022653579711914062, -0.022098541259765625, -0.021543502807617188, -0.02098846435546875, -0.020433425903320312, -0.019878387451171875, -0.019323348999023438, -0.018768310546875, -0.018213272094726562, -0.017658233642578125, -0.017103195190429688, -0.01654815673828125, -0.015993118286132812, -0.015438079833984375, -0.014883041381835938, -0.0143280029296875, -0.013772964477539062, -0.013217926025390625, -0.012662887573242188, -0.01210784912109375, -0.011552810668945312, -0.010997772216796875, -0.010442733764648438, -0.0098876953125, -0.009332656860351562, -0.008777618408203125, -0.008222579956054688, -0.00766754150390625, -0.0071125030517578125, -0.006557464599609375, -0.0060024261474609375, -0.0054473876953125, -0.0048923492431640625, -0.004337310791015625, -0.0037822723388671875, -0.00322723388671875, -0.0026721954345703125, -0.002117156982421875, -0.0015621185302734375, -0.001007080078125, -0.0004520416259765625, 0.000102996826171875, 0.0006580352783203125, 0.00121307373046875, 0.0017681121826171875, 0.002323150634765625, 0.0028781890869140625, 0.0034332275390625, 0.0039882659912109375, 0.004543304443359375, 0.0050983428955078125, 0.00565338134765625, 0.0062084197998046875, 0.006763458251953125, 0.0073184967041015625, 0.00787353515625, 0.008428573608398438, 0.008983612060546875, 0.009538650512695312, 0.01009368896484375, 0.010648727416992188, 0.011203765869140625, 0.011758804321289062, 0.0123138427734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 8.0, 8.0, 17.0, 20.0, 39.0, 46.0, 54.0, 77.0, 70.0, 86.0, 102.0, 72.0, 82.0, 72.0, 65.0, 55.0, 36.0, 20.0, 31.0, 16.0, 8.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0160369873046875, -0.015634894371032715, -0.01523280143737793, -0.014830708503723145, -0.01442861557006836, -0.014026522636413574, -0.013624429702758789, -0.013222336769104004, -0.012820243835449219, -0.012418150901794434, -0.012016057968139648, -0.011613965034484863, -0.011211872100830078, -0.010809779167175293, -0.010407686233520508, -0.010005593299865723, -0.009603500366210938, -0.009201407432556152, -0.008799314498901367, -0.008397221565246582, -0.007995128631591797, -0.007593035697937012, -0.0071909427642822266, -0.006788849830627441, -0.006386756896972656, -0.005984663963317871, -0.005582571029663086, -0.005180478096008301, -0.004778385162353516, -0.0043762922286987305, -0.003974199295043945, -0.00357210636138916, -0.003170013427734375, -0.00276792049407959, -0.0023658275604248047, -0.0019637346267700195, -0.0015616416931152344, -0.0011595487594604492, -0.0007574558258056641, -0.0003553628921508789, 4.673004150390625e-05, 0.0004488229751586914, 0.0008509159088134766, 0.0012530088424682617, 0.0016551017761230469, 0.002057194709777832, 0.002459287643432617, 0.0028613805770874023, 0.0032634735107421875, 0.0036655664443969727, 0.004067659378051758, 0.004469752311706543, 0.004871845245361328, 0.005273938179016113, 0.0056760311126708984, 0.006078124046325684, 0.006480216979980469, 0.006882309913635254, 0.007284402847290039, 0.007686495780944824, 0.00808858871459961, 0.008490681648254395, 0.00889277458190918, 0.009294867515563965, 0.00969696044921875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 36.0, 220.0, 437.0, 232.0, 59.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7505373358726501, -0.7315293550491333, -0.7125213742256165, -0.6935133934020996, -0.6745054125785828, -0.6554974317550659, -0.6364894509315491, -0.6174814701080322, -0.5984734892845154, -0.5794655084609985, -0.5604575276374817, -0.5414495468139648, -0.522441565990448, -0.5034335851669312, -0.4844256043434143, -0.46541762351989746, -0.4464096426963806, -0.42740166187286377, -0.4083936810493469, -0.3893857002258301, -0.37037771940231323, -0.3513697385787964, -0.33236175775527954, -0.3133537769317627, -0.29434579610824585, -0.275337815284729, -0.25632983446121216, -0.2373218536376953, -0.21831387281417847, -0.19930589199066162, -0.18029791116714478, -0.16128993034362793, -0.14228200912475586, -0.12327402830123901, -0.10426604747772217, -0.08525806665420532, -0.06625008583068848, -0.04724210500717163, -0.028234124183654785, -0.00922614336013794, 0.009781837463378906, 0.028789818286895752, 0.0477977991104126, 0.06680577993392944, 0.08581376075744629, 0.10482174158096313, 0.12382972240447998, 0.14283770322799683, 0.16184568405151367, 0.18085366487503052, 0.19986164569854736, 0.2188696265220642, 0.23787760734558105, 0.2568855881690979, 0.27589356899261475, 0.2949015498161316, 0.31390953063964844, 0.3329175114631653, 0.35192549228668213, 0.370933473110199, 0.3899414539337158, 0.40894943475723267, 0.4279574155807495, 0.44696539640426636, 0.4659733772277832]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 3.0, 8.0, 14.0, 16.0, 6.0, 23.0, 10.0, 23.0, 18.0, 33.0, 35.0, 45.0, 35.0, 24.0, 38.0, 32.0, 43.0, 46.0, 45.0, 41.0, 38.0, 53.0, 42.0, 38.0, 34.0, 30.0, 23.0, 20.0, 24.0, 30.0, 18.0, 18.0, 6.0, 13.0, 17.0, 8.0, 2.0, 12.0, 5.0, 2.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15470582246780396, -0.14950239658355713, -0.1442989706993103, -0.13909555971622467, -0.13389213383197784, -0.12868870794773102, -0.12348528206348419, -0.11828185617923737, -0.11307843774557114, -0.10787501186132431, -0.10267159342765808, -0.09746816754341125, -0.09226474165916443, -0.0870613232254982, -0.08185789734125137, -0.07665447890758514, -0.07145105302333832, -0.06624762713909149, -0.06104420870542526, -0.055840782821178436, -0.05063736066222191, -0.04543393850326538, -0.040230512619018555, -0.03502709046006203, -0.0298236683011055, -0.02462024614214897, -0.019416822120547295, -0.014213399030268192, -0.00900997593998909, -0.0038065537810325623, 0.0013968702405691147, 0.006600294262170792, 0.01180371642112732, 0.017007138580083847, 0.022210562601685524, 0.0274139866232872, 0.03261740878224373, 0.037820830941200256, 0.04302425682544708, 0.04822767898440361, 0.05343110114336014, 0.058634523302316666, 0.0638379454612732, 0.06904137134552002, 0.07424479722976685, 0.07944821566343307, 0.0846516415476799, 0.08985505998134613, 0.09505848586559296, 0.10026191174983978, 0.10546533018350601, 0.11066875606775284, 0.11587217450141907, 0.1210756003856659, 0.12627902626991272, 0.13148245215415955, 0.13668587803840637, 0.1418893039226532, 0.14709272980690002, 0.15229614078998566, 0.15749956667423248, 0.1627029925584793, 0.16790641844272614, 0.17310984432697296, 0.1783132553100586]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 10.0, 23.0, 49.0, 171.0, 615.0, 5855.0, 3993125.0, 191412.0, 2594.0, 332.0, 71.0, 19.0, 11.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06075000762939453, -0.05515480041503906, -0.049559593200683594, -0.043964385986328125, -0.038369178771972656, -0.03277397155761719, -0.02717876434326172, -0.02158355712890625, -0.01598834991455078, -0.010393142700195312, -0.004797935485839844, 0.000797271728515625, 0.006392478942871094, 0.011987686157226562, 0.01758289337158203, 0.0231781005859375, 0.02877330780029297, 0.03436851501464844, 0.039963722229003906, 0.045558929443359375, 0.051154136657714844, 0.05674934387207031, 0.06234455108642578, 0.06793975830078125, 0.07353496551513672, 0.07913017272949219, 0.08472537994384766, 0.09032058715820312, 0.0959157943725586, 0.10151100158691406, 0.10710620880126953, 0.112701416015625, 0.11829662322998047, 0.12389183044433594, 0.1294870376586914, 0.13508224487304688, 0.14067745208740234, 0.1462726593017578, 0.15186786651611328, 0.15746307373046875, 0.16305828094482422, 0.1686534881591797, 0.17424869537353516, 0.17984390258789062, 0.1854391098022461, 0.19103431701660156, 0.19662952423095703, 0.2022247314453125, 0.20781993865966797, 0.21341514587402344, 0.2190103530883789, 0.22460556030273438, 0.23020076751708984, 0.2357959747314453, 0.24139118194580078, 0.24698638916015625, 0.2525815963745117, 0.2581768035888672, 0.26377201080322266, 0.2693672180175781, 0.2749624252319336, 0.28055763244628906, 0.28615283966064453, 0.291748046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 8.0, 13.0, 27.0, 27.0, 40.0, 49.0, 57.0, 72.0, 77.0, 82.0, 96.0, 82.0, 64.0, 63.0, 56.0, 41.0, 46.0, 30.0, 17.0, 9.0, 14.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0197601318359375, -0.019243836402893066, -0.018727540969848633, -0.0182112455368042, -0.017694950103759766, -0.017178654670715332, -0.0166623592376709, -0.016146063804626465, -0.01562976837158203, -0.015113472938537598, -0.014597177505493164, -0.01408088207244873, -0.013564586639404297, -0.013048291206359863, -0.01253199577331543, -0.012015700340270996, -0.011499404907226562, -0.010983109474182129, -0.010466814041137695, -0.009950518608093262, -0.009434223175048828, -0.008917927742004395, -0.008401632308959961, -0.007885336875915527, -0.007369041442871094, -0.00685274600982666, -0.0063364505767822266, -0.005820155143737793, -0.005303859710693359, -0.004787564277648926, -0.004271268844604492, -0.0037549734115600586, -0.003238677978515625, -0.0027223825454711914, -0.002206087112426758, -0.0016897916793823242, -0.0011734962463378906, -0.000657200813293457, -0.00014090538024902344, 0.00037539005279541016, 0.0008916854858398438, 0.0014079809188842773, 0.001924276351928711, 0.0024405717849731445, 0.002956867218017578, 0.0034731626510620117, 0.003989458084106445, 0.004505753517150879, 0.0050220489501953125, 0.005538344383239746, 0.00605463981628418, 0.006570935249328613, 0.007087230682373047, 0.0076035261154174805, 0.008119821548461914, 0.008636116981506348, 0.009152412414550781, 0.009668707847595215, 0.010185003280639648, 0.010701298713684082, 0.011217594146728516, 0.01173388957977295, 0.012250185012817383, 0.012766480445861816, 0.01328277587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 15.0, 30.0, 41.0, 76.0, 153.0, 312.0, 729.0, 1929.0, 7623.0, 55141.0, 3460514.0, 633392.0, 26618.0, 4969.0, 1457.0, 591.0, 271.0, 163.0, 90.0, 53.0, 38.0, 9.0, 11.0, 6.0, 3.0, 12.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03857421875, -0.03718852996826172, -0.03580284118652344, -0.034417152404785156, -0.033031463623046875, -0.031645774841308594, -0.030260086059570312, -0.02887439727783203, -0.02748870849609375, -0.02610301971435547, -0.024717330932617188, -0.023331642150878906, -0.021945953369140625, -0.020560264587402344, -0.019174575805664062, -0.01778888702392578, -0.0164031982421875, -0.015017509460449219, -0.013631820678710938, -0.012246131896972656, -0.010860443115234375, -0.009474754333496094, -0.008089065551757812, -0.006703376770019531, -0.00531768798828125, -0.003931999206542969, -0.0025463104248046875, -0.0011606216430664062, 0.000225067138671875, 0.0016107559204101562, 0.0029964447021484375, 0.004382133483886719, 0.005767822265625, 0.007153511047363281, 0.008539199829101562, 0.009924888610839844, 0.011310577392578125, 0.012696266174316406, 0.014081954956054688, 0.015467643737792969, 0.01685333251953125, 0.01823902130126953, 0.019624710083007812, 0.021010398864746094, 0.022396087646484375, 0.023781776428222656, 0.025167465209960938, 0.02655315399169922, 0.0279388427734375, 0.02932453155517578, 0.030710220336914062, 0.032095909118652344, 0.033481597900390625, 0.034867286682128906, 0.03625297546386719, 0.03763866424560547, 0.03902435302734375, 0.04041004180908203, 0.04179573059082031, 0.043181419372558594, 0.044567108154296875, 0.045952796936035156, 0.04733848571777344, 0.04872417449951172, 0.05010986328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 4.0, 8.0, 14.0, 36.0, 49.0, 96.0, 130.0, 394.0, 1552.0, 1142.0, 311.0, 129.0, 66.0, 46.0, 26.0, 26.0, 6.0, 7.0, 7.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174102783203125, -0.016785383224487305, -0.01616048812866211, -0.015535593032836914, -0.014910697937011719, -0.014285802841186523, -0.013660907745361328, -0.013036012649536133, -0.012411117553710938, -0.011786222457885742, -0.011161327362060547, -0.010536432266235352, -0.009911537170410156, -0.009286642074584961, -0.008661746978759766, -0.00803685188293457, -0.007411956787109375, -0.00678706169128418, -0.006162166595458984, -0.005537271499633789, -0.004912376403808594, -0.0042874813079833984, -0.003662586212158203, -0.003037691116333008, -0.0024127960205078125, -0.0017879009246826172, -0.0011630058288574219, -0.0005381107330322266, 8.678436279296875e-05, 0.0007116794586181641, 0.0013365745544433594, 0.0019614696502685547, 0.00258636474609375, 0.0032112598419189453, 0.0038361549377441406, 0.004461050033569336, 0.005085945129394531, 0.0057108402252197266, 0.006335735321044922, 0.006960630416870117, 0.0075855255126953125, 0.008210420608520508, 0.008835315704345703, 0.009460210800170898, 0.010085105895996094, 0.010710000991821289, 0.011334896087646484, 0.01195979118347168, 0.012584686279296875, 0.01320958137512207, 0.013834476470947266, 0.014459371566772461, 0.015084266662597656, 0.01570916175842285, 0.016334056854248047, 0.016958951950073242, 0.017583847045898438, 0.018208742141723633, 0.018833637237548828, 0.019458532333374023, 0.02008342742919922, 0.020708322525024414, 0.02133321762084961, 0.021958112716674805, 0.0225830078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 39.0, 159.0, 327.0, 270.0, 132.0, 40.0, 17.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16127228736877441, -0.15617221593856812, -0.15107214450836182, -0.14597207307815552, -0.14087198674678802, -0.13577191531658173, -0.13067184388637543, -0.12557177245616913, -0.12047170102596283, -0.11537162959575653, -0.11027155071496964, -0.10517147928476334, -0.10007140785455704, -0.09497132897377014, -0.08987125754356384, -0.08477118611335754, -0.07967110723257065, -0.07457103580236435, -0.06947095692157745, -0.06437088549137115, -0.059270814061164856, -0.05417073890566826, -0.04907066375017166, -0.04397059231996536, -0.038870517164468765, -0.03377044200897217, -0.02867037057876587, -0.023570295423269272, -0.018470222130417824, -0.013370148837566376, -0.008270073682069778, -0.0031700022518634796, 0.0019300729036331177, 0.007030146662145853, 0.012130220420658588, 0.01723029464483261, 0.02233036793768406, 0.027430441230535507, 0.032530516386032104, 0.0376305878162384, 0.042730662971735, 0.0478307381272316, 0.0529308095574379, 0.058030884712934494, 0.06313095986843109, 0.06823103129863739, 0.07333110272884369, 0.07843117415904999, 0.08353125303983688, 0.08863132447004318, 0.09373140335083008, 0.09883147478103638, 0.10393154621124268, 0.10903161764144897, 0.11413169652223587, 0.11923176795244217, 0.12433184683322906, 0.12943191826343536, 0.13453198969364166, 0.13963207602500916, 0.14473214745521545, 0.14983221888542175, 0.15493229031562805, 0.16003236174583435, 0.16513243317604065]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 2.0, 7.0, 9.0, 10.0, 19.0, 24.0, 26.0, 37.0, 35.0, 56.0, 55.0, 57.0, 65.0, 73.0, 62.0, 60.0, 69.0, 52.0, 50.0, 50.0, 48.0, 37.0, 24.0, 19.0, 22.0, 9.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05652731657028198, -0.05409948527812958, -0.05167165398597717, -0.049243826419115067, -0.04681599512696266, -0.04438816383481026, -0.04196033626794815, -0.039532504975795746, -0.03710467368364334, -0.034676842391490936, -0.03224901109933853, -0.029821183532476425, -0.02739335224032402, -0.024965520948171616, -0.02253769151866436, -0.020109862089157104, -0.0176820307970047, -0.01525420043617487, -0.01282637007534504, -0.01039853971451521, -0.007970709353685379, -0.005542878992855549, -0.0031150486320257187, -0.0006872192025184631, 0.0017406120896339417, 0.004168442450463772, 0.006596272811293602, 0.009024103172123432, 0.011451933532953262, 0.013879763893783092, 0.016307594254612923, 0.018735423684120178, 0.021163254976272583, 0.023591086268424988, 0.026018915697932243, 0.0284467451274395, 0.030874576419591904, 0.03330240771174431, 0.035730235278606415, 0.03815806657075882, 0.040585897862911224, 0.04301372915506363, 0.045441560447216034, 0.04786938801407814, 0.050297219306230545, 0.05272505059838295, 0.055152878165245056, 0.05758070945739746, 0.060008540749549866, 0.06243637204170227, 0.06486420333385468, 0.06729203462600708, 0.06971986591815948, 0.07214768975973129, 0.0745755210518837, 0.0770033523440361, 0.07943118363618851, 0.08185901492834091, 0.08428684622049332, 0.08671467751264572, 0.08914250135421753, 0.09157033264636993, 0.09399816393852234, 0.09642599523067474, 0.09885382652282715]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 5.0, 11.0, 4.0, 19.0, 21.0, 33.0, 35.0, 79.0, 109.0, 255.0, 420.0, 931.0, 2295.0, 7202.0, 37997.0, 432017.0, 509301.0, 45185.0, 8123.0, 2485.0, 989.0, 446.0, 236.0, 135.0, 75.0, 51.0, 31.0, 17.0, 12.0, 7.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05389404296875, -0.05215787887573242, -0.050421714782714844, -0.048685550689697266, -0.04694938659667969, -0.04521322250366211, -0.04347705841064453, -0.04174089431762695, -0.040004730224609375, -0.0382685661315918, -0.03653240203857422, -0.03479623794555664, -0.03306007385253906, -0.031323909759521484, -0.029587745666503906, -0.027851581573486328, -0.02611541748046875, -0.024379253387451172, -0.022643089294433594, -0.020906925201416016, -0.019170761108398438, -0.01743459701538086, -0.01569843292236328, -0.013962268829345703, -0.012226104736328125, -0.010489940643310547, -0.008753776550292969, -0.007017612457275391, -0.0052814483642578125, -0.0035452842712402344, -0.0018091201782226562, -7.295608520507812e-05, 0.0016632080078125, 0.003399372100830078, 0.005135536193847656, 0.006871700286865234, 0.008607864379882812, 0.01034402847290039, 0.012080192565917969, 0.013816356658935547, 0.015552520751953125, 0.017288684844970703, 0.01902484893798828, 0.02076101303100586, 0.022497177124023438, 0.024233341217041016, 0.025969505310058594, 0.027705669403076172, 0.02944183349609375, 0.031177997589111328, 0.032914161682128906, 0.034650325775146484, 0.03638648986816406, 0.03812265396118164, 0.03985881805419922, 0.0415949821472168, 0.043331146240234375, 0.04506731033325195, 0.04680347442626953, 0.04853963851928711, 0.05027580261230469, 0.052011966705322266, 0.053748130798339844, 0.05548429489135742, 0.057220458984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 11.0, 18.0, 19.0, 29.0, 44.0, 56.0, 61.0, 60.0, 66.0, 96.0, 91.0, 75.0, 61.0, 66.0, 47.0, 49.0, 40.0, 31.0, 13.0, 13.0, 15.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018280029296875, -0.017775416374206543, -0.017270803451538086, -0.01676619052886963, -0.016261577606201172, -0.015756964683532715, -0.015252351760864258, -0.0147477388381958, -0.014243125915527344, -0.013738512992858887, -0.01323390007019043, -0.012729287147521973, -0.012224674224853516, -0.011720061302185059, -0.011215448379516602, -0.010710835456848145, -0.010206222534179688, -0.00970160961151123, -0.009196996688842773, -0.008692383766174316, -0.00818777084350586, -0.007683157920837402, -0.007178544998168945, -0.006673932075500488, -0.006169319152832031, -0.005664706230163574, -0.005160093307495117, -0.00465548038482666, -0.004150867462158203, -0.003646254539489746, -0.003141641616821289, -0.002637028694152832, -0.002132415771484375, -0.001627802848815918, -0.001123189926147461, -0.0006185770034790039, -0.00011396408081054688, 0.00039064884185791016, 0.0008952617645263672, 0.0013998746871948242, 0.0019044876098632812, 0.0024091005325317383, 0.0029137134552001953, 0.0034183263778686523, 0.003922939300537109, 0.004427552223205566, 0.0049321651458740234, 0.0054367780685424805, 0.0059413909912109375, 0.0064460039138793945, 0.0069506168365478516, 0.007455229759216309, 0.007959842681884766, 0.008464455604553223, 0.00896906852722168, 0.009473681449890137, 0.009978294372558594, 0.01048290729522705, 0.010987520217895508, 0.011492133140563965, 0.011996746063232422, 0.012501358985900879, 0.013005971908569336, 0.013510584831237793, 0.01401519775390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 7.0, 8.0, 19.0, 24.0, 28.0, 33.0, 35.0, 64.0, 83.0, 108.0, 173.0, 339.0, 594.0, 1647.0, 5798.0, 28495.0, 191882.0, 594827.0, 187896.0, 27579.0, 5670.0, 1615.0, 599.0, 320.0, 185.0, 127.0, 96.0, 58.0, 46.0, 40.0, 34.0, 24.0, 13.0, 16.0, 8.0, 15.0, 4.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03326416015625, -0.03224039077758789, -0.03121662139892578, -0.030192852020263672, -0.029169082641601562, -0.028145313262939453, -0.027121543884277344, -0.026097774505615234, -0.025074005126953125, -0.024050235748291016, -0.023026466369628906, -0.022002696990966797, -0.020978927612304688, -0.019955158233642578, -0.01893138885498047, -0.01790761947631836, -0.01688385009765625, -0.01586008071899414, -0.014836311340332031, -0.013812541961669922, -0.012788772583007812, -0.011765003204345703, -0.010741233825683594, -0.009717464447021484, -0.008693695068359375, -0.007669925689697266, -0.006646156311035156, -0.005622386932373047, -0.0045986175537109375, -0.003574848175048828, -0.0025510787963867188, -0.0015273094177246094, -0.0005035400390625, 0.0005202293395996094, 0.0015439987182617188, 0.002567768096923828, 0.0035915374755859375, 0.004615306854248047, 0.005639076232910156, 0.006662845611572266, 0.007686614990234375, 0.008710384368896484, 0.009734153747558594, 0.010757923126220703, 0.011781692504882812, 0.012805461883544922, 0.013829231262207031, 0.01485300064086914, 0.01587677001953125, 0.01690053939819336, 0.01792430877685547, 0.018948078155517578, 0.019971847534179688, 0.020995616912841797, 0.022019386291503906, 0.023043155670166016, 0.024066925048828125, 0.025090694427490234, 0.026114463806152344, 0.027138233184814453, 0.028162002563476562, 0.029185771942138672, 0.03020954132080078, 0.03123331069946289, 0.032257080078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 8.0, 9.0, 11.0, 9.0, 10.0, 11.0, 16.0, 18.0, 25.0, 29.0, 37.0, 57.0, 38.0, 39.0, 46.0, 57.0, 56.0, 62.0, 45.0, 45.0, 37.0, 63.0, 49.0, 45.0, 29.0, 26.0, 27.0, 19.0, 14.0, 14.0, 7.0, 10.0, 10.0, 10.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03741455078125, -0.036124229431152344, -0.03483390808105469, -0.03354358673095703, -0.032253265380859375, -0.03096294403076172, -0.029672622680664062, -0.028382301330566406, -0.02709197998046875, -0.025801658630371094, -0.024511337280273438, -0.02322101593017578, -0.021930694580078125, -0.02064037322998047, -0.019350051879882812, -0.018059730529785156, -0.0167694091796875, -0.015479087829589844, -0.014188766479492188, -0.012898445129394531, -0.011608123779296875, -0.010317802429199219, -0.009027481079101562, -0.007737159729003906, -0.00644683837890625, -0.005156517028808594, -0.0038661956787109375, -0.0025758743286132812, -0.001285552978515625, 4.76837158203125e-06, 0.0012950897216796875, 0.0025854110717773438, 0.003875732421875, 0.005166053771972656, 0.0064563751220703125, 0.007746696472167969, 0.009037017822265625, 0.010327339172363281, 0.011617660522460938, 0.012907981872558594, 0.01419830322265625, 0.015488624572753906, 0.016778945922851562, 0.01806926727294922, 0.019359588623046875, 0.02064990997314453, 0.021940231323242188, 0.023230552673339844, 0.0245208740234375, 0.025811195373535156, 0.027101516723632812, 0.02839183807373047, 0.029682159423828125, 0.03097248077392578, 0.03226280212402344, 0.033553123474121094, 0.03484344482421875, 0.036133766174316406, 0.03742408752441406, 0.03871440887451172, 0.040004730224609375, 0.04129505157470703, 0.04258537292480469, 0.043875694274902344, 0.045166015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 18.0, 54.0, 119.0, 318.0, 1952.0, 913108.0, 131502.0, 1062.0, 245.0, 97.0, 40.0, 16.0, 14.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072265625, -0.06999874114990234, -0.06773185729980469, -0.06546497344970703, -0.06319808959960938, -0.06093120574951172, -0.05866432189941406, -0.056397438049316406, -0.05413055419921875, -0.051863670349121094, -0.04959678649902344, -0.04732990264892578, -0.045063018798828125, -0.04279613494873047, -0.04052925109863281, -0.038262367248535156, -0.0359954833984375, -0.033728599548339844, -0.03146171569824219, -0.02919483184814453, -0.026927947998046875, -0.02466106414794922, -0.022394180297851562, -0.020127296447753906, -0.01786041259765625, -0.015593528747558594, -0.013326644897460938, -0.011059761047363281, -0.008792877197265625, -0.006525993347167969, -0.0042591094970703125, -0.0019922256469726562, 0.000274658203125, 0.0025415420532226562, 0.0048084259033203125, 0.007075309753417969, 0.009342193603515625, 0.011609077453613281, 0.013875961303710938, 0.016142845153808594, 0.01840972900390625, 0.020676612854003906, 0.022943496704101562, 0.02521038055419922, 0.027477264404296875, 0.02974414825439453, 0.03201103210449219, 0.034277915954589844, 0.0365447998046875, 0.038811683654785156, 0.04107856750488281, 0.04334545135498047, 0.045612335205078125, 0.04787921905517578, 0.05014610290527344, 0.052412986755371094, 0.05467987060546875, 0.056946754455566406, 0.05921363830566406, 0.06148052215576172, 0.06374740600585938, 0.06601428985595703, 0.06828117370605469, 0.07054805755615234, 0.07281494140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 24.0, 110.0, 339.0, 381.0, 101.0, 35.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005464553833007812, -0.0005337707698345184, -0.0005210861563682556, -0.0005084015429019928, -0.00049571692943573, -0.00048303231596946716, -0.00047034770250320435, -0.00045766308903694153, -0.0004449784755706787, -0.0004322938621044159, -0.0004196092486381531, -0.00040692463517189026, -0.00039424002170562744, -0.0003815554082393646, -0.0003688707947731018, -0.000356186181306839, -0.00034350156784057617, -0.00033081695437431335, -0.00031813234090805054, -0.0003054477274417877, -0.0002927631139755249, -0.0002800785005092621, -0.00026739388704299927, -0.00025470927357673645, -0.00024202466011047363, -0.00022934004664421082, -0.000216655433177948, -0.00020397081971168518, -0.00019128620624542236, -0.00017860159277915955, -0.00016591697931289673, -0.0001532323658466339, -0.0001405477523803711, -0.00012786313891410828, -0.00011517852544784546, -0.00010249391198158264, -8.980929851531982e-05, -7.712468504905701e-05, -6.444007158279419e-05, -5.175545811653137e-05, -3.9070844650268555e-05, -2.6386231184005737e-05, -1.370161771774292e-05, -1.0170042514801025e-06, 1.1667609214782715e-05, 2.4352222681045532e-05, 3.703683614730835e-05, 4.972144961357117e-05, 6.240606307983398e-05, 7.50906765460968e-05, 8.777529001235962e-05, 0.00010045990347862244, 0.00011314451694488525, 0.00012582913041114807, 0.0001385137438774109, 0.0001511983573436737, 0.00016388297080993652, 0.00017656758427619934, 0.00018925219774246216, 0.00020193681120872498, 0.0002146214246749878, 0.0002273060381412506, 0.00023999065160751343, 0.00025267526507377625, 0.00026535987854003906]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 17.0, 51.0, 113.0, 321.0, 1494.0, 838401.0, 206700.0, 1051.0, 247.0, 88.0, 39.0, 8.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.0980076789855957, -0.0956125259399414, -0.09321737289428711, -0.09082221984863281, -0.08842706680297852, -0.08603191375732422, -0.08363676071166992, -0.08124160766601562, -0.07884645462036133, -0.07645130157470703, -0.07405614852905273, -0.07166099548339844, -0.06926584243774414, -0.06687068939208984, -0.06447553634643555, -0.06208038330078125, -0.05968523025512695, -0.057290077209472656, -0.05489492416381836, -0.05249977111816406, -0.050104618072509766, -0.04770946502685547, -0.04531431198120117, -0.042919158935546875, -0.04052400588989258, -0.03812885284423828, -0.035733699798583984, -0.03333854675292969, -0.03094339370727539, -0.028548240661621094, -0.026153087615966797, -0.0237579345703125, -0.021362781524658203, -0.018967628479003906, -0.01657247543334961, -0.014177322387695312, -0.011782169342041016, -0.009387016296386719, -0.006991863250732422, -0.004596710205078125, -0.002201557159423828, 0.00019359588623046875, 0.0025887489318847656, 0.0049839019775390625, 0.007379055023193359, 0.009774208068847656, 0.012169361114501953, 0.01456451416015625, 0.016959667205810547, 0.019354820251464844, 0.02174997329711914, 0.024145126342773438, 0.026540279388427734, 0.02893543243408203, 0.03133058547973633, 0.033725738525390625, 0.03612089157104492, 0.03851604461669922, 0.040911197662353516, 0.04330635070800781, 0.04570150375366211, 0.048096656799316406, 0.0504918098449707, 0.052886962890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 22.0, 27.0, 117.0, 258.0, 325.0, 162.0, 58.0, 23.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07177734375, -0.07007789611816406, -0.06837844848632812, -0.06667900085449219, -0.06497955322265625, -0.06328010559082031, -0.061580657958984375, -0.05988121032714844, -0.0581817626953125, -0.05648231506347656, -0.054782867431640625, -0.05308341979980469, -0.05138397216796875, -0.04968452453613281, -0.047985076904296875, -0.04628562927246094, -0.044586181640625, -0.04288673400878906, -0.041187286376953125, -0.03948783874511719, -0.03778839111328125, -0.03608894348144531, -0.034389495849609375, -0.03269004821777344, -0.0309906005859375, -0.029291152954101562, -0.027591705322265625, -0.025892257690429688, -0.02419281005859375, -0.022493362426757812, -0.020793914794921875, -0.019094467163085938, -0.01739501953125, -0.015695571899414062, -0.013996124267578125, -0.012296676635742188, -0.01059722900390625, -0.008897781372070312, -0.007198333740234375, -0.0054988861083984375, -0.0037994384765625, -0.0020999908447265625, -0.000400543212890625, 0.0012989044189453125, 0.00299835205078125, 0.0046977996826171875, 0.006397247314453125, 0.008096694946289062, 0.009796142578125, 0.011495590209960938, 0.013195037841796875, 0.014894485473632812, 0.01659393310546875, 0.018293380737304688, 0.019992828369140625, 0.021692276000976562, 0.0233917236328125, 0.025091171264648438, 0.026790618896484375, 0.028490066528320312, 0.03018951416015625, 0.03188896179199219, 0.033588409423828125, 0.03528785705566406, 0.0369873046875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 28.0, 121.0, 345.0, 320.0, 123.0, 40.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5841373205184937, -0.5686408281326294, -0.5531442761421204, -0.5376477837562561, -0.5221512913703918, -0.5066547989845276, -0.49115824699401855, -0.4756617546081543, -0.46016526222229004, -0.4446687400341034, -0.42917224764823914, -0.4136757254600525, -0.39817923307418823, -0.3826827108860016, -0.36718618869781494, -0.3516896963119507, -0.33619317412376404, -0.3206966519355774, -0.30520015954971313, -0.2897036373615265, -0.27420714497566223, -0.2587106227874756, -0.24321411550045013, -0.22771760821342468, -0.21222110092639923, -0.19672459363937378, -0.18122808635234833, -0.16573157906532288, -0.15023505687713623, -0.13473856449127197, -0.11924204230308533, -0.10374553501605988, -0.08824902772903442, -0.07275252044200897, -0.05725600942969322, -0.04175949841737747, -0.02626299113035202, -0.010766483843326569, 0.00473003089427948, 0.02022653818130493, 0.03572304546833038, 0.051219552755355835, 0.06671606004238129, 0.08221257477998734, 0.09770908206701279, 0.11320558935403824, 0.1287021040916443, 0.14419861137866974, 0.1596951186656952, 0.17519162595272064, 0.1906881332397461, 0.20618465542793274, 0.221681147813797, 0.23717767000198364, 0.2526741623878479, 0.26817068457603455, 0.2836672067642212, 0.29916372895240784, 0.3146602213382721, 0.33015674352645874, 0.345653235912323, 0.36114975810050964, 0.3766462802886963, 0.39214277267456055, 0.4076392650604248]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 7.0, 4.0, 7.0, 13.0, 7.0, 13.0, 16.0, 24.0, 20.0, 36.0, 24.0, 28.0, 32.0, 32.0, 34.0, 43.0, 41.0, 33.0, 41.0, 47.0, 45.0, 50.0, 43.0, 45.0, 35.0, 37.0, 31.0, 36.0, 30.0, 19.0, 31.0, 17.0, 15.0, 12.0, 6.0, 12.0, 11.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1760135293006897, -0.17053663730621338, -0.16505974531173706, -0.15958286821842194, -0.15410597622394562, -0.1486290842294693, -0.14315220713615417, -0.13767531514167786, -0.13219842314720154, -0.12672153115272522, -0.1212446466088295, -0.11576776206493378, -0.11029087007045746, -0.10481397807598114, -0.09933709353208542, -0.0938602089881897, -0.08838331699371338, -0.08290642499923706, -0.07742954045534134, -0.07195265591144562, -0.0664757639169693, -0.06099887564778328, -0.05552198737859726, -0.05004509910941124, -0.04456821084022522, -0.0390913225710392, -0.03361443430185318, -0.02813754603266716, -0.02266065776348114, -0.01718376949429512, -0.0117068812251091, -0.0062299929559230804, -0.0007531046867370605, 0.004723783582448959, 0.01020067185163498, 0.015677560120821, 0.02115444839000702, 0.02663133665919304, 0.03210822492837906, 0.03758511319756508, 0.0430620014667511, 0.04853888973593712, 0.05401577800512314, 0.05949266627430916, 0.06496955454349518, 0.0704464465379715, 0.07592333108186722, 0.08140021562576294, 0.08687710762023926, 0.09235399961471558, 0.0978308841586113, 0.10330776870250702, 0.10878466069698334, 0.11426155269145966, 0.11973843723535538, 0.1252153217792511, 0.13069221377372742, 0.13616910576820374, 0.14164599776268005, 0.14712287485599518, 0.1525997668504715, 0.15807665884494781, 0.16355353593826294, 0.16903042793273926, 0.17450731992721558]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 4.0, 6.0, 9.0, 11.0, 8.0, 15.0, 14.0, 26.0, 33.0, 54.0, 60.0, 111.0, 165.0, 326.0, 559.0, 1044.0, 2215.0, 5395.0, 16160.0, 85561.0, 3555786.0, 471026.0, 38110.0, 10104.0, 3857.0, 1706.0, 812.0, 429.0, 230.0, 162.0, 91.0, 74.0, 42.0, 24.0, 14.0, 12.0, 10.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03717041015625, -0.03592252731323242, -0.034674644470214844, -0.033426761627197266, -0.03217887878417969, -0.03093099594116211, -0.02968311309814453, -0.028435230255126953, -0.027187347412109375, -0.025939464569091797, -0.02469158172607422, -0.02344369888305664, -0.022195816040039062, -0.020947933197021484, -0.019700050354003906, -0.018452167510986328, -0.01720428466796875, -0.015956401824951172, -0.014708518981933594, -0.013460636138916016, -0.012212753295898438, -0.01096487045288086, -0.009716987609863281, -0.008469104766845703, -0.007221221923828125, -0.005973339080810547, -0.004725456237792969, -0.0034775733947753906, -0.0022296905517578125, -0.0009818077087402344, 0.00026607513427734375, 0.0015139579772949219, 0.0027618408203125, 0.004009723663330078, 0.005257606506347656, 0.006505489349365234, 0.0077533721923828125, 0.00900125503540039, 0.010249137878417969, 0.011497020721435547, 0.012744903564453125, 0.013992786407470703, 0.015240669250488281, 0.01648855209350586, 0.017736434936523438, 0.018984317779541016, 0.020232200622558594, 0.021480083465576172, 0.02272796630859375, 0.023975849151611328, 0.025223731994628906, 0.026471614837646484, 0.027719497680664062, 0.02896738052368164, 0.03021526336669922, 0.0314631462097168, 0.032711029052734375, 0.03395891189575195, 0.03520679473876953, 0.03645467758178711, 0.03770256042480469, 0.038950443267822266, 0.040198326110839844, 0.04144620895385742, 0.042694091796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 9.0, 10.0, 24.0, 32.0, 36.0, 40.0, 55.0, 67.0, 79.0, 87.0, 73.0, 70.0, 68.0, 74.0, 51.0, 44.0, 50.0, 36.0, 21.0, 19.0, 9.0, 14.0, 4.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0182342529296875, -0.017725110054016113, -0.017215967178344727, -0.01670682430267334, -0.016197681427001953, -0.015688538551330566, -0.01517939567565918, -0.014670252799987793, -0.014161109924316406, -0.01365196704864502, -0.013142824172973633, -0.012633681297302246, -0.01212453842163086, -0.011615395545959473, -0.011106252670288086, -0.0105971097946167, -0.010087966918945312, -0.009578824043273926, -0.009069681167602539, -0.008560538291931152, -0.008051395416259766, -0.007542252540588379, -0.007033109664916992, -0.0065239667892456055, -0.006014823913574219, -0.005505681037902832, -0.004996538162231445, -0.004487395286560059, -0.003978252410888672, -0.003469109535217285, -0.0029599666595458984, -0.0024508237838745117, -0.001941680908203125, -0.0014325380325317383, -0.0009233951568603516, -0.00041425228118896484, 9.489059448242188e-05, 0.0006040334701538086, 0.0011131763458251953, 0.001622319221496582, 0.0021314620971679688, 0.0026406049728393555, 0.003149747848510742, 0.003658890724182129, 0.004168033599853516, 0.004677176475524902, 0.005186319351196289, 0.005695462226867676, 0.0062046051025390625, 0.006713747978210449, 0.007222890853881836, 0.007732033729553223, 0.00824117660522461, 0.008750319480895996, 0.009259462356567383, 0.00976860523223877, 0.010277748107910156, 0.010786890983581543, 0.01129603385925293, 0.011805176734924316, 0.012314319610595703, 0.01282346248626709, 0.013332605361938477, 0.013841748237609863, 0.01435089111328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 10.0, 27.0, 36.0, 65.0, 117.0, 235.0, 465.0, 1171.0, 4005.0, 28043.0, 3802687.0, 341279.0, 11815.0, 2482.0, 923.0, 438.0, 206.0, 130.0, 70.0, 21.0, 22.0, 11.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06158447265625, -0.05964851379394531, -0.057712554931640625, -0.05577659606933594, -0.05384063720703125, -0.05190467834472656, -0.049968719482421875, -0.04803276062011719, -0.0460968017578125, -0.04416084289550781, -0.042224884033203125, -0.04028892517089844, -0.03835296630859375, -0.03641700744628906, -0.034481048583984375, -0.03254508972167969, -0.030609130859375, -0.028673171997070312, -0.026737213134765625, -0.024801254272460938, -0.02286529541015625, -0.020929336547851562, -0.018993377685546875, -0.017057418823242188, -0.0151214599609375, -0.013185501098632812, -0.011249542236328125, -0.009313583374023438, -0.00737762451171875, -0.0054416656494140625, -0.003505706787109375, -0.0015697479248046875, 0.0003662109375, 0.0023021697998046875, 0.004238128662109375, 0.0061740875244140625, 0.00811004638671875, 0.010046005249023438, 0.011981964111328125, 0.013917922973632812, 0.0158538818359375, 0.017789840698242188, 0.019725799560546875, 0.021661758422851562, 0.02359771728515625, 0.025533676147460938, 0.027469635009765625, 0.029405593872070312, 0.031341552734375, 0.03327751159667969, 0.035213470458984375, 0.03714942932128906, 0.03908538818359375, 0.04102134704589844, 0.042957305908203125, 0.04489326477050781, 0.0468292236328125, 0.04876518249511719, 0.050701141357421875, 0.05263710021972656, 0.05457305908203125, 0.05650901794433594, 0.058444976806640625, 0.06038093566894531, 0.06231689453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 7.0, 20.0, 42.0, 117.0, 290.0, 1772.0, 1412.0, 241.0, 80.0, 26.0, 16.0, 15.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179443359375, -0.017195463180541992, -0.016446590423583984, -0.015697717666625977, -0.014948844909667969, -0.014199972152709961, -0.013451099395751953, -0.012702226638793945, -0.011953353881835938, -0.01120448112487793, -0.010455608367919922, -0.009706735610961914, -0.008957862854003906, -0.008208990097045898, -0.007460117340087891, -0.006711244583129883, -0.005962371826171875, -0.005213499069213867, -0.004464626312255859, -0.0037157535552978516, -0.0029668807983398438, -0.002218008041381836, -0.0014691352844238281, -0.0007202625274658203, 2.86102294921875e-05, 0.0007774829864501953, 0.0015263557434082031, 0.002275228500366211, 0.0030241012573242188, 0.0037729740142822266, 0.004521846771240234, 0.005270719528198242, 0.00601959228515625, 0.006768465042114258, 0.007517337799072266, 0.008266210556030273, 0.009015083312988281, 0.009763956069946289, 0.010512828826904297, 0.011261701583862305, 0.012010574340820312, 0.01275944709777832, 0.013508319854736328, 0.014257192611694336, 0.015006065368652344, 0.01575493812561035, 0.01650381088256836, 0.017252683639526367, 0.018001556396484375, 0.018750429153442383, 0.01949930191040039, 0.0202481746673584, 0.020997047424316406, 0.021745920181274414, 0.022494792938232422, 0.02324366569519043, 0.023992538452148438, 0.024741411209106445, 0.025490283966064453, 0.02623915672302246, 0.02698802947998047, 0.027736902236938477, 0.028485774993896484, 0.029234647750854492, 0.0299835205078125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 11.0, 40.0, 132.0, 247.0, 277.0, 179.0, 59.0, 28.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04558504745364189, -0.04158882796764374, -0.03759261220693588, -0.03359639272093773, -0.029600173234939575, -0.02560395374894142, -0.021607736125588417, -0.017611518502235413, -0.013615299016237259, -0.00961908046156168, -0.005622861906886101, -0.0016266433522105217, 0.0023695752024650574, 0.006365794688463211, 0.010362012311816216, 0.01435822993516922, 0.018354449421167374, 0.022350668907165527, 0.026346886530518532, 0.030343104153871536, 0.03433932363986969, 0.038335543125867844, 0.042331762611866, 0.04632797837257385, 0.050324197858572006, 0.05432041734457016, 0.058316633105278015, 0.06231285259127617, 0.06630907207727432, 0.07030528783798218, 0.07430151104927063, 0.07829772680997849, 0.08229395747184753, 0.08629017323255539, 0.09028639644384384, 0.0942826122045517, 0.09827883541584015, 0.102275051176548, 0.10627126693725586, 0.11026749014854431, 0.11426370590925217, 0.11825992166996002, 0.12225614488124847, 0.12625236809253693, 0.13024857640266418, 0.13424479961395264, 0.1382410228252411, 0.14223723113536835, 0.1462334543466568, 0.15022967755794525, 0.1542258858680725, 0.15822210907936096, 0.16221833229064941, 0.16621455550193787, 0.17021076381206512, 0.17420698702335358, 0.17820319533348083, 0.1821994185447693, 0.18619562685489655, 0.190191850066185, 0.19418807327747345, 0.1981842815876007, 0.20218050479888916, 0.2061767280101776, 0.21017295122146606]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 6.0, 10.0, 21.0, 25.0, 23.0, 24.0, 43.0, 48.0, 50.0, 58.0, 80.0, 83.0, 80.0, 99.0, 59.0, 64.0, 46.0, 48.0, 32.0, 27.0, 20.0, 15.0, 17.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06990444660186768, -0.06785410642623901, -0.06580376625061035, -0.06375342607498169, -0.06170308589935303, -0.059652745723724365, -0.0576024055480957, -0.05555206537246704, -0.05350172519683838, -0.05145138502120972, -0.049401044845581055, -0.04735070466995239, -0.04530036449432373, -0.04325002431869507, -0.041199684143066406, -0.039149343967437744, -0.03709900379180908, -0.03504866361618042, -0.03299832344055176, -0.030947983264923096, -0.028897643089294434, -0.02684730291366577, -0.02479696273803711, -0.022746622562408447, -0.020696282386779785, -0.018645942211151123, -0.01659560203552246, -0.014545261859893799, -0.012494921684265137, -0.010444581508636475, -0.008394241333007812, -0.00634390115737915, -0.004293560981750488, -0.002243220806121826, -0.00019288063049316406, 0.001857459545135498, 0.00390779972076416, 0.005958139896392822, 0.008008480072021484, 0.010058820247650146, 0.012109160423278809, 0.01415950059890747, 0.016209840774536133, 0.018260180950164795, 0.020310521125793457, 0.02236086130142212, 0.02441120147705078, 0.026461541652679443, 0.028511881828308105, 0.030562222003936768, 0.03261256217956543, 0.03466290235519409, 0.036713242530822754, 0.038763582706451416, 0.04081392288208008, 0.04286426305770874, 0.0449146032333374, 0.046964943408966064, 0.04901528358459473, 0.05106562376022339, 0.05311596393585205, 0.05516630411148071, 0.057216644287109375, 0.05926698446273804, 0.0613173246383667]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 3.0, 10.0, 22.0, 34.0, 69.0, 115.0, 186.0, 422.0, 987.0, 2831.0, 12395.0, 106844.0, 718513.0, 182063.0, 18102.0, 3697.0, 1252.0, 494.0, 211.0, 119.0, 68.0, 43.0, 27.0, 12.0, 9.0, 11.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056182861328125, -0.054459571838378906, -0.05273628234863281, -0.05101299285888672, -0.049289703369140625, -0.04756641387939453, -0.04584312438964844, -0.044119834899902344, -0.04239654541015625, -0.040673255920410156, -0.03894996643066406, -0.03722667694091797, -0.035503387451171875, -0.03378009796142578, -0.03205680847167969, -0.030333518981933594, -0.0286102294921875, -0.026886940002441406, -0.025163650512695312, -0.02344036102294922, -0.021717071533203125, -0.01999378204345703, -0.018270492553710938, -0.016547203063964844, -0.01482391357421875, -0.013100624084472656, -0.011377334594726562, -0.009654045104980469, -0.007930755615234375, -0.006207466125488281, -0.0044841766357421875, -0.0027608871459960938, -0.00103759765625, 0.0006856918334960938, 0.0024089813232421875, 0.004132270812988281, 0.005855560302734375, 0.007578849792480469, 0.009302139282226562, 0.011025428771972656, 0.01274871826171875, 0.014472007751464844, 0.016195297241210938, 0.01791858673095703, 0.019641876220703125, 0.02136516571044922, 0.023088455200195312, 0.024811744689941406, 0.0265350341796875, 0.028258323669433594, 0.029981613159179688, 0.03170490264892578, 0.033428192138671875, 0.03515148162841797, 0.03687477111816406, 0.038598060607910156, 0.04032135009765625, 0.042044639587402344, 0.04376792907714844, 0.04549121856689453, 0.047214508056640625, 0.04893779754638672, 0.05066108703613281, 0.052384376525878906, 0.054107666015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 12.0, 7.0, 9.0, 15.0, 20.0, 35.0, 45.0, 57.0, 89.0, 58.0, 83.0, 83.0, 80.0, 74.0, 73.0, 53.0, 52.0, 46.0, 31.0, 23.0, 16.0, 11.0, 7.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019012451171875, -0.01848292350769043, -0.01795339584350586, -0.01742386817932129, -0.01689434051513672, -0.01636481285095215, -0.015835285186767578, -0.015305757522583008, -0.014776229858398438, -0.014246702194213867, -0.013717174530029297, -0.013187646865844727, -0.012658119201660156, -0.012128591537475586, -0.011599063873291016, -0.011069536209106445, -0.010540008544921875, -0.010010480880737305, -0.009480953216552734, -0.008951425552368164, -0.008421897888183594, -0.007892370223999023, -0.007362842559814453, -0.006833314895629883, -0.0063037872314453125, -0.005774259567260742, -0.005244731903076172, -0.0047152042388916016, -0.004185676574707031, -0.003656148910522461, -0.0031266212463378906, -0.0025970935821533203, -0.00206756591796875, -0.0015380382537841797, -0.0010085105895996094, -0.00047898292541503906, 5.054473876953125e-05, 0.0005800724029541016, 0.0011096000671386719, 0.0016391277313232422, 0.0021686553955078125, 0.002698183059692383, 0.003227710723876953, 0.0037572383880615234, 0.004286766052246094, 0.004816293716430664, 0.005345821380615234, 0.005875349044799805, 0.006404876708984375, 0.006934404373168945, 0.007463932037353516, 0.007993459701538086, 0.008522987365722656, 0.009052515029907227, 0.009582042694091797, 0.010111570358276367, 0.010641098022460938, 0.011170625686645508, 0.011700153350830078, 0.012229681015014648, 0.012759208679199219, 0.013288736343383789, 0.01381826400756836, 0.01434779167175293, 0.0148773193359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 4.0, 7.0, 10.0, 5.0, 20.0, 27.0, 21.0, 42.0, 56.0, 60.0, 96.0, 170.0, 349.0, 832.0, 3715.0, 22008.0, 167672.0, 616468.0, 204117.0, 26449.0, 4419.0, 1030.0, 390.0, 180.0, 115.0, 64.0, 54.0, 36.0, 35.0, 23.0, 17.0, 20.0, 10.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.031982421875, -0.030968666076660156, -0.029954910278320312, -0.02894115447998047, -0.027927398681640625, -0.02691364288330078, -0.025899887084960938, -0.024886131286621094, -0.02387237548828125, -0.022858619689941406, -0.021844863891601562, -0.02083110809326172, -0.019817352294921875, -0.01880359649658203, -0.017789840698242188, -0.016776084899902344, -0.0157623291015625, -0.014748573303222656, -0.013734817504882812, -0.012721061706542969, -0.011707305908203125, -0.010693550109863281, -0.009679794311523438, -0.008666038513183594, -0.00765228271484375, -0.006638526916503906, -0.0056247711181640625, -0.004611015319824219, -0.003597259521484375, -0.0025835037231445312, -0.0015697479248046875, -0.0005559921264648438, 0.000457763671875, 0.0014715194702148438, 0.0024852752685546875, 0.0034990310668945312, 0.004512786865234375, 0.005526542663574219, 0.0065402984619140625, 0.007554054260253906, 0.00856781005859375, 0.009581565856933594, 0.010595321655273438, 0.011609077453613281, 0.012622833251953125, 0.013636589050292969, 0.014650344848632812, 0.015664100646972656, 0.0166778564453125, 0.017691612243652344, 0.018705368041992188, 0.01971912384033203, 0.020732879638671875, 0.02174663543701172, 0.022760391235351562, 0.023774147033691406, 0.02478790283203125, 0.025801658630371094, 0.026815414428710938, 0.02782917022705078, 0.028842926025390625, 0.02985668182373047, 0.030870437622070312, 0.031884193420410156, 0.03289794921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 6.0, 8.0, 9.0, 12.0, 14.0, 20.0, 21.0, 29.0, 29.0, 29.0, 41.0, 39.0, 39.0, 40.0, 43.0, 39.0, 57.0, 47.0, 41.0, 47.0, 36.0, 44.0, 36.0, 37.0, 37.0, 28.0, 23.0, 27.0, 15.0, 16.0, 10.0, 17.0, 12.0, 12.0, 11.0, 9.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.039093017578125, -0.038004159927368164, -0.03691530227661133, -0.03582644462585449, -0.034737586975097656, -0.03364872932434082, -0.032559871673583984, -0.03147101402282715, -0.030382156372070312, -0.029293298721313477, -0.02820444107055664, -0.027115583419799805, -0.02602672576904297, -0.024937868118286133, -0.023849010467529297, -0.02276015281677246, -0.021671295166015625, -0.02058243751525879, -0.019493579864501953, -0.018404722213745117, -0.01731586456298828, -0.016227006912231445, -0.01513814926147461, -0.014049291610717773, -0.012960433959960938, -0.011871576309204102, -0.010782718658447266, -0.00969386100769043, -0.008605003356933594, -0.007516145706176758, -0.006427288055419922, -0.005338430404663086, -0.00424957275390625, -0.003160715103149414, -0.002071857452392578, -0.0009829998016357422, 0.00010585784912109375, 0.0011947154998779297, 0.0022835731506347656, 0.0033724308013916016, 0.0044612884521484375, 0.0055501461029052734, 0.006639003753662109, 0.007727861404418945, 0.008816719055175781, 0.009905576705932617, 0.010994434356689453, 0.012083292007446289, 0.013172149658203125, 0.014261007308959961, 0.015349864959716797, 0.016438722610473633, 0.01752758026123047, 0.018616437911987305, 0.01970529556274414, 0.020794153213500977, 0.021883010864257812, 0.02297186851501465, 0.024060726165771484, 0.02514958381652832, 0.026238441467285156, 0.027327299118041992, 0.028416156768798828, 0.029505014419555664, 0.0305938720703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 14.0, 8.0, 11.0, 16.0, 13.0, 13.0, 29.0, 21.0, 41.0, 44.0, 63.0, 93.0, 113.0, 138.0, 251.0, 447.0, 763.0, 2082.0, 7549.0, 56816.0, 495452.0, 428305.0, 45844.0, 6584.0, 1771.0, 740.0, 420.0, 253.0, 166.0, 107.0, 114.0, 71.0, 55.0, 41.0, 29.0, 18.0, 12.0, 12.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.01374053955078125, -0.013358354568481445, -0.01297616958618164, -0.012593984603881836, -0.012211799621582031, -0.011829614639282227, -0.011447429656982422, -0.011065244674682617, -0.010683059692382812, -0.010300874710083008, -0.009918689727783203, -0.009536504745483398, -0.009154319763183594, -0.008772134780883789, -0.008389949798583984, -0.00800776481628418, -0.007625579833984375, -0.00724339485168457, -0.006861209869384766, -0.006479024887084961, -0.006096839904785156, -0.0057146549224853516, -0.005332469940185547, -0.004950284957885742, -0.0045680999755859375, -0.004185914993286133, -0.003803730010986328, -0.0034215450286865234, -0.0030393600463867188, -0.002657175064086914, -0.0022749900817871094, -0.0018928050994873047, -0.0015106201171875, -0.0011284351348876953, -0.0007462501525878906, -0.00036406517028808594, 1.811981201171875e-05, 0.00040030479431152344, 0.0007824897766113281, 0.0011646747589111328, 0.0015468597412109375, 0.0019290447235107422, 0.002311229705810547, 0.0026934146881103516, 0.0030755996704101562, 0.003457784652709961, 0.0038399696350097656, 0.00422215461730957, 0.004604339599609375, 0.00498652458190918, 0.005368709564208984, 0.005750894546508789, 0.006133079528808594, 0.0065152645111083984, 0.006897449493408203, 0.007279634475708008, 0.0076618194580078125, 0.008044004440307617, 0.008426189422607422, 0.008808374404907227, 0.009190559387207031, 0.009572744369506836, 0.00995492935180664, 0.010337114334106445, 0.01071929931640625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 8.0, 25.0, 56.0, 123.0, 259.0, 267.0, 150.0, 61.0, 30.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022554397583007812, -0.00021928176283836365, -0.00021301954984664917, -0.0002067573368549347, -0.00020049512386322021, -0.00019423291087150574, -0.00018797069787979126, -0.00018170848488807678, -0.0001754462718963623, -0.00016918405890464783, -0.00016292184591293335, -0.00015665963292121887, -0.0001503974199295044, -0.00014413520693778992, -0.00013787299394607544, -0.00013161078095436096, -0.00012534856796264648, -0.00011908635497093201, -0.00011282414197921753, -0.00010656192898750305, -0.00010029971599578857, -9.40375030040741e-05, -8.777529001235962e-05, -8.151307702064514e-05, -7.525086402893066e-05, -6.898865103721619e-05, -6.272643804550171e-05, -5.646422505378723e-05, -5.0202012062072754e-05, -4.3939799070358276e-05, -3.76775860786438e-05, -3.141537308692932e-05, -2.5153160095214844e-05, -1.8890947103500366e-05, -1.2628734111785889e-05, -6.366521120071411e-06, -1.043081283569336e-07, 6.157904863357544e-06, 1.2420117855072021e-05, 1.86823308467865e-05, 2.4944543838500977e-05, 3.1206756830215454e-05, 3.746896982192993e-05, 4.373118281364441e-05, 4.999339580535889e-05, 5.6255608797073364e-05, 6.251782178878784e-05, 6.878003478050232e-05, 7.50422477722168e-05, 8.130446076393127e-05, 8.756667375564575e-05, 9.382888674736023e-05, 0.00010009109973907471, 0.00010635331273078918, 0.00011261552572250366, 0.00011887773871421814, 0.00012513995170593262, 0.0001314021646976471, 0.00013766437768936157, 0.00014392659068107605, 0.00015018880367279053, 0.000156451016664505, 0.00016271322965621948, 0.00016897544264793396, 0.00017523765563964844]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 7.0, 23.0, 37.0, 63.0, 133.0, 270.0, 626.0, 2040.0, 18186.0, 527355.0, 480339.0, 16357.0, 1984.0, 593.0, 255.0, 129.0, 72.0, 25.0, 21.0, 14.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0270843505859375, -0.02645421028137207, -0.02582406997680664, -0.02519392967224121, -0.02456378936767578, -0.02393364906311035, -0.023303508758544922, -0.022673368453979492, -0.022043228149414062, -0.021413087844848633, -0.020782947540283203, -0.020152807235717773, -0.019522666931152344, -0.018892526626586914, -0.018262386322021484, -0.017632246017456055, -0.017002105712890625, -0.016371965408325195, -0.015741825103759766, -0.015111684799194336, -0.014481544494628906, -0.013851404190063477, -0.013221263885498047, -0.012591123580932617, -0.011960983276367188, -0.011330842971801758, -0.010700702667236328, -0.010070562362670898, -0.009440422058105469, -0.008810281753540039, -0.00818014144897461, -0.00755000114440918, -0.00691986083984375, -0.00628972053527832, -0.005659580230712891, -0.005029439926147461, -0.004399299621582031, -0.0037691593170166016, -0.003139019012451172, -0.002508878707885742, -0.0018787384033203125, -0.0012485980987548828, -0.0006184577941894531, 1.1682510375976562e-05, 0.0006418228149414062, 0.001271963119506836, 0.0019021034240722656, 0.0025322437286376953, 0.003162384033203125, 0.0037925243377685547, 0.004422664642333984, 0.005052804946899414, 0.005682945251464844, 0.0063130855560302734, 0.006943225860595703, 0.007573366165161133, 0.008203506469726562, 0.008833646774291992, 0.009463787078857422, 0.010093927383422852, 0.010724067687988281, 0.011354207992553711, 0.01198434829711914, 0.01261448860168457, 0.01324462890625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 10.0, 22.0, 31.0, 58.0, 89.0, 112.0, 130.0, 145.0, 127.0, 98.0, 73.0, 46.0, 23.0, 13.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02392578125, -0.023298263549804688, -0.022670745849609375, -0.022043228149414062, -0.02141571044921875, -0.020788192749023438, -0.020160675048828125, -0.019533157348632812, -0.0189056396484375, -0.018278121948242188, -0.017650604248046875, -0.017023086547851562, -0.01639556884765625, -0.015768051147460938, -0.015140533447265625, -0.014513015747070312, -0.013885498046875, -0.013257980346679688, -0.012630462646484375, -0.012002944946289062, -0.01137542724609375, -0.010747909545898438, -0.010120391845703125, -0.009492874145507812, -0.0088653564453125, -0.008237838745117188, -0.007610321044921875, -0.0069828033447265625, -0.00635528564453125, -0.0057277679443359375, -0.005100250244140625, -0.0044727325439453125, -0.00384521484375, -0.0032176971435546875, -0.002590179443359375, -0.0019626617431640625, -0.00133514404296875, -0.0007076263427734375, -8.0108642578125e-05, 0.0005474090576171875, 0.0011749267578125, 0.0018024444580078125, 0.002429962158203125, 0.0030574798583984375, 0.00368499755859375, 0.0043125152587890625, 0.004940032958984375, 0.0055675506591796875, 0.006195068359375, 0.0068225860595703125, 0.007450103759765625, 0.008077621459960938, 0.00870513916015625, 0.009332656860351562, 0.009960174560546875, 0.010587692260742188, 0.0112152099609375, 0.011842727661132812, 0.012470245361328125, 0.013097763061523438, 0.01372528076171875, 0.014352798461914062, 0.014980316162109375, 0.015607833862304688, 0.0162353515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 143.0, 655.0, 192.0, 10.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7687674760818481, -0.7418866753578186, -0.7150059342384338, -0.6881251335144043, -0.6612443923950195, -0.63436359167099, -0.6074827909469604, -0.5806020498275757, -0.5537213087081909, -0.5268405079841614, -0.4999597668647766, -0.47307896614074707, -0.4461982250213623, -0.41931742429733276, -0.3924366533756256, -0.36555588245391846, -0.3386750817298889, -0.31179431080818176, -0.2849135398864746, -0.25803273916244507, -0.2311519831418991, -0.20427121222019196, -0.1773904263973236, -0.15050965547561646, -0.1236288845539093, -0.09674811363220215, -0.0698673352599144, -0.04298655688762665, -0.016105785965919495, 0.010774984955787659, 0.037655770778656006, 0.06453654170036316, 0.09141731262207031, 0.11829808354377747, 0.14517885446548462, 0.17205964028835297, 0.19894041121006012, 0.22582118213176727, 0.2527019679546356, 0.2795827388763428, 0.3064635097980499, 0.3333442807197571, 0.36022505164146423, 0.3871058225631714, 0.4139866232872009, 0.4408673644065857, 0.46774816513061523, 0.4946289360523224, 0.5215097069740295, 0.5483905076980591, 0.5752712488174438, 0.6021520495414734, 0.6290327906608582, 0.6559135913848877, 0.6827943325042725, 0.709675133228302, 0.7365559339523315, 0.7634367346763611, 0.7903174757957458, 0.8171982765197754, 0.8440790176391602, 0.8709598183631897, 0.8978406190872192, 0.924721360206604, 0.9516021013259888]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 10.0, 12.0, 15.0, 14.0, 15.0, 19.0, 18.0, 19.0, 36.0, 31.0, 43.0, 44.0, 37.0, 36.0, 41.0, 43.0, 47.0, 40.0, 49.0, 40.0, 37.0, 44.0, 51.0, 29.0, 31.0, 35.0, 23.0, 19.0, 14.0, 16.0, 15.0, 9.0, 18.0, 9.0, 11.0, 4.0, 4.0, 10.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16052979230880737, -0.15533432364463806, -0.15013884007930756, -0.14494337141513824, -0.13974788784980774, -0.13455241918563843, -0.12935693562030792, -0.12416146695613861, -0.1189659908413887, -0.1137705147266388, -0.10857503861188889, -0.10337956249713898, -0.09818409383296967, -0.09298861026763916, -0.08779314160346985, -0.08259766548871994, -0.07740218937397003, -0.07220671325922012, -0.06701123714447021, -0.061815764755010605, -0.056620288640260696, -0.05142481252551079, -0.04622934013605118, -0.04103386402130127, -0.03583838790655136, -0.030642911791801453, -0.025447437539696693, -0.020251963287591934, -0.015056487172842026, -0.009861011058092117, -0.004665536805987358, 0.0005299374461174011, 0.00572541356086731, 0.010920888744294643, 0.016116363927721977, 0.021311838179826736, 0.026507314294576645, 0.03170279040932655, 0.03689826279878616, 0.04209373891353607, 0.04728921502828598, 0.05248469114303589, 0.0576801672577858, 0.0628756433725357, 0.06807111203670502, 0.07326659560203552, 0.07846206426620483, 0.08365754038095474, 0.08885301649570465, 0.09404849261045456, 0.09924396872520447, 0.10443944483995438, 0.10963492095470428, 0.1148303896188736, 0.1200258657336235, 0.1252213418483734, 0.13041681051254272, 0.13561227917671204, 0.14080776274204254, 0.14600323140621185, 0.15119871497154236, 0.15639418363571167, 0.16158966720104218, 0.1667851358652115, 0.171980619430542]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 11.0, 22.0, 33.0, 67.0, 127.0, 212.0, 488.0, 1526.0, 7132.0, 101771.0, 4048279.0, 28646.0, 4099.0, 1088.0, 361.0, 183.0, 91.0, 56.0, 23.0, 26.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11083984375, -0.1077871322631836, -0.10473442077636719, -0.10168170928955078, -0.09862899780273438, -0.09557628631591797, -0.09252357482910156, -0.08947086334228516, -0.08641815185546875, -0.08336544036865234, -0.08031272888183594, -0.07726001739501953, -0.07420730590820312, -0.07115459442138672, -0.06810188293457031, -0.0650491714477539, -0.0619964599609375, -0.058943748474121094, -0.05589103698730469, -0.05283832550048828, -0.049785614013671875, -0.04673290252685547, -0.04368019104003906, -0.040627479553222656, -0.03757476806640625, -0.034522056579589844, -0.03146934509277344, -0.02841663360595703, -0.025363922119140625, -0.02231121063232422, -0.019258499145507812, -0.016205787658691406, -0.013153076171875, -0.010100364685058594, -0.0070476531982421875, -0.003994941711425781, -0.000942230224609375, 0.0021104812622070312, 0.0051631927490234375, 0.008215904235839844, 0.01126861572265625, 0.014321327209472656, 0.017374038696289062, 0.02042675018310547, 0.023479461669921875, 0.02653217315673828, 0.029584884643554688, 0.032637596130371094, 0.0356903076171875, 0.038743019104003906, 0.04179573059082031, 0.04484844207763672, 0.047901153564453125, 0.05095386505126953, 0.05400657653808594, 0.057059288024902344, 0.06011199951171875, 0.06316471099853516, 0.06621742248535156, 0.06927013397216797, 0.07232284545898438, 0.07537555694580078, 0.07842826843261719, 0.0814809799194336, 0.08453369140625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 10.0, 15.0, 15.0, 22.0, 37.0, 52.0, 56.0, 64.0, 71.0, 89.0, 84.0, 84.0, 88.0, 69.0, 56.0, 54.0, 30.0, 31.0, 16.0, 14.0, 11.0, 4.0, 4.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0192718505859375, -0.018731236457824707, -0.018190622329711914, -0.01765000820159912, -0.017109394073486328, -0.016568779945373535, -0.016028165817260742, -0.01548755168914795, -0.014946937561035156, -0.014406323432922363, -0.01386570930480957, -0.013325095176696777, -0.012784481048583984, -0.012243866920471191, -0.011703252792358398, -0.011162638664245605, -0.010622024536132812, -0.01008141040802002, -0.009540796279907227, -0.009000182151794434, -0.00845956802368164, -0.007918953895568848, -0.007378339767456055, -0.006837725639343262, -0.006297111511230469, -0.005756497383117676, -0.005215883255004883, -0.00467526912689209, -0.004134654998779297, -0.003594040870666504, -0.003053426742553711, -0.002512812614440918, -0.001972198486328125, -0.001431584358215332, -0.0008909702301025391, -0.0003503561019897461, 0.00019025802612304688, 0.0007308721542358398, 0.0012714862823486328, 0.0018121004104614258, 0.0023527145385742188, 0.0028933286666870117, 0.0034339427947998047, 0.003974556922912598, 0.004515171051025391, 0.005055785179138184, 0.0055963993072509766, 0.0061370134353637695, 0.0066776275634765625, 0.0072182416915893555, 0.0077588558197021484, 0.008299469947814941, 0.008840084075927734, 0.009380698204040527, 0.00992131233215332, 0.010461926460266113, 0.011002540588378906, 0.0115431547164917, 0.012083768844604492, 0.012624382972717285, 0.013164997100830078, 0.013705611228942871, 0.014246225357055664, 0.014786839485168457, 0.01532745361328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 10.0, 11.0, 21.0, 22.0, 46.0, 78.0, 125.0, 218.0, 345.0, 751.0, 1857.0, 6081.0, 29706.0, 767458.0, 3334705.0, 40904.0, 7631.0, 2360.0, 910.0, 420.0, 242.0, 145.0, 88.0, 61.0, 36.0, 20.0, 10.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04779052734375, -0.04642820358276367, -0.045065879821777344, -0.043703556060791016, -0.04234123229980469, -0.04097890853881836, -0.03961658477783203, -0.0382542610168457, -0.036891937255859375, -0.03552961349487305, -0.03416728973388672, -0.03280496597290039, -0.03144264221191406, -0.030080318450927734, -0.028717994689941406, -0.027355670928955078, -0.02599334716796875, -0.024631023406982422, -0.023268699645996094, -0.021906375885009766, -0.020544052124023438, -0.01918172836303711, -0.01781940460205078, -0.016457080841064453, -0.015094757080078125, -0.013732433319091797, -0.012370109558105469, -0.01100778579711914, -0.009645462036132812, -0.008283138275146484, -0.006920814514160156, -0.005558490753173828, -0.0041961669921875, -0.002833843231201172, -0.0014715194702148438, -0.00010919570922851562, 0.0012531280517578125, 0.0026154518127441406, 0.003977775573730469, 0.005340099334716797, 0.006702423095703125, 0.008064746856689453, 0.009427070617675781, 0.01078939437866211, 0.012151718139648438, 0.013514041900634766, 0.014876365661621094, 0.016238689422607422, 0.01760101318359375, 0.018963336944580078, 0.020325660705566406, 0.021687984466552734, 0.023050308227539062, 0.02441263198852539, 0.02577495574951172, 0.027137279510498047, 0.028499603271484375, 0.029861927032470703, 0.03122425079345703, 0.03258657455444336, 0.03394889831542969, 0.035311222076416016, 0.036673545837402344, 0.03803586959838867, 0.039398193359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 9.0, 23.0, 43.0, 62.0, 212.0, 2333.0, 1058.0, 165.0, 65.0, 34.0, 16.0, 16.0, 7.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0221710205078125, -0.02142930030822754, -0.020687580108642578, -0.019945859909057617, -0.019204139709472656, -0.018462419509887695, -0.017720699310302734, -0.016978979110717773, -0.016237258911132812, -0.015495538711547852, -0.01475381851196289, -0.01401209831237793, -0.013270378112792969, -0.012528657913208008, -0.011786937713623047, -0.011045217514038086, -0.010303497314453125, -0.009561777114868164, -0.008820056915283203, -0.008078336715698242, -0.007336616516113281, -0.00659489631652832, -0.005853176116943359, -0.0051114559173583984, -0.0043697357177734375, -0.0036280155181884766, -0.0028862953186035156, -0.0021445751190185547, -0.0014028549194335938, -0.0006611347198486328, 8.058547973632812e-05, 0.0008223056793212891, 0.00156402587890625, 0.002305746078491211, 0.003047466278076172, 0.003789186477661133, 0.004530906677246094, 0.005272626876831055, 0.006014347076416016, 0.0067560672760009766, 0.0074977874755859375, 0.008239507675170898, 0.00898122787475586, 0.00972294807434082, 0.010464668273925781, 0.011206388473510742, 0.011948108673095703, 0.012689828872680664, 0.013431549072265625, 0.014173269271850586, 0.014914989471435547, 0.015656709671020508, 0.01639842987060547, 0.01714015007019043, 0.01788187026977539, 0.01862359046936035, 0.019365310668945312, 0.020107030868530273, 0.020848751068115234, 0.021590471267700195, 0.022332191467285156, 0.023073911666870117, 0.023815631866455078, 0.02455735206604004, 0.025299072265625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 25.0, 185.0, 464.0, 260.0, 39.0, 11.0, 5.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17471513152122498, -0.16899962723255157, -0.16328412294387817, -0.15756861865520477, -0.15185311436653137, -0.14613761007785797, -0.14042210578918457, -0.13470660150051117, -0.12899109721183777, -0.12327559292316437, -0.11756008863449097, -0.11184458434581757, -0.10612908005714417, -0.10041357576847076, -0.09469807147979736, -0.08898256719112396, -0.08326706290245056, -0.07755155861377716, -0.07183605432510376, -0.06612055003643036, -0.06040504574775696, -0.05468954145908356, -0.048974037170410156, -0.043258532881736755, -0.037543028593063354, -0.031827524304389954, -0.026112020015716553, -0.020396515727043152, -0.014681011438369751, -0.00896550714969635, -0.0032500028610229492, 0.0024655014276504517, 0.008180990815162659, 0.01389649510383606, 0.01961199939250946, 0.02532750368118286, 0.031043007969856262, 0.03675851225852966, 0.042474016547203064, 0.048189520835876465, 0.053905025124549866, 0.05962052941322327, 0.06533603370189667, 0.07105153799057007, 0.07676704227924347, 0.08248254656791687, 0.08819805085659027, 0.09391355514526367, 0.09962905943393707, 0.10534456372261047, 0.11106006801128387, 0.11677557229995728, 0.12249107658863068, 0.12820658087730408, 0.13392208516597748, 0.13963758945465088, 0.14535309374332428, 0.15106859803199768, 0.15678410232067108, 0.16249960660934448, 0.16821511089801788, 0.17393061518669128, 0.17964611947536469, 0.18536162376403809, 0.1910771280527115]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 17.0, 15.0, 13.0, 36.0, 41.0, 66.0, 83.0, 91.0, 111.0, 85.0, 84.0, 85.0, 64.0, 55.0, 41.0, 28.0, 20.0, 15.0, 12.0, 4.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06244534254074097, -0.060321059077978134, -0.0581967756152153, -0.05607248842716217, -0.05394820496439934, -0.051823921501636505, -0.049699634313583374, -0.04757535085082054, -0.04545106738805771, -0.043326783925294876, -0.04120250046253204, -0.03907821327447891, -0.03695392981171608, -0.03482964634895325, -0.032705359160900116, -0.030581075698137283, -0.02845679223537445, -0.026332508772611618, -0.024208223447203636, -0.022083938121795654, -0.01995965465903282, -0.01783537119626999, -0.015711085870862007, -0.0135868014767766, -0.011462517082691193, -0.009338232688605785, -0.007213948294520378, -0.005089663900434971, -0.0029653795063495636, -0.0008410951122641563, 0.001283189281821251, 0.003407473675906658, 0.005531758069992065, 0.007656042464077473, 0.00978032685816288, 0.011904611252248287, 0.014028895646333694, 0.016153179109096527, 0.01827746443450451, 0.02040174975991249, 0.022526033222675323, 0.024650316685438156, 0.026774602010846138, 0.02889888733625412, 0.031023170799016953, 0.033147454261779785, 0.035271741449832916, 0.03739602491259575, 0.03952030837535858, 0.041644591838121414, 0.04376887530088425, 0.04589316248893738, 0.04801744595170021, 0.05014172941446304, 0.052266016602516174, 0.05439030006527901, 0.05651458352804184, 0.05863886699080467, 0.060763150453567505, 0.06288743764162064, 0.06501172482967377, 0.0671360045671463, 0.06926029175519943, 0.07138457149267197, 0.0735088586807251]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 4.0, 8.0, 17.0, 18.0, 37.0, 51.0, 55.0, 85.0, 145.0, 246.0, 473.0, 830.0, 1756.0, 4289.0, 14780.0, 87899.0, 565705.0, 317461.0, 40239.0, 8569.0, 2982.0, 1324.0, 647.0, 346.0, 202.0, 105.0, 79.0, 54.0, 32.0, 29.0, 20.0, 17.0, 10.0, 9.0, 3.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04302978515625, -0.0417180061340332, -0.040406227111816406, -0.03909444808959961, -0.03778266906738281, -0.036470890045166016, -0.03515911102294922, -0.03384733200073242, -0.032535552978515625, -0.031223773956298828, -0.02991199493408203, -0.028600215911865234, -0.027288436889648438, -0.02597665786743164, -0.024664878845214844, -0.023353099822998047, -0.02204132080078125, -0.020729541778564453, -0.019417762756347656, -0.01810598373413086, -0.016794204711914062, -0.015482425689697266, -0.014170646667480469, -0.012858867645263672, -0.011547088623046875, -0.010235309600830078, -0.008923530578613281, -0.007611751556396484, -0.0062999725341796875, -0.004988193511962891, -0.0036764144897460938, -0.002364635467529297, -0.0010528564453125, 0.0002589225769042969, 0.0015707015991210938, 0.0028824806213378906, 0.0041942596435546875, 0.005506038665771484, 0.006817817687988281, 0.008129596710205078, 0.009441375732421875, 0.010753154754638672, 0.012064933776855469, 0.013376712799072266, 0.014688491821289062, 0.01600027084350586, 0.017312049865722656, 0.018623828887939453, 0.01993560791015625, 0.021247386932373047, 0.022559165954589844, 0.02387094497680664, 0.025182723999023438, 0.026494503021240234, 0.02780628204345703, 0.029118061065673828, 0.030429840087890625, 0.03174161911010742, 0.03305339813232422, 0.034365177154541016, 0.03567695617675781, 0.03698873519897461, 0.038300514221191406, 0.0396122932434082, 0.040924072265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 13.0, 21.0, 12.0, 27.0, 46.0, 54.0, 62.0, 80.0, 83.0, 72.0, 99.0, 88.0, 82.0, 71.0, 43.0, 40.0, 30.0, 20.0, 11.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.019730091094970703, -0.019165992736816406, -0.01860189437866211, -0.018037796020507812, -0.017473697662353516, -0.01690959930419922, -0.016345500946044922, -0.015781402587890625, -0.015217304229736328, -0.014653205871582031, -0.014089107513427734, -0.013525009155273438, -0.01296091079711914, -0.012396812438964844, -0.011832714080810547, -0.01126861572265625, -0.010704517364501953, -0.010140419006347656, -0.00957632064819336, -0.009012222290039062, -0.008448123931884766, -0.007884025573730469, -0.007319927215576172, -0.006755828857421875, -0.006191730499267578, -0.005627632141113281, -0.005063533782958984, -0.0044994354248046875, -0.003935337066650391, -0.0033712387084960938, -0.002807140350341797, -0.0022430419921875, -0.0016789436340332031, -0.0011148452758789062, -0.0005507469177246094, 1.33514404296875e-05, 0.0005774497985839844, 0.0011415481567382812, 0.0017056465148925781, 0.002269744873046875, 0.002833843231201172, 0.0033979415893554688, 0.003962039947509766, 0.0045261383056640625, 0.005090236663818359, 0.005654335021972656, 0.006218433380126953, 0.00678253173828125, 0.007346630096435547, 0.007910728454589844, 0.00847482681274414, 0.009038925170898438, 0.009603023529052734, 0.010167121887207031, 0.010731220245361328, 0.011295318603515625, 0.011859416961669922, 0.012423515319824219, 0.012987613677978516, 0.013551712036132812, 0.01411581039428711, 0.014679908752441406, 0.015244007110595703, 0.01580810546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 8.0, 5.0, 12.0, 20.0, 23.0, 23.0, 43.0, 47.0, 55.0, 85.0, 113.0, 139.0, 230.0, 347.0, 471.0, 903.0, 1795.0, 4911.0, 17593.0, 86502.0, 436556.0, 398730.0, 75509.0, 15829.0, 4442.0, 1694.0, 908.0, 461.0, 331.0, 205.0, 136.0, 109.0, 74.0, 58.0, 42.0, 37.0, 27.0, 20.0, 18.0, 10.0, 10.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.027496337890625, -0.02673172950744629, -0.025967121124267578, -0.025202512741088867, -0.024437904357910156, -0.023673295974731445, -0.022908687591552734, -0.022144079208374023, -0.021379470825195312, -0.0206148624420166, -0.01985025405883789, -0.01908564567565918, -0.01832103729248047, -0.017556428909301758, -0.016791820526123047, -0.016027212142944336, -0.015262603759765625, -0.014497995376586914, -0.013733386993408203, -0.012968778610229492, -0.012204170227050781, -0.01143956184387207, -0.01067495346069336, -0.009910345077514648, -0.009145736694335938, -0.008381128311157227, -0.007616519927978516, -0.006851911544799805, -0.006087303161621094, -0.005322694778442383, -0.004558086395263672, -0.003793478012084961, -0.00302886962890625, -0.002264261245727539, -0.0014996528625488281, -0.0007350444793701172, 2.956390380859375e-05, 0.0007941722869873047, 0.0015587806701660156, 0.0023233890533447266, 0.0030879974365234375, 0.0038526058197021484, 0.004617214202880859, 0.00538182258605957, 0.006146430969238281, 0.006911039352416992, 0.007675647735595703, 0.008440256118774414, 0.009204864501953125, 0.009969472885131836, 0.010734081268310547, 0.011498689651489258, 0.012263298034667969, 0.01302790641784668, 0.01379251480102539, 0.014557123184204102, 0.015321731567382812, 0.016086339950561523, 0.016850948333740234, 0.017615556716918945, 0.018380165100097656, 0.019144773483276367, 0.019909381866455078, 0.02067399024963379, 0.0214385986328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 4.0, 7.0, 11.0, 4.0, 9.0, 18.0, 11.0, 17.0, 17.0, 28.0, 20.0, 27.0, 30.0, 38.0, 36.0, 43.0, 40.0, 39.0, 48.0, 41.0, 45.0, 42.0, 27.0, 43.0, 35.0, 35.0, 40.0, 27.0, 23.0, 33.0, 28.0, 19.0, 25.0, 17.0, 13.0, 10.0, 6.0, 7.0, 6.0, 1.0, 6.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.03436279296875, -0.03330183029174805, -0.032240867614746094, -0.03117990493774414, -0.030118942260742188, -0.029057979583740234, -0.02799701690673828, -0.026936054229736328, -0.025875091552734375, -0.024814128875732422, -0.02375316619873047, -0.022692203521728516, -0.021631240844726562, -0.02057027816772461, -0.019509315490722656, -0.018448352813720703, -0.01738739013671875, -0.016326427459716797, -0.015265464782714844, -0.01420450210571289, -0.013143539428710938, -0.012082576751708984, -0.011021614074707031, -0.009960651397705078, -0.008899688720703125, -0.007838726043701172, -0.006777763366699219, -0.005716800689697266, -0.0046558380126953125, -0.0035948753356933594, -0.0025339126586914062, -0.0014729499816894531, -0.0004119873046875, 0.0006489753723144531, 0.0017099380493164062, 0.0027709007263183594, 0.0038318634033203125, 0.004892826080322266, 0.005953788757324219, 0.007014751434326172, 0.008075714111328125, 0.009136676788330078, 0.010197639465332031, 0.011258602142333984, 0.012319564819335938, 0.01338052749633789, 0.014441490173339844, 0.015502452850341797, 0.01656341552734375, 0.017624378204345703, 0.018685340881347656, 0.01974630355834961, 0.020807266235351562, 0.021868228912353516, 0.02292919158935547, 0.023990154266357422, 0.025051116943359375, 0.026112079620361328, 0.02717304229736328, 0.028234004974365234, 0.029294967651367188, 0.03035593032836914, 0.031416893005371094, 0.03247785568237305, 0.033538818359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 13.0, 13.0, 26.0, 45.0, 55.0, 127.0, 256.0, 472.0, 1133.0, 4397.0, 42702.0, 726529.0, 255792.0, 13295.0, 2228.0, 753.0, 312.0, 160.0, 89.0, 50.0, 29.0, 23.0, 22.0, 10.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02117919921875, -0.02058720588684082, -0.01999521255493164, -0.01940321922302246, -0.01881122589111328, -0.0182192325592041, -0.017627239227294922, -0.017035245895385742, -0.016443252563476562, -0.015851259231567383, -0.015259265899658203, -0.014667272567749023, -0.014075279235839844, -0.013483285903930664, -0.012891292572021484, -0.012299299240112305, -0.011707305908203125, -0.011115312576293945, -0.010523319244384766, -0.009931325912475586, -0.009339332580566406, -0.008747339248657227, -0.008155345916748047, -0.007563352584838867, -0.0069713592529296875, -0.006379365921020508, -0.005787372589111328, -0.0051953792572021484, -0.004603385925292969, -0.004011392593383789, -0.0034193992614746094, -0.0028274059295654297, -0.00223541259765625, -0.0016434192657470703, -0.0010514259338378906, -0.00045943260192871094, 0.00013256072998046875, 0.0007245540618896484, 0.0013165473937988281, 0.0019085407257080078, 0.0025005340576171875, 0.003092527389526367, 0.003684520721435547, 0.0042765140533447266, 0.004868507385253906, 0.005460500717163086, 0.006052494049072266, 0.006644487380981445, 0.007236480712890625, 0.007828474044799805, 0.008420467376708984, 0.009012460708618164, 0.009604454040527344, 0.010196447372436523, 0.010788440704345703, 0.011380434036254883, 0.011972427368164062, 0.012564420700073242, 0.013156414031982422, 0.013748407363891602, 0.014340400695800781, 0.014932394027709961, 0.01552438735961914, 0.01611638069152832, 0.0167083740234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 13.0, 27.0, 62.0, 111.0, 212.0, 229.0, 174.0, 100.0, 38.0, 20.0, 9.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.0001186951994895935, -0.00011436641216278076, -0.00011003762483596802, -0.00010570883750915527, -0.00010138005018234253, -9.705126285552979e-05, -9.272247552871704e-05, -8.83936882019043e-05, -8.406490087509155e-05, -7.973611354827881e-05, -7.540732622146606e-05, -7.107853889465332e-05, -6.674975156784058e-05, -6.242096424102783e-05, -5.809217691421509e-05, -5.3763389587402344e-05, -4.94346022605896e-05, -4.5105814933776855e-05, -4.077702760696411e-05, -3.644824028015137e-05, -3.211945295333862e-05, -2.779066562652588e-05, -2.3461878299713135e-05, -1.913309097290039e-05, -1.4804303646087646e-05, -1.0475516319274902e-05, -6.146728992462158e-06, -1.817941665649414e-06, 2.51084566116333e-06, 6.839632987976074e-06, 1.1168420314788818e-05, 1.5497207641601562e-05, 1.9825994968414307e-05, 2.415478229522705e-05, 2.8483569622039795e-05, 3.281235694885254e-05, 3.714114427566528e-05, 4.146993160247803e-05, 4.579871892929077e-05, 5.0127506256103516e-05, 5.445629358291626e-05, 5.8785080909729004e-05, 6.311386823654175e-05, 6.744265556335449e-05, 7.177144289016724e-05, 7.610023021697998e-05, 8.042901754379272e-05, 8.475780487060547e-05, 8.908659219741821e-05, 9.341537952423096e-05, 9.77441668510437e-05, 0.00010207295417785645, 0.00010640174150466919, 0.00011073052883148193, 0.00011505931615829468, 0.00011938810348510742, 0.00012371689081192017, 0.0001280456781387329, 0.00013237446546554565, 0.0001367032527923584, 0.00014103204011917114, 0.0001453608274459839, 0.00014968961477279663, 0.00015401840209960938]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 15.0, 34.0, 66.0, 174.0, 385.0, 1318.0, 12544.0, 747650.0, 279744.0, 5214.0, 843.0, 328.0, 120.0, 63.0, 17.0, 8.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0162200927734375, -0.015359640121459961, -0.014499187469482422, -0.013638734817504883, -0.012778282165527344, -0.011917829513549805, -0.011057376861572266, -0.010196924209594727, -0.009336471557617188, -0.008476018905639648, -0.007615566253662109, -0.00675511360168457, -0.005894660949707031, -0.005034208297729492, -0.004173755645751953, -0.003313302993774414, -0.002452850341796875, -0.001592397689819336, -0.0007319450378417969, 0.0001285076141357422, 0.0009889602661132812, 0.0018494129180908203, 0.0027098655700683594, 0.0035703182220458984, 0.0044307708740234375, 0.0052912235260009766, 0.006151676177978516, 0.007012128829956055, 0.007872581481933594, 0.008733034133911133, 0.009593486785888672, 0.010453939437866211, 0.01131439208984375, 0.012174844741821289, 0.013035297393798828, 0.013895750045776367, 0.014756202697753906, 0.015616655349731445, 0.016477108001708984, 0.017337560653686523, 0.018198013305664062, 0.0190584659576416, 0.01991891860961914, 0.02077937126159668, 0.02163982391357422, 0.022500276565551758, 0.023360729217529297, 0.024221181869506836, 0.025081634521484375, 0.025942087173461914, 0.026802539825439453, 0.027662992477416992, 0.02852344512939453, 0.02938389778137207, 0.03024435043334961, 0.03110480308532715, 0.03196525573730469, 0.03282570838928223, 0.033686161041259766, 0.034546613693237305, 0.035407066345214844, 0.03626751899719238, 0.03712797164916992, 0.03798842430114746, 0.038848876953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 19.0, 49.0, 74.0, 142.0, 193.0, 221.0, 161.0, 79.0, 28.0, 16.0, 14.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0161285400390625, -0.01517796516418457, -0.01422739028930664, -0.013276815414428711, -0.012326240539550781, -0.011375665664672852, -0.010425090789794922, -0.009474515914916992, -0.008523941040039062, -0.007573366165161133, -0.006622791290283203, -0.0056722164154052734, -0.004721641540527344, -0.003771066665649414, -0.0028204917907714844, -0.0018699169158935547, -0.000919342041015625, 3.123283386230469e-05, 0.0009818077087402344, 0.001932382583618164, 0.0028829574584960938, 0.0038335323333740234, 0.004784107208251953, 0.005734682083129883, 0.0066852569580078125, 0.007635831832885742, 0.008586406707763672, 0.009536981582641602, 0.010487556457519531, 0.011438131332397461, 0.01238870620727539, 0.01333928108215332, 0.01428985595703125, 0.01524043083190918, 0.01619100570678711, 0.01714158058166504, 0.01809215545654297, 0.0190427303314209, 0.019993305206298828, 0.020943880081176758, 0.021894454956054688, 0.022845029830932617, 0.023795604705810547, 0.024746179580688477, 0.025696754455566406, 0.026647329330444336, 0.027597904205322266, 0.028548479080200195, 0.029499053955078125, 0.030449628829956055, 0.031400203704833984, 0.032350778579711914, 0.033301353454589844, 0.03425192832946777, 0.0352025032043457, 0.03615307807922363, 0.03710365295410156, 0.03805422782897949, 0.03900480270385742, 0.03995537757873535, 0.04090595245361328, 0.04185652732849121, 0.04280710220336914, 0.04375767707824707, 0.044708251953125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 57.0, 179.0, 301.0, 238.0, 142.0, 46.0, 18.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17521151900291443, -0.16320161521434784, -0.15119171142578125, -0.13918179273605347, -0.12717190384864807, -0.11516199260950089, -0.1031520813703537, -0.09114217758178711, -0.07913227379322052, -0.06712237000465393, -0.05511246249079704, -0.043102554976940155, -0.031092651188373566, -0.019082747399806976, -0.00707283616065979, 0.004937067627906799, 0.01694697141647339, 0.028956877067685127, 0.040966782718896866, 0.052976690232753754, 0.06498659402132034, 0.07699649780988693, 0.08900640904903412, 0.10101631283760071, 0.1130262166261673, 0.1250361204147339, 0.13704602420330048, 0.14905592799186707, 0.16106584668159485, 0.17307573556900024, 0.18508565425872803, 0.19709555804729462, 0.20910543203353882, 0.2211153358221054, 0.233125239610672, 0.24513515830039978, 0.2571450471878052, 0.26915496587753296, 0.28116488456726074, 0.29317477345466614, 0.30518466234207153, 0.3171945810317993, 0.3292044699192047, 0.3412143886089325, 0.3532242774963379, 0.3652341961860657, 0.37724411487579346, 0.38925400376319885, 0.40126392245292664, 0.4132738411426544, 0.4252837300300598, 0.4372936487197876, 0.449303537607193, 0.4613134562969208, 0.47332334518432617, 0.48533326387405396, 0.49734318256378174, 0.5093531012535095, 0.5213630199432373, 0.5333728790283203, 0.5453827977180481, 0.5573927164077759, 0.5694026350975037, 0.5814125537872314, 0.5934224128723145]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 1.0, 3.0, 5.0, 8.0, 14.0, 15.0, 14.0, 14.0, 14.0, 27.0, 22.0, 22.0, 34.0, 37.0, 33.0, 41.0, 40.0, 41.0, 42.0, 44.0, 50.0, 42.0, 44.0, 54.0, 36.0, 34.0, 30.0, 27.0, 34.0, 23.0, 21.0, 23.0, 20.0, 22.0, 12.0, 17.0, 9.0, 2.0, 6.0, 4.0, 3.0, 2.0, 8.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15338724851608276, -0.14796870946884155, -0.14255017042160034, -0.13713164627552032, -0.1317131072282791, -0.1262945681810379, -0.12087603658437729, -0.11545750498771667, -0.11003896594047546, -0.10462042689323425, -0.09920189529657364, -0.09378336369991302, -0.08836482465267181, -0.0829462856054306, -0.07752775400876999, -0.07210922241210938, -0.06669068336486816, -0.06127214804291725, -0.05585361272096634, -0.05043507739901543, -0.045016542077064514, -0.0395980067551136, -0.03417947143316269, -0.028760936111211777, -0.023342400789260864, -0.017923865467309952, -0.01250533014535904, -0.007086794823408127, -0.0016682595014572144, 0.003750275820493698, 0.00916881114244461, 0.014587346464395523, 0.020005881786346436, 0.025424417108297348, 0.03084295243024826, 0.03626148775219917, 0.041680023074150085, 0.047098558396101, 0.05251709371805191, 0.05793562904000282, 0.06335416436195374, 0.06877270340919495, 0.07419123500585556, 0.07960976660251617, 0.08502830564975739, 0.0904468446969986, 0.09586537629365921, 0.10128390789031982, 0.10670244693756104, 0.11212098598480225, 0.11753951758146286, 0.12295804917812347, 0.12837658822536469, 0.1337951272726059, 0.1392136514186859, 0.14463219046592712, 0.15005072951316833, 0.15546926856040955, 0.16088780760765076, 0.16630633175373077, 0.17172487080097198, 0.1771434098482132, 0.1825619339942932, 0.18798047304153442, 0.19339901208877563]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 9.0, 14.0, 23.0, 23.0, 25.0, 32.0, 55.0, 83.0, 134.0, 237.0, 378.0, 694.0, 1330.0, 2911.0, 7288.0, 24710.0, 253671.0, 3828491.0, 52988.0, 12237.0, 4332.0, 1963.0, 997.0, 573.0, 358.0, 213.0, 150.0, 104.0, 69.0, 57.0, 33.0, 26.0, 14.0, 15.0, 11.0, 7.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044464111328125, -0.04308462142944336, -0.04170513153076172, -0.04032564163208008, -0.03894615173339844, -0.0375666618347168, -0.036187171936035156, -0.034807682037353516, -0.033428192138671875, -0.032048702239990234, -0.030669212341308594, -0.029289722442626953, -0.027910232543945312, -0.026530742645263672, -0.02515125274658203, -0.02377176284790039, -0.02239227294921875, -0.02101278305053711, -0.01963329315185547, -0.018253803253173828, -0.016874313354492188, -0.015494823455810547, -0.014115333557128906, -0.012735843658447266, -0.011356353759765625, -0.009976863861083984, -0.008597373962402344, -0.007217884063720703, -0.0058383941650390625, -0.004458904266357422, -0.0030794143676757812, -0.0016999244689941406, -0.0003204345703125, 0.0010590553283691406, 0.0024385452270507812, 0.003818035125732422, 0.0051975250244140625, 0.006577014923095703, 0.007956504821777344, 0.009335994720458984, 0.010715484619140625, 0.012094974517822266, 0.013474464416503906, 0.014853954315185547, 0.016233444213867188, 0.017612934112548828, 0.01899242401123047, 0.02037191390991211, 0.02175140380859375, 0.02313089370727539, 0.02451038360595703, 0.025889873504638672, 0.027269363403320312, 0.028648853302001953, 0.030028343200683594, 0.031407833099365234, 0.032787322998046875, 0.034166812896728516, 0.035546302795410156, 0.0369257926940918, 0.03830528259277344, 0.03968477249145508, 0.04106426239013672, 0.04244375228881836, 0.0438232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 12.0, 10.0, 23.0, 28.0, 49.0, 46.0, 70.0, 65.0, 76.0, 87.0, 102.0, 88.0, 72.0, 74.0, 58.0, 37.0, 23.0, 19.0, 11.0, 14.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203399658203125, -0.019743680953979492, -0.019147396087646484, -0.018551111221313477, -0.01795482635498047, -0.01735854148864746, -0.016762256622314453, -0.016165971755981445, -0.015569686889648438, -0.01497340202331543, -0.014377117156982422, -0.013780832290649414, -0.013184547424316406, -0.012588262557983398, -0.01199197769165039, -0.011395692825317383, -0.010799407958984375, -0.010203123092651367, -0.00960683822631836, -0.009010553359985352, -0.008414268493652344, -0.007817983627319336, -0.007221698760986328, -0.00662541389465332, -0.0060291290283203125, -0.005432844161987305, -0.004836559295654297, -0.004240274429321289, -0.0036439895629882812, -0.0030477046966552734, -0.0024514198303222656, -0.0018551349639892578, -0.00125885009765625, -0.0006625652313232422, -6.628036499023438e-05, 0.0005300045013427734, 0.0011262893676757812, 0.001722574234008789, 0.002318859100341797, 0.0029151439666748047, 0.0035114288330078125, 0.00410771369934082, 0.004703998565673828, 0.005300283432006836, 0.005896568298339844, 0.0064928531646728516, 0.007089138031005859, 0.007685422897338867, 0.008281707763671875, 0.008877992630004883, 0.00947427749633789, 0.010070562362670898, 0.010666847229003906, 0.011263132095336914, 0.011859416961669922, 0.01245570182800293, 0.013051986694335938, 0.013648271560668945, 0.014244556427001953, 0.014840841293334961, 0.015437126159667969, 0.016033411026000977, 0.016629695892333984, 0.017225980758666992, 0.017822265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 5.0, 12.0, 25.0, 42.0, 62.0, 108.0, 198.0, 389.0, 789.0, 2125.0, 8153.0, 68797.0, 4033029.0, 68810.0, 8025.0, 2091.0, 806.0, 394.0, 187.0, 91.0, 68.0, 29.0, 14.0, 12.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048828125, -0.04727792739868164, -0.04572772979736328, -0.04417753219604492, -0.04262733459472656, -0.0410771369934082, -0.039526939392089844, -0.037976741790771484, -0.036426544189453125, -0.034876346588134766, -0.033326148986816406, -0.03177595138549805, -0.030225753784179688, -0.028675556182861328, -0.02712535858154297, -0.02557516098022461, -0.02402496337890625, -0.02247476577758789, -0.02092456817626953, -0.019374370574951172, -0.017824172973632812, -0.016273975372314453, -0.014723777770996094, -0.013173580169677734, -0.011623382568359375, -0.010073184967041016, -0.008522987365722656, -0.006972789764404297, -0.0054225921630859375, -0.003872394561767578, -0.0023221969604492188, -0.0007719993591308594, 0.0007781982421875, 0.0023283958435058594, 0.0038785934448242188, 0.005428791046142578, 0.0069789886474609375, 0.008529186248779297, 0.010079383850097656, 0.011629581451416016, 0.013179779052734375, 0.014729976654052734, 0.016280174255371094, 0.017830371856689453, 0.019380569458007812, 0.020930767059326172, 0.02248096466064453, 0.02403116226196289, 0.02558135986328125, 0.02713155746459961, 0.02868175506591797, 0.030231952667236328, 0.03178215026855469, 0.03333234786987305, 0.034882545471191406, 0.036432743072509766, 0.037982940673828125, 0.039533138275146484, 0.041083335876464844, 0.0426335334777832, 0.04418373107910156, 0.04573392868041992, 0.04728412628173828, 0.04883432388305664, 0.050384521484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 10.0, 17.0, 40.0, 39.0, 152.0, 2322.0, 1246.0, 126.0, 48.0, 25.0, 13.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019561767578125, -0.018626689910888672, -0.017691612243652344, -0.016756534576416016, -0.015821456909179688, -0.01488637924194336, -0.013951301574707031, -0.013016223907470703, -0.012081146240234375, -0.011146068572998047, -0.010210990905761719, -0.00927591323852539, -0.008340835571289062, -0.007405757904052734, -0.006470680236816406, -0.005535602569580078, -0.00460052490234375, -0.003665447235107422, -0.0027303695678710938, -0.0017952919006347656, -0.0008602142333984375, 7.486343383789062e-05, 0.0010099411010742188, 0.0019450187683105469, 0.002880096435546875, 0.003815174102783203, 0.004750251770019531, 0.005685329437255859, 0.0066204071044921875, 0.007555484771728516, 0.008490562438964844, 0.009425640106201172, 0.0103607177734375, 0.011295795440673828, 0.012230873107910156, 0.013165950775146484, 0.014101028442382812, 0.01503610610961914, 0.01597118377685547, 0.016906261444091797, 0.017841339111328125, 0.018776416778564453, 0.01971149444580078, 0.02064657211303711, 0.021581649780273438, 0.022516727447509766, 0.023451805114746094, 0.024386882781982422, 0.02532196044921875, 0.026257038116455078, 0.027192115783691406, 0.028127193450927734, 0.029062271118164062, 0.02999734878540039, 0.03093242645263672, 0.03186750411987305, 0.032802581787109375, 0.0337376594543457, 0.03467273712158203, 0.03560781478881836, 0.03654289245605469, 0.037477970123291016, 0.038413047790527344, 0.03934812545776367, 0.040283203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 49.0, 731.0, 196.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08888839185237885, -0.07727264612913132, -0.06565690040588379, -0.05404115468263626, -0.04242540895938873, -0.030809663236141205, -0.019193917512893677, -0.007578171789646149, 0.004037573933601379, 0.015653319656848907, 0.027269065380096436, 0.038884811103343964, 0.05050055682659149, 0.06211630254983902, 0.07373204827308655, 0.08534779399633408, 0.0969635397195816, 0.10857928544282913, 0.12019503116607666, 0.13181078433990479, 0.14342652261257172, 0.15504226088523865, 0.16665801405906677, 0.1782737672328949, 0.18988950550556183, 0.20150524377822876, 0.21312099695205688, 0.224736750125885, 0.23635248839855194, 0.24796822667121887, 0.259583979845047, 0.2711997330188751, 0.28281545639038086, 0.294431209564209, 0.3060469627380371, 0.31766268610954285, 0.32927843928337097, 0.3408941924571991, 0.35250991582870483, 0.36412566900253296, 0.3757414221763611, 0.3873571753501892, 0.39897292852401733, 0.41058865189552307, 0.4222044050693512, 0.4338201582431793, 0.44543588161468506, 0.4570516347885132, 0.4686673879623413, 0.48028314113616943, 0.49189889430999756, 0.5035146474838257, 0.5151304006576538, 0.5267460942268372, 0.5383618474006653, 0.5499776005744934, 0.5615933537483215, 0.5732091069221497, 0.5848248600959778, 0.5964406132698059, 0.6080563068389893, 0.6196720600128174, 0.6312878131866455, 0.6429035663604736, 0.6545193195343018]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 14.0, 11.0, 26.0, 32.0, 31.0, 61.0, 63.0, 64.0, 84.0, 96.0, 86.0, 73.0, 81.0, 75.0, 49.0, 45.0, 28.0, 18.0, 19.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07468616962432861, -0.0723508894443512, -0.07001560926437378, -0.06768032908439636, -0.06534504890441895, -0.06300976127386093, -0.060674481093883514, -0.0583392009139061, -0.05600392073392868, -0.05366864055395126, -0.051333360373973846, -0.04899807646870613, -0.046662796288728714, -0.0443275161087513, -0.04199223220348358, -0.039656952023506165, -0.03732167184352875, -0.03498639166355133, -0.032651111483573914, -0.030315827578306198, -0.02798054739832878, -0.025645267218351364, -0.023309985175728798, -0.02097470313310623, -0.018639422953128815, -0.016304142773151398, -0.013968860730528831, -0.01163357961922884, -0.009298298507928848, -0.006963017396628857, -0.004627736285328865, -0.002292454242706299, 4.2825937271118164e-05, 0.0023781070485711098, 0.004713388159871101, 0.007048669271171093, 0.009383950382471085, 0.011719231493771076, 0.014054512605071068, 0.016389794647693634, 0.01872507482767105, 0.021060355007648468, 0.023395637050271034, 0.0257309190928936, 0.028066199272871017, 0.030401479452848434, 0.03273676335811615, 0.03507204353809357, 0.037407323718070984, 0.0397426038980484, 0.04207788407802582, 0.04441316798329353, 0.04674844816327095, 0.04908372834324837, 0.05141901224851608, 0.0537542924284935, 0.05608957260847092, 0.058424852788448334, 0.06076013296842575, 0.06309541314840317, 0.06543070077896118, 0.0677659809589386, 0.07010126113891602, 0.07243654131889343, 0.07477182149887085]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 17.0, 25.0, 44.0, 74.0, 132.0, 253.0, 611.0, 1910.0, 8288.0, 83529.0, 743592.0, 190995.0, 14809.0, 2800.0, 809.0, 325.0, 135.0, 77.0, 35.0, 25.0, 14.0, 11.0, 5.0, 3.0, 4.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05474853515625, -0.053212642669677734, -0.05167675018310547, -0.0501408576965332, -0.04860496520996094, -0.04706907272338867, -0.045533180236816406, -0.04399728775024414, -0.042461395263671875, -0.04092550277709961, -0.039389610290527344, -0.03785371780395508, -0.03631782531738281, -0.03478193283081055, -0.03324604034423828, -0.031710147857666016, -0.03017425537109375, -0.028638362884521484, -0.02710247039794922, -0.025566577911376953, -0.024030685424804688, -0.022494792938232422, -0.020958900451660156, -0.01942300796508789, -0.017887115478515625, -0.01635122299194336, -0.014815330505371094, -0.013279438018798828, -0.011743545532226562, -0.010207653045654297, -0.008671760559082031, -0.007135868072509766, -0.0055999755859375, -0.004064083099365234, -0.0025281906127929688, -0.0009922981262207031, 0.0005435943603515625, 0.002079486846923828, 0.0036153793334960938, 0.005151271820068359, 0.006687164306640625, 0.00822305679321289, 0.009758949279785156, 0.011294841766357422, 0.012830734252929688, 0.014366626739501953, 0.01590251922607422, 0.017438411712646484, 0.01897430419921875, 0.020510196685791016, 0.02204608917236328, 0.023581981658935547, 0.025117874145507812, 0.026653766632080078, 0.028189659118652344, 0.02972555160522461, 0.031261444091796875, 0.03279733657836914, 0.034333229064941406, 0.03586912155151367, 0.03740501403808594, 0.0389409065246582, 0.04047679901123047, 0.042012691497802734, 0.043548583984375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 12.0, 13.0, 14.0, 29.0, 41.0, 43.0, 55.0, 82.0, 70.0, 76.0, 104.0, 85.0, 73.0, 69.0, 61.0, 53.0, 40.0, 21.0, 14.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205535888671875, -0.019941091537475586, -0.019328594207763672, -0.018716096878051758, -0.018103599548339844, -0.01749110221862793, -0.016878604888916016, -0.0162661075592041, -0.015653610229492188, -0.015041112899780273, -0.01442861557006836, -0.013816118240356445, -0.013203620910644531, -0.012591123580932617, -0.011978626251220703, -0.011366128921508789, -0.010753631591796875, -0.010141134262084961, -0.009528636932373047, -0.008916139602661133, -0.008303642272949219, -0.007691144943237305, -0.007078647613525391, -0.0064661502838134766, -0.0058536529541015625, -0.0052411556243896484, -0.004628658294677734, -0.00401616096496582, -0.0034036636352539062, -0.002791166305541992, -0.002178668975830078, -0.001566171646118164, -0.00095367431640625, -0.00034117698669433594, 0.0002713203430175781, 0.0008838176727294922, 0.0014963150024414062, 0.0021088123321533203, 0.0027213096618652344, 0.0033338069915771484, 0.0039463043212890625, 0.0045588016510009766, 0.005171298980712891, 0.005783796310424805, 0.006396293640136719, 0.007008790969848633, 0.007621288299560547, 0.008233785629272461, 0.008846282958984375, 0.009458780288696289, 0.010071277618408203, 0.010683774948120117, 0.011296272277832031, 0.011908769607543945, 0.01252126693725586, 0.013133764266967773, 0.013746261596679688, 0.014358758926391602, 0.014971256256103516, 0.01558375358581543, 0.016196250915527344, 0.016808748245239258, 0.017421245574951172, 0.018033742904663086, 0.018646240234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 7.0, 3.0, 4.0, 9.0, 9.0, 11.0, 20.0, 24.0, 46.0, 58.0, 79.0, 110.0, 160.0, 236.0, 387.0, 739.0, 1846.0, 8723.0, 85938.0, 781398.0, 151308.0, 12966.0, 2407.0, 834.0, 375.0, 274.0, 197.0, 120.0, 71.0, 56.0, 43.0, 33.0, 21.0, 10.0, 10.0, 8.0, 10.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.03493022918701172, -0.03378868103027344, -0.032647132873535156, -0.031505584716796875, -0.030364036560058594, -0.029222488403320312, -0.02808094024658203, -0.02693939208984375, -0.02579784393310547, -0.024656295776367188, -0.023514747619628906, -0.022373199462890625, -0.021231651306152344, -0.020090103149414062, -0.01894855499267578, -0.0178070068359375, -0.01666545867919922, -0.015523910522460938, -0.014382362365722656, -0.013240814208984375, -0.012099266052246094, -0.010957717895507812, -0.009816169738769531, -0.00867462158203125, -0.007533073425292969, -0.0063915252685546875, -0.005249977111816406, -0.004108428955078125, -0.0029668807983398438, -0.0018253326416015625, -0.0006837844848632812, 0.000457763671875, 0.0015993118286132812, 0.0027408599853515625, 0.0038824081420898438, 0.005023956298828125, 0.006165504455566406, 0.0073070526123046875, 0.008448600769042969, 0.00959014892578125, 0.010731697082519531, 0.011873245239257812, 0.013014793395996094, 0.014156341552734375, 0.015297889709472656, 0.016439437866210938, 0.01758098602294922, 0.0187225341796875, 0.01986408233642578, 0.021005630493164062, 0.022147178649902344, 0.023288726806640625, 0.024430274963378906, 0.025571823120117188, 0.02671337127685547, 0.02785491943359375, 0.02899646759033203, 0.030138015747070312, 0.031279563903808594, 0.032421112060546875, 0.033562660217285156, 0.03470420837402344, 0.03584575653076172, 0.0369873046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 14.0, 9.0, 14.0, 16.0, 24.0, 27.0, 21.0, 35.0, 36.0, 37.0, 47.0, 40.0, 49.0, 42.0, 58.0, 51.0, 52.0, 48.0, 39.0, 52.0, 25.0, 38.0, 40.0, 31.0, 23.0, 21.0, 19.0, 11.0, 9.0, 8.0, 10.0, 4.0, 2.0, 10.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04486083984375, -0.04352569580078125, -0.0421905517578125, -0.04085540771484375, -0.039520263671875, -0.03818511962890625, -0.0368499755859375, -0.03551483154296875, -0.0341796875, -0.03284454345703125, -0.0315093994140625, -0.03017425537109375, -0.028839111328125, -0.02750396728515625, -0.0261688232421875, -0.02483367919921875, -0.02349853515625, -0.02216339111328125, -0.0208282470703125, -0.01949310302734375, -0.018157958984375, -0.01682281494140625, -0.0154876708984375, -0.01415252685546875, -0.0128173828125, -0.01148223876953125, -0.0101470947265625, -0.00881195068359375, -0.007476806640625, -0.00614166259765625, -0.0048065185546875, -0.00347137451171875, -0.00213623046875, -0.00080108642578125, 0.0005340576171875, 0.00186920166015625, 0.003204345703125, 0.00453948974609375, 0.0058746337890625, 0.00720977783203125, 0.008544921875, 0.00988006591796875, 0.0112152099609375, 0.01255035400390625, 0.013885498046875, 0.01522064208984375, 0.0165557861328125, 0.01789093017578125, 0.01922607421875, 0.02056121826171875, 0.0218963623046875, 0.02323150634765625, 0.024566650390625, 0.02590179443359375, 0.0272369384765625, 0.02857208251953125, 0.0299072265625, 0.03124237060546875, 0.0325775146484375, 0.03391265869140625, 0.035247802734375, 0.03658294677734375, 0.0379180908203125, 0.03925323486328125, 0.04058837890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 14.0, 18.0, 29.0, 70.0, 125.0, 248.0, 505.0, 1204.0, 3420.0, 13673.0, 89159.0, 744466.0, 168023.0, 20061.0, 4730.0, 1557.0, 618.0, 281.0, 158.0, 74.0, 40.0, 28.0, 13.0, 10.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01313018798828125, -0.012714982032775879, -0.012299776077270508, -0.011884570121765137, -0.011469364166259766, -0.011054158210754395, -0.010638952255249023, -0.010223746299743652, -0.009808540344238281, -0.00939333438873291, -0.008978128433227539, -0.008562922477722168, -0.008147716522216797, -0.007732510566711426, -0.007317304611206055, -0.006902098655700684, -0.0064868927001953125, -0.006071686744689941, -0.00565648078918457, -0.005241274833679199, -0.004826068878173828, -0.004410862922668457, -0.003995656967163086, -0.003580451011657715, -0.0031652450561523438, -0.0027500391006469727, -0.0023348331451416016, -0.0019196271896362305, -0.0015044212341308594, -0.0010892152786254883, -0.0006740093231201172, -0.0002588033676147461, 0.000156402587890625, 0.0005716085433959961, 0.0009868144989013672, 0.0014020204544067383, 0.0018172264099121094, 0.0022324323654174805, 0.0026476383209228516, 0.0030628442764282227, 0.0034780502319335938, 0.003893256187438965, 0.004308462142944336, 0.004723668098449707, 0.005138874053955078, 0.005554080009460449, 0.00596928596496582, 0.006384491920471191, 0.0067996978759765625, 0.007214903831481934, 0.007630109786987305, 0.008045315742492676, 0.008460521697998047, 0.008875727653503418, 0.009290933609008789, 0.00970613956451416, 0.010121345520019531, 0.010536551475524902, 0.010951757431030273, 0.011366963386535645, 0.011782169342041016, 0.012197375297546387, 0.012612581253051758, 0.013027787208557129, 0.0134429931640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 11.0, 12.0, 26.0, 24.0, 70.0, 105.0, 136.0, 157.0, 163.0, 118.0, 61.0, 39.0, 30.0, 18.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.890296936035156e-05, -6.598234176635742e-05, -6.306171417236328e-05, -6.014108657836914e-05, -5.7220458984375e-05, -5.429983139038086e-05, -5.137920379638672e-05, -4.845857620239258e-05, -4.553794860839844e-05, -4.26173210144043e-05, -3.9696693420410156e-05, -3.6776065826416016e-05, -3.3855438232421875e-05, -3.0934810638427734e-05, -2.8014183044433594e-05, -2.5093555450439453e-05, -2.2172927856445312e-05, -1.9252300262451172e-05, -1.633167266845703e-05, -1.341104507446289e-05, -1.049041748046875e-05, -7.569789886474609e-06, -4.649162292480469e-06, -1.7285346984863281e-06, 1.1920928955078125e-06, 4.112720489501953e-06, 7.033348083496094e-06, 9.953975677490234e-06, 1.2874603271484375e-05, 1.5795230865478516e-05, 1.8715858459472656e-05, 2.1636486053466797e-05, 2.4557113647460938e-05, 2.7477741241455078e-05, 3.039836883544922e-05, 3.331899642944336e-05, 3.62396240234375e-05, 3.916025161743164e-05, 4.208087921142578e-05, 4.500150680541992e-05, 4.792213439941406e-05, 5.08427619934082e-05, 5.3763389587402344e-05, 5.6684017181396484e-05, 5.9604644775390625e-05, 6.252527236938477e-05, 6.54458999633789e-05, 6.836652755737305e-05, 7.128715515136719e-05, 7.420778274536133e-05, 7.712841033935547e-05, 8.004903793334961e-05, 8.296966552734375e-05, 8.589029312133789e-05, 8.881092071533203e-05, 9.173154830932617e-05, 9.465217590332031e-05, 9.757280349731445e-05, 0.0001004934310913086, 0.00010341405868530273, 0.00010633468627929688, 0.00010925531387329102, 0.00011217594146728516, 0.0001150965690612793]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 2.0, 6.0, 14.0, 15.0, 17.0, 37.0, 47.0, 71.0, 120.0, 169.0, 284.0, 487.0, 1025.0, 1938.0, 5067.0, 14481.0, 57215.0, 306557.0, 514346.0, 108699.0, 24721.0, 7619.0, 2759.0, 1265.0, 645.0, 358.0, 203.0, 134.0, 81.0, 55.0, 35.0, 21.0, 13.0, 11.0, 12.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00905609130859375, -0.008791327476501465, -0.00852656364440918, -0.008261799812316895, -0.00799703598022461, -0.007732272148132324, -0.007467508316040039, -0.007202744483947754, -0.006937980651855469, -0.006673216819763184, -0.0064084529876708984, -0.006143689155578613, -0.005878925323486328, -0.005614161491394043, -0.005349397659301758, -0.005084633827209473, -0.0048198699951171875, -0.004555106163024902, -0.004290342330932617, -0.004025578498840332, -0.003760814666748047, -0.0034960508346557617, -0.0032312870025634766, -0.0029665231704711914, -0.0027017593383789062, -0.002436995506286621, -0.002172231674194336, -0.0019074678421020508, -0.0016427040100097656, -0.0013779401779174805, -0.0011131763458251953, -0.0008484125137329102, -0.000583648681640625, -0.00031888484954833984, -5.412101745605469e-05, 0.00021064281463623047, 0.0004754066467285156, 0.0007401704788208008, 0.001004934310913086, 0.001269698143005371, 0.0015344619750976562, 0.0017992258071899414, 0.0020639896392822266, 0.0023287534713745117, 0.002593517303466797, 0.002858281135559082, 0.003123044967651367, 0.0033878087997436523, 0.0036525726318359375, 0.003917336463928223, 0.004182100296020508, 0.004446864128112793, 0.004711627960205078, 0.004976391792297363, 0.0052411556243896484, 0.005505919456481934, 0.005770683288574219, 0.006035447120666504, 0.006300210952758789, 0.006564974784851074, 0.006829738616943359, 0.0070945024490356445, 0.00735926628112793, 0.007624030113220215, 0.0078887939453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 10.0, 10.0, 21.0, 26.0, 59.0, 75.0, 82.0, 98.0, 106.0, 121.0, 89.0, 93.0, 67.0, 39.0, 29.0, 24.0, 10.0, 11.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016387939453125, -0.015978693962097168, -0.015569448471069336, -0.015160202980041504, -0.014750957489013672, -0.01434171199798584, -0.013932466506958008, -0.013523221015930176, -0.013113975524902344, -0.012704730033874512, -0.01229548454284668, -0.011886239051818848, -0.011476993560791016, -0.011067748069763184, -0.010658502578735352, -0.01024925708770752, -0.009840011596679688, -0.009430766105651855, -0.009021520614624023, -0.008612275123596191, -0.00820302963256836, -0.007793784141540527, -0.007384538650512695, -0.006975293159484863, -0.006566047668457031, -0.006156802177429199, -0.005747556686401367, -0.005338311195373535, -0.004929065704345703, -0.004519820213317871, -0.004110574722290039, -0.003701329231262207, -0.003292083740234375, -0.002882838249206543, -0.002473592758178711, -0.002064347267150879, -0.0016551017761230469, -0.0012458562850952148, -0.0008366107940673828, -0.0004273653030395508, -1.811981201171875e-05, 0.0003911256790161133, 0.0008003711700439453, 0.0012096166610717773, 0.0016188621520996094, 0.0020281076431274414, 0.0024373531341552734, 0.0028465986251831055, 0.0032558441162109375, 0.0036650896072387695, 0.0040743350982666016, 0.004483580589294434, 0.004892826080322266, 0.005302071571350098, 0.00571131706237793, 0.006120562553405762, 0.006529808044433594, 0.006939053535461426, 0.007348299026489258, 0.00775754451751709, 0.008166790008544922, 0.008576035499572754, 0.008985280990600586, 0.009394526481628418, 0.00980377197265625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 13.0, 42.0, 153.0, 286.0, 297.0, 144.0, 43.0, 18.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31041884422302246, -0.2979366183280945, -0.2854543924331665, -0.2729721665382385, -0.26048994064331055, -0.24800771474838257, -0.2355254888534546, -0.2230432629585266, -0.21056103706359863, -0.19807881116867065, -0.18559658527374268, -0.1731143593788147, -0.16063213348388672, -0.14814990758895874, -0.13566768169403076, -0.12318544834852219, -0.11070321500301361, -0.09822098910808563, -0.08573876321315765, -0.07325653731822968, -0.0607743076980114, -0.04829208180308342, -0.03580985218286514, -0.023327626287937164, -0.010845400393009186, 0.0016368264332413673, 0.01411905325949192, 0.026601281017065048, 0.03908350691199303, 0.051565732806921005, 0.06404796242713928, 0.07653018832206726, 0.08901241421699524, 0.10149464011192322, 0.1139768660068512, 0.12645909190177917, 0.13894131779670715, 0.15142354369163513, 0.1639057695865631, 0.1763879954814911, 0.18887022137641907, 0.20135244727134705, 0.21383467316627502, 0.226316899061203, 0.23879912495613098, 0.25128135085105896, 0.26376357674598694, 0.2762458026409149, 0.2887280583381653, 0.30121028423309326, 0.31369251012802124, 0.3261747360229492, 0.3386569619178772, 0.3511391878128052, 0.36362141370773315, 0.37610363960266113, 0.3885858654975891, 0.4010680913925171, 0.41355031728744507, 0.42603254318237305, 0.438514769077301, 0.450996994972229, 0.463479220867157, 0.47596144676208496, 0.48844367265701294]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 8.0, 11.0, 13.0, 12.0, 15.0, 19.0, 20.0, 18.0, 22.0, 17.0, 25.0, 28.0, 29.0, 25.0, 20.0, 44.0, 41.0, 32.0, 43.0, 36.0, 40.0, 42.0, 39.0, 36.0, 46.0, 43.0, 33.0, 30.0, 19.0, 19.0, 22.0, 19.0, 21.0, 15.0, 11.0, 13.0, 14.0, 7.0, 9.0, 9.0, 6.0, 6.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.17645269632339478, -0.1709679812192917, -0.1654832810163498, -0.1599985659122467, -0.1545138657093048, -0.14902915060520172, -0.14354443550109863, -0.13805973529815674, -0.13257502019405365, -0.12709030508995056, -0.12160560488700867, -0.11612088978290558, -0.11063618212938309, -0.1051514744758606, -0.09966675937175751, -0.09418205171823502, -0.08869734406471252, -0.08321263641119003, -0.07772792875766754, -0.07224321365356445, -0.06675850600004196, -0.06127379834651947, -0.05578908696770668, -0.05030437558889389, -0.0448196679353714, -0.03933496028184891, -0.03385024890303612, -0.028365539386868477, -0.022880829870700836, -0.017396120354533195, -0.011911410838365555, -0.006426699459552765, -0.0009419918060302734, 0.004542717710137367, 0.010027427226305008, 0.015512136742472649, 0.02099684625864029, 0.02648155577480793, 0.03196626529097557, 0.03745097666978836, 0.04293568432331085, 0.048420391976833344, 0.05390510335564613, 0.05938981473445892, 0.06487452238798141, 0.0703592300415039, 0.075843945145607, 0.08132865279912949, 0.08681336045265198, 0.09229806810617447, 0.09778277575969696, 0.10326749086380005, 0.10875219851732254, 0.11423690617084503, 0.11972162127494812, 0.12520632147789001, 0.1306910365819931, 0.1361757516860962, 0.14166045188903809, 0.14714516699314117, 0.15262988209724426, 0.15811458230018616, 0.16359929740428925, 0.16908401250839233, 0.17456871271133423]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 3.0, 13.0, 18.0, 31.0, 39.0, 78.0, 148.0, 302.0, 567.0, 1443.0, 5075.0, 60219.0, 4101364.0, 19740.0, 3174.0, 1030.0, 417.0, 221.0, 125.0, 90.0, 39.0, 31.0, 15.0, 19.0, 8.0, 10.0, 5.0, 5.0, 7.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04119873046875, -0.0397944450378418, -0.038390159606933594, -0.03698587417602539, -0.03558158874511719, -0.034177303314208984, -0.03277301788330078, -0.03136873245239258, -0.029964447021484375, -0.028560161590576172, -0.02715587615966797, -0.025751590728759766, -0.024347305297851562, -0.02294301986694336, -0.021538734436035156, -0.020134449005126953, -0.01873016357421875, -0.017325878143310547, -0.015921592712402344, -0.01451730728149414, -0.013113021850585938, -0.011708736419677734, -0.010304450988769531, -0.008900165557861328, -0.007495880126953125, -0.006091594696044922, -0.004687309265136719, -0.0032830238342285156, -0.0018787384033203125, -0.0004744529724121094, 0.0009298324584960938, 0.002334117889404297, 0.0037384033203125, 0.005142688751220703, 0.006546974182128906, 0.00795125961303711, 0.009355545043945312, 0.010759830474853516, 0.012164115905761719, 0.013568401336669922, 0.014972686767578125, 0.016376972198486328, 0.01778125762939453, 0.019185543060302734, 0.020589828491210938, 0.02199411392211914, 0.023398399353027344, 0.024802684783935547, 0.02620697021484375, 0.027611255645751953, 0.029015541076660156, 0.03041982650756836, 0.03182411193847656, 0.033228397369384766, 0.03463268280029297, 0.03603696823120117, 0.037441253662109375, 0.03884553909301758, 0.04024982452392578, 0.041654109954833984, 0.04305839538574219, 0.04446268081665039, 0.045866966247558594, 0.0472712516784668, 0.048675537109375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 8.0, 7.0, 11.0, 19.0, 26.0, 35.0, 60.0, 59.0, 71.0, 87.0, 74.0, 89.0, 86.0, 72.0, 72.0, 54.0, 44.0, 30.0, 31.0, 15.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021148681640625, -0.02051544189453125, -0.0198822021484375, -0.01924896240234375, -0.01861572265625, -0.01798248291015625, -0.0173492431640625, -0.01671600341796875, -0.016082763671875, -0.01544952392578125, -0.0148162841796875, -0.01418304443359375, -0.0135498046875, -0.01291656494140625, -0.0122833251953125, -0.01165008544921875, -0.011016845703125, -0.01038360595703125, -0.0097503662109375, -0.00911712646484375, -0.00848388671875, -0.00785064697265625, -0.0072174072265625, -0.00658416748046875, -0.005950927734375, -0.00531768798828125, -0.0046844482421875, -0.00405120849609375, -0.00341796875, -0.00278472900390625, -0.0021514892578125, -0.00151824951171875, -0.000885009765625, -0.00025177001953125, 0.0003814697265625, 0.00101470947265625, 0.00164794921875, 0.00228118896484375, 0.0029144287109375, 0.00354766845703125, 0.004180908203125, 0.00481414794921875, 0.0054473876953125, 0.00608062744140625, 0.0067138671875, 0.00734710693359375, 0.0079803466796875, 0.00861358642578125, 0.009246826171875, 0.00988006591796875, 0.0105133056640625, 0.01114654541015625, 0.01177978515625, 0.01241302490234375, 0.0130462646484375, 0.01367950439453125, 0.014312744140625, 0.01494598388671875, 0.0155792236328125, 0.01621246337890625, 0.016845703125, 0.01747894287109375, 0.0181121826171875, 0.01874542236328125, 0.019378662109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 4.0, 7.0, 14.0, 19.0, 32.0, 31.0, 46.0, 70.0, 93.0, 125.0, 187.0, 282.0, 443.0, 740.0, 1387.0, 2849.0, 6785.0, 22561.0, 384559.0, 3726938.0, 31604.0, 8230.0, 3357.0, 1548.0, 860.0, 475.0, 307.0, 181.0, 146.0, 111.0, 71.0, 54.0, 44.0, 23.0, 30.0, 12.0, 9.0, 14.0, 7.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0162811279296875, -0.01575756072998047, -0.015233993530273438, -0.014710426330566406, -0.014186859130859375, -0.013663291931152344, -0.013139724731445312, -0.012616157531738281, -0.01209259033203125, -0.011569023132324219, -0.011045455932617188, -0.010521888732910156, -0.009998321533203125, -0.009474754333496094, -0.008951187133789062, -0.008427619934082031, -0.007904052734375, -0.007380485534667969, -0.0068569183349609375, -0.006333351135253906, -0.005809783935546875, -0.005286216735839844, -0.0047626495361328125, -0.004239082336425781, -0.00371551513671875, -0.0031919479370117188, -0.0026683807373046875, -0.0021448135375976562, -0.001621246337890625, -0.0010976791381835938, -0.0005741119384765625, -5.054473876953125e-05, 0.0004730224609375, 0.0009965896606445312, 0.0015201568603515625, 0.0020437240600585938, 0.002567291259765625, 0.0030908584594726562, 0.0036144256591796875, 0.004137992858886719, 0.00466156005859375, 0.005185127258300781, 0.0057086944580078125, 0.006232261657714844, 0.006755828857421875, 0.007279396057128906, 0.0078029632568359375, 0.008326530456542969, 0.00885009765625, 0.009373664855957031, 0.009897232055664062, 0.010420799255371094, 0.010944366455078125, 0.011467933654785156, 0.011991500854492188, 0.012515068054199219, 0.01303863525390625, 0.013562202453613281, 0.014085769653320312, 0.014609336853027344, 0.015132904052734375, 0.015656471252441406, 0.016180038452148438, 0.01670360565185547, 0.0172271728515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 6.0, 5.0, 8.0, 14.0, 23.0, 54.0, 155.0, 3149.0, 457.0, 105.0, 37.0, 14.0, 7.0, 12.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00331878662109375, -0.003185272216796875, -0.0030517578125, -0.002918243408203125, -0.00278472900390625, -0.002651214599609375, -0.0025177001953125, -0.002384185791015625, -0.00225067138671875, -0.002117156982421875, -0.001983642578125, -0.001850128173828125, -0.00171661376953125, -0.001583099365234375, -0.0014495849609375, -0.001316070556640625, -0.00118255615234375, -0.001049041748046875, -0.00091552734375, -0.000782012939453125, -0.00064849853515625, -0.000514984130859375, -0.0003814697265625, -0.000247955322265625, -0.00011444091796875, 1.9073486328125e-05, 0.000152587890625, 0.000286102294921875, 0.00041961669921875, 0.000553131103515625, 0.0006866455078125, 0.000820159912109375, 0.00095367431640625, 0.001087188720703125, 0.001220703125, 0.001354217529296875, 0.00148773193359375, 0.001621246337890625, 0.0017547607421875, 0.001888275146484375, 0.00202178955078125, 0.002155303955078125, 0.002288818359375, 0.002422332763671875, 0.00255584716796875, 0.002689361572265625, 0.0028228759765625, 0.002956390380859375, 0.00308990478515625, 0.003223419189453125, 0.00335693359375, 0.003490447998046875, 0.00362396240234375, 0.003757476806640625, 0.0038909912109375, 0.004024505615234375, 0.00415802001953125, 0.004291534423828125, 0.004425048828125, 0.004558563232421875, 0.00469207763671875, 0.004825592041015625, 0.0049591064453125, 0.005092620849609375, 0.00522613525390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 10.0, 16.0, 53.0, 95.0, 149.0, 191.0, 189.0, 139.0, 67.0, 46.0, 14.0, 15.0, 8.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020072799175977707, -0.019483080133795738, -0.01889336109161377, -0.0183036420494318, -0.017713923007249832, -0.017124203965067863, -0.016534484922885895, -0.015944765880703926, -0.015355046838521957, -0.014765327796339989, -0.01417560875415802, -0.013585889711976051, -0.012996170669794083, -0.012406451627612114, -0.011816732585430145, -0.011227013543248177, -0.010637293569743633, -0.010047574527561665, -0.009457855485379696, -0.008868136443197727, -0.008278417401015759, -0.00768869835883379, -0.007098978850990534, -0.006509259808808565, -0.0059195407666265965, -0.005329821724444628, -0.004740102682262659, -0.004150383174419403, -0.003560664365068078, -0.0029709453228861094, -0.002381226047873497, -0.0017915070056915283, -0.0012017879635095596, -0.00061206886311993, -2.2349762730300426e-05, 0.0005673693958669901, 0.0011570884380489588, 0.0017468074802309275, 0.00233652675524354, 0.0029262457974255085, 0.003515964839607477, 0.004105683881789446, 0.0046954029239714146, 0.0052851224318146706, 0.005874841473996639, 0.006464560516178608, 0.007054279558360577, 0.007643998600542545, 0.008233717642724514, 0.008823436684906483, 0.009413155727088451, 0.01000287476927042, 0.010592593811452389, 0.011182312853634357, 0.0117720328271389, 0.01236175186932087, 0.012951470911502838, 0.013541189953684807, 0.014130908995866776, 0.014720628038048744, 0.015310347080230713, 0.01590006612241268, 0.01648978516459465, 0.01707950420677662, 0.017669223248958588]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 8.0, 4.0, 13.0, 8.0, 15.0, 12.0, 14.0, 22.0, 23.0, 26.0, 33.0, 40.0, 42.0, 40.0, 40.0, 41.0, 46.0, 37.0, 44.0, 48.0, 37.0, 50.0, 38.0, 58.0, 31.0, 34.0, 27.0, 18.0, 30.0, 23.0, 20.0, 20.0, 14.0, 8.0, 7.0, 5.0, 3.0, 10.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.007131099700927734, -0.006917395628988743, -0.006703691557049751, -0.00648998748511076, -0.006276283413171768, -0.006062579341232777, -0.005848875269293785, -0.0056351711973547935, -0.005421467125415802, -0.0052077630534768105, -0.004994058981537819, -0.004780354909598827, -0.004566650837659836, -0.004352946765720844, -0.004139242693781853, -0.003925538621842861, -0.0037118345499038696, -0.003498130477964878, -0.0032844264060258865, -0.003070722334086895, -0.0028570182621479034, -0.002643314190208912, -0.0024296101182699203, -0.002215906046330929, -0.0020022019743919373, -0.0017884979024529457, -0.0015747938305139542, -0.0013610897585749626, -0.001147385686635971, -0.0009336816146969795, -0.000719977542757988, -0.0005062734708189964, -0.0002925693988800049, -7.886532694101334e-05, 0.0001348387449979782, 0.00034854281693696976, 0.0005622468888759613, 0.0007759509608149529, 0.0009896550327539444, 0.001203359104692936, 0.0014170631766319275, 0.001630767248570919, 0.0018444713205099106, 0.002058175392448902, 0.0022718794643878937, 0.0024855835363268852, 0.0026992876082658768, 0.0029129916802048683, 0.00312669575214386, 0.0033403998240828514, 0.003554103896021843, 0.0037678079679608345, 0.003981512039899826, 0.004195216111838818, 0.004408920183777809, 0.004622624255716801, 0.004836328327655792, 0.005050032399594784, 0.005263736471533775, 0.005477440543472767, 0.005691144615411758, 0.00590484868735075, 0.0061185527592897415, 0.006332256831228733, 0.006545960903167725]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 3.0, 9.0, 16.0, 19.0, 36.0, 42.0, 100.0, 169.0, 416.0, 953.0, 3070.0, 14543.0, 114880.0, 635166.0, 244675.0, 27205.0, 4820.0, 1346.0, 559.0, 232.0, 108.0, 61.0, 42.0, 25.0, 9.0, 9.0, 9.0, 0.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.033294677734375, -0.03224325180053711, -0.03119182586669922, -0.030140399932861328, -0.029088973999023438, -0.028037548065185547, -0.026986122131347656, -0.025934696197509766, -0.024883270263671875, -0.023831844329833984, -0.022780418395996094, -0.021728992462158203, -0.020677566528320312, -0.019626140594482422, -0.01857471466064453, -0.01752328872680664, -0.01647186279296875, -0.01542043685913086, -0.014369010925292969, -0.013317584991455078, -0.012266159057617188, -0.011214733123779297, -0.010163307189941406, -0.009111881256103516, -0.008060455322265625, -0.007009029388427734, -0.005957603454589844, -0.004906177520751953, -0.0038547515869140625, -0.002803325653076172, -0.0017518997192382812, -0.0007004737854003906, 0.0003509521484375, 0.0014023780822753906, 0.0024538040161132812, 0.003505229949951172, 0.0045566558837890625, 0.005608081817626953, 0.006659507751464844, 0.007710933685302734, 0.008762359619140625, 0.009813785552978516, 0.010865211486816406, 0.011916637420654297, 0.012968063354492188, 0.014019489288330078, 0.015070915222167969, 0.01612234115600586, 0.01717376708984375, 0.01822519302368164, 0.01927661895751953, 0.020328044891357422, 0.021379470825195312, 0.022430896759033203, 0.023482322692871094, 0.024533748626708984, 0.025585174560546875, 0.026636600494384766, 0.027688026428222656, 0.028739452362060547, 0.029790878295898438, 0.030842304229736328, 0.03189373016357422, 0.03294515609741211, 0.03399658203125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 11.0, 5.0, 12.0, 17.0, 26.0, 47.0, 42.0, 63.0, 72.0, 80.0, 78.0, 86.0, 93.0, 79.0, 58.0, 52.0, 48.0, 29.0, 36.0, 18.0, 9.0, 5.0, 9.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02117919921875, -0.020545482635498047, -0.019911766052246094, -0.01927804946899414, -0.018644332885742188, -0.018010616302490234, -0.01737689971923828, -0.016743183135986328, -0.016109466552734375, -0.015475749969482422, -0.014842033386230469, -0.014208316802978516, -0.013574600219726562, -0.01294088363647461, -0.012307167053222656, -0.011673450469970703, -0.01103973388671875, -0.010406017303466797, -0.009772300720214844, -0.00913858413696289, -0.008504867553710938, -0.007871150970458984, -0.007237434387207031, -0.006603717803955078, -0.005970001220703125, -0.005336284637451172, -0.004702568054199219, -0.004068851470947266, -0.0034351348876953125, -0.0028014183044433594, -0.0021677017211914062, -0.0015339851379394531, -0.0009002685546875, -0.0002665519714355469, 0.00036716461181640625, 0.0010008811950683594, 0.0016345977783203125, 0.0022683143615722656, 0.0029020309448242188, 0.003535747528076172, 0.004169464111328125, 0.004803180694580078, 0.005436897277832031, 0.006070613861083984, 0.0067043304443359375, 0.007338047027587891, 0.007971763610839844, 0.008605480194091797, 0.00923919677734375, 0.009872913360595703, 0.010506629943847656, 0.01114034652709961, 0.011774063110351562, 0.012407779693603516, 0.013041496276855469, 0.013675212860107422, 0.014308929443359375, 0.014942646026611328, 0.015576362609863281, 0.016210079193115234, 0.016843795776367188, 0.01747751235961914, 0.018111228942871094, 0.018744945526123047, 0.019378662109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 7.0, 9.0, 14.0, 22.0, 20.0, 33.0, 45.0, 60.0, 76.0, 108.0, 167.0, 200.0, 315.0, 556.0, 1150.0, 4610.0, 33096.0, 424499.0, 532840.0, 42400.0, 5430.0, 1231.0, 580.0, 302.0, 210.0, 148.0, 114.0, 75.0, 60.0, 44.0, 36.0, 24.0, 19.0, 15.0, 8.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02801513671875, -0.02708292007446289, -0.02615070343017578, -0.025218486785888672, -0.024286270141601562, -0.023354053497314453, -0.022421836853027344, -0.021489620208740234, -0.020557403564453125, -0.019625186920166016, -0.018692970275878906, -0.017760753631591797, -0.016828536987304688, -0.015896320343017578, -0.014964103698730469, -0.01403188705444336, -0.01309967041015625, -0.01216745376586914, -0.011235237121582031, -0.010303020477294922, -0.009370803833007812, -0.008438587188720703, -0.007506370544433594, -0.006574153900146484, -0.005641937255859375, -0.004709720611572266, -0.0037775039672851562, -0.002845287322998047, -0.0019130706787109375, -0.0009808540344238281, -4.863739013671875e-05, 0.0008835792541503906, 0.0018157958984375, 0.0027480125427246094, 0.0036802291870117188, 0.004612445831298828, 0.0055446624755859375, 0.006476879119873047, 0.007409095764160156, 0.008341312408447266, 0.009273529052734375, 0.010205745697021484, 0.011137962341308594, 0.012070178985595703, 0.013002395629882812, 0.013934612274169922, 0.014866828918457031, 0.01579904556274414, 0.01673126220703125, 0.01766347885131836, 0.01859569549560547, 0.019527912139892578, 0.020460128784179688, 0.021392345428466797, 0.022324562072753906, 0.023256778717041016, 0.024188995361328125, 0.025121212005615234, 0.026053428649902344, 0.026985645294189453, 0.027917861938476562, 0.028850078582763672, 0.02978229522705078, 0.03071451187133789, 0.031646728515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 13.0, 8.0, 7.0, 14.0, 20.0, 17.0, 24.0, 27.0, 23.0, 39.0, 38.0, 37.0, 43.0, 50.0, 41.0, 41.0, 54.0, 51.0, 50.0, 50.0, 44.0, 47.0, 26.0, 41.0, 27.0, 24.0, 24.0, 22.0, 22.0, 17.0, 11.0, 6.0, 6.0, 6.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.038254737854003906, -0.03689765930175781, -0.03554058074951172, -0.034183502197265625, -0.03282642364501953, -0.03146934509277344, -0.030112266540527344, -0.02875518798828125, -0.027398109436035156, -0.026041030883789062, -0.02468395233154297, -0.023326873779296875, -0.02196979522705078, -0.020612716674804688, -0.019255638122558594, -0.0178985595703125, -0.016541481018066406, -0.015184402465820312, -0.013827323913574219, -0.012470245361328125, -0.011113166809082031, -0.009756088256835938, -0.008399009704589844, -0.00704193115234375, -0.005684852600097656, -0.0043277740478515625, -0.0029706954956054688, -0.001613616943359375, -0.00025653839111328125, 0.0011005401611328125, 0.0024576187133789062, 0.003814697265625, 0.005171775817871094, 0.0065288543701171875, 0.007885932922363281, 0.009243011474609375, 0.010600090026855469, 0.011957168579101562, 0.013314247131347656, 0.01467132568359375, 0.016028404235839844, 0.017385482788085938, 0.01874256134033203, 0.020099639892578125, 0.02145671844482422, 0.022813796997070312, 0.024170875549316406, 0.0255279541015625, 0.026885032653808594, 0.028242111206054688, 0.02959918975830078, 0.030956268310546875, 0.03231334686279297, 0.03367042541503906, 0.035027503967285156, 0.03638458251953125, 0.037741661071777344, 0.03909873962402344, 0.04045581817626953, 0.041812896728515625, 0.04316997528076172, 0.04452705383300781, 0.045884132385253906, 0.0472412109375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 11.0, 12.0, 30.0, 32.0, 54.0, 86.0, 127.0, 201.0, 342.0, 585.0, 1213.0, 2604.0, 6052.0, 16451.0, 55734.0, 238227.0, 504363.0, 161380.0, 39293.0, 12430.0, 4813.0, 2133.0, 1022.0, 526.0, 309.0, 184.0, 105.0, 76.0, 39.0, 37.0, 19.0, 12.0, 9.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0066986083984375, -0.006491661071777344, -0.0062847137451171875, -0.006077766418457031, -0.005870819091796875, -0.005663871765136719, -0.0054569244384765625, -0.005249977111816406, -0.00504302978515625, -0.004836082458496094, -0.0046291351318359375, -0.004422187805175781, -0.004215240478515625, -0.004008293151855469, -0.0038013458251953125, -0.0035943984985351562, -0.003387451171875, -0.0031805038452148438, -0.0029735565185546875, -0.0027666091918945312, -0.002559661865234375, -0.0023527145385742188, -0.0021457672119140625, -0.0019388198852539062, -0.00173187255859375, -0.0015249252319335938, -0.0013179779052734375, -0.0011110305786132812, -0.000904083251953125, -0.0006971359252929688, -0.0004901885986328125, -0.00028324127197265625, -7.62939453125e-05, 0.00013065338134765625, 0.0003376007080078125, 0.0005445480346679688, 0.000751495361328125, 0.0009584426879882812, 0.0011653900146484375, 0.0013723373413085938, 0.00157928466796875, 0.0017862319946289062, 0.0019931793212890625, 0.0022001266479492188, 0.002407073974609375, 0.0026140213012695312, 0.0028209686279296875, 0.0030279159545898438, 0.00323486328125, 0.0034418106079101562, 0.0036487579345703125, 0.0038557052612304688, 0.004062652587890625, 0.004269599914550781, 0.0044765472412109375, 0.004683494567871094, 0.00489044189453125, 0.005097389221191406, 0.0053043365478515625, 0.005511283874511719, 0.005718231201171875, 0.005925178527832031, 0.0061321258544921875, 0.006339073181152344, 0.0065460205078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 9.0, 5.0, 5.0, 8.0, 15.0, 17.0, 19.0, 21.0, 22.0, 36.0, 37.0, 49.0, 47.0, 68.0, 73.0, 89.0, 81.0, 90.0, 54.0, 51.0, 42.0, 42.0, 28.0, 18.0, 19.0, 17.0, 10.0, 7.0, 5.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.167722702026367e-05, -5.034264177083969e-05, -4.900805652141571e-05, -4.767347127199173e-05, -4.633888602256775e-05, -4.500430077314377e-05, -4.366971552371979e-05, -4.233513027429581e-05, -4.1000545024871826e-05, -3.9665959775447845e-05, -3.8331374526023865e-05, -3.6996789276599884e-05, -3.56622040271759e-05, -3.432761877775192e-05, -3.299303352832794e-05, -3.165844827890396e-05, -3.032386302947998e-05, -2.8989277780056e-05, -2.765469253063202e-05, -2.632010728120804e-05, -2.4985522031784058e-05, -2.3650936782360077e-05, -2.2316351532936096e-05, -2.0981766283512115e-05, -1.9647181034088135e-05, -1.8312595784664154e-05, -1.6978010535240173e-05, -1.5643425285816193e-05, -1.4308840036392212e-05, -1.2974254786968231e-05, -1.163966953754425e-05, -1.030508428812027e-05, -8.970499038696289e-06, -7.635913789272308e-06, -6.301328539848328e-06, -4.966743290424347e-06, -3.632158041000366e-06, -2.2975727915763855e-06, -9.629875421524048e-07, 3.7159770727157593e-07, 1.7061829566955566e-06, 3.0407682061195374e-06, 4.375353455543518e-06, 5.709938704967499e-06, 7.0445239543914795e-06, 8.37910920381546e-06, 9.713694453239441e-06, 1.1048279702663422e-05, 1.2382864952087402e-05, 1.3717450201511383e-05, 1.5052035450935364e-05, 1.6386620700359344e-05, 1.7721205949783325e-05, 1.9055791199207306e-05, 2.0390376448631287e-05, 2.1724961698055267e-05, 2.3059546947479248e-05, 2.439413219690323e-05, 2.572871744632721e-05, 2.706330269575119e-05, 2.839788794517517e-05, 2.973247319459915e-05, 3.106705844402313e-05, 3.240164369344711e-05, 3.3736228942871094e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 13.0, 26.0, 40.0, 42.0, 62.0, 141.0, 236.0, 333.0, 617.0, 1436.0, 3481.0, 9610.0, 35869.0, 176324.0, 549689.0, 210410.0, 42019.0, 10934.0, 3853.0, 1630.0, 755.0, 407.0, 225.0, 129.0, 71.0, 55.0, 39.0, 19.0, 20.0, 11.0, 10.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00632476806640625, -0.006086587905883789, -0.005848407745361328, -0.005610227584838867, -0.005372047424316406, -0.005133867263793945, -0.004895687103271484, -0.0046575069427490234, -0.0044193267822265625, -0.0041811466217041016, -0.003942966461181641, -0.0037047863006591797, -0.0034666061401367188, -0.003228425979614258, -0.002990245819091797, -0.002752065658569336, -0.002513885498046875, -0.002275705337524414, -0.002037525177001953, -0.0017993450164794922, -0.0015611648559570312, -0.0013229846954345703, -0.0010848045349121094, -0.0008466243743896484, -0.0006084442138671875, -0.00037026405334472656, -0.00013208389282226562, 0.00010609626770019531, 0.00034427642822265625, 0.0005824565887451172, 0.0008206367492675781, 0.001058816909790039, 0.0012969970703125, 0.001535177230834961, 0.0017733573913574219, 0.002011537551879883, 0.0022497177124023438, 0.0024878978729248047, 0.0027260780334472656, 0.0029642581939697266, 0.0032024383544921875, 0.0034406185150146484, 0.0036787986755371094, 0.00391697883605957, 0.004155158996582031, 0.004393339157104492, 0.004631519317626953, 0.004869699478149414, 0.005107879638671875, 0.005346059799194336, 0.005584239959716797, 0.005822420120239258, 0.006060600280761719, 0.00629878044128418, 0.006536960601806641, 0.0067751407623291016, 0.0070133209228515625, 0.0072515010833740234, 0.007489681243896484, 0.007727861404418945, 0.007966041564941406, 0.008204221725463867, 0.008442401885986328, 0.008680582046508789, 0.00891876220703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 8.0, 10.0, 16.0, 24.0, 22.0, 40.0, 36.0, 46.0, 57.0, 64.0, 76.0, 86.0, 98.0, 59.0, 71.0, 55.0, 44.0, 43.0, 41.0, 18.0, 16.0, 16.0, 16.0, 7.0, 5.0, 10.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00841522216796875, -0.008103728294372559, -0.007792234420776367, -0.007480740547180176, -0.007169246673583984, -0.006857752799987793, -0.0065462589263916016, -0.00623476505279541, -0.005923271179199219, -0.005611777305603027, -0.005300283432006836, -0.0049887895584106445, -0.004677295684814453, -0.004365801811218262, -0.00405430793762207, -0.003742814064025879, -0.0034313201904296875, -0.003119826316833496, -0.0028083324432373047, -0.0024968385696411133, -0.002185344696044922, -0.0018738508224487305, -0.001562356948852539, -0.0012508630752563477, -0.0009393692016601562, -0.0006278753280639648, -0.00031638145446777344, -4.887580871582031e-06, 0.0003066062927246094, 0.0006181001663208008, 0.0009295940399169922, 0.0012410879135131836, 0.001552581787109375, 0.0018640756607055664, 0.002175569534301758, 0.0024870634078979492, 0.0027985572814941406, 0.003110051155090332, 0.0034215450286865234, 0.003733038902282715, 0.004044532775878906, 0.004356026649475098, 0.004667520523071289, 0.0049790143966674805, 0.005290508270263672, 0.005602002143859863, 0.005913496017456055, 0.006224989891052246, 0.0065364837646484375, 0.006847977638244629, 0.00715947151184082, 0.007470965385437012, 0.007782459259033203, 0.008093953132629395, 0.008405447006225586, 0.008716940879821777, 0.009028434753417969, 0.00933992862701416, 0.009651422500610352, 0.009962916374206543, 0.010274410247802734, 0.010585904121398926, 0.010897397994995117, 0.011208891868591309, 0.0115203857421875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 60.0, 316.0, 451.0, 150.0, 21.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.518557071685791, -0.4995139539241791, -0.48047083616256714, -0.4614277482032776, -0.44238463044166565, -0.4233415126800537, -0.40429842472076416, -0.3852553069591522, -0.3662121891975403, -0.34716907143592834, -0.3281259536743164, -0.30908286571502686, -0.2900397479534149, -0.270996630191803, -0.2519535422325134, -0.2329104244709015, -0.21386730670928955, -0.1948241889476776, -0.17578108608722687, -0.15673798322677612, -0.13769486546516418, -0.11865175515413284, -0.0996086448431015, -0.08056554198265076, -0.06152242422103882, -0.04247931391000748, -0.023436203598976135, -0.004393093287944794, 0.014650017023086548, 0.03369312733411789, 0.05273623764514923, 0.07177934050559998, 0.09082245826721191, 0.10986556857824326, 0.1289086788892746, 0.14795178174972534, 0.16699489951133728, 0.18603801727294922, 0.20508112013339996, 0.2241242229938507, 0.24316734075546265, 0.2622104585170746, 0.2812535762786865, 0.3002966642379761, 0.319339781999588, 0.33838289976119995, 0.3574259877204895, 0.37646910548210144, 0.3955122232437134, 0.4145553410053253, 0.43359845876693726, 0.4526415467262268, 0.47168466448783875, 0.4907277822494507, 0.5097708702087402, 0.5288139581680298, 0.5478571057319641, 0.5669001936912537, 0.585943341255188, 0.6049864292144775, 0.6240295171737671, 0.6430726647377014, 0.662115752696991, 0.6811589002609253, 0.7002019882202148]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 5.0, 6.0, 10.0, 10.0, 12.0, 18.0, 29.0, 21.0, 24.0, 18.0, 28.0, 26.0, 38.0, 42.0, 37.0, 44.0, 49.0, 50.0, 43.0, 36.0, 44.0, 39.0, 34.0, 45.0, 28.0, 26.0, 29.0, 37.0, 23.0, 22.0, 18.0, 14.0, 12.0, 11.0, 8.0, 9.0, 3.0, 9.0, 6.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.20752465724945068, -0.2016763836145401, -0.19582809507846832, -0.18997982144355774, -0.18413153290748596, -0.17828325927257538, -0.1724349856376648, -0.16658669710159302, -0.16073842346668243, -0.15489014983177185, -0.14904186129570007, -0.1431935876607895, -0.1373453140258789, -0.13149702548980713, -0.12564875185489655, -0.11980047076940536, -0.11395218968391418, -0.108103908598423, -0.10225562751293182, -0.09640735387802124, -0.09055907279253006, -0.08471079170703888, -0.0788625180721283, -0.07301423698663712, -0.06716595590114594, -0.061317674815654755, -0.05546939745545387, -0.04962112009525299, -0.04377283900976181, -0.03792455792427063, -0.03207628056406975, -0.026228003203868866, -0.020379722118377686, -0.014531442895531654, -0.008683163672685623, -0.002834884449839592, 0.003013394773006439, 0.00886167399585247, 0.014709953218698502, 0.020558230578899384, 0.026406511664390564, 0.032254792749881744, 0.038103070110082626, 0.04395134747028351, 0.04979962855577469, 0.05564790964126587, 0.06149618700146675, 0.06734446436166763, 0.07319274544715881, 0.07904102653265, 0.08488930761814117, 0.09073758125305176, 0.09658586233854294, 0.10243414342403412, 0.1082824170589447, 0.11413069814443588, 0.11997897922992706, 0.12582725286483765, 0.13167554140090942, 0.13752381503582, 0.1433720886707306, 0.14922037720680237, 0.15506865084171295, 0.16091692447662354, 0.1667652130126953]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 7.0, 6.0, 7.0, 10.0, 15.0, 24.0, 41.0, 60.0, 65.0, 153.0, 239.0, 440.0, 1016.0, 3049.0, 14503.0, 525816.0, 3626915.0, 16527.0, 3199.0, 1062.0, 481.0, 230.0, 142.0, 81.0, 73.0, 28.0, 21.0, 20.0, 4.0, 12.0, 3.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0231781005859375, -0.022287607192993164, -0.021397113800048828, -0.020506620407104492, -0.019616127014160156, -0.01872563362121582, -0.017835140228271484, -0.01694464683532715, -0.016054153442382812, -0.015163660049438477, -0.01427316665649414, -0.013382673263549805, -0.012492179870605469, -0.011601686477661133, -0.010711193084716797, -0.009820699691772461, -0.008930206298828125, -0.008039712905883789, -0.007149219512939453, -0.006258726119995117, -0.005368232727050781, -0.004477739334106445, -0.0035872459411621094, -0.0026967525482177734, -0.0018062591552734375, -0.0009157657623291016, -2.5272369384765625e-05, 0.0008652210235595703, 0.0017557144165039062, 0.002646207809448242, 0.003536701202392578, 0.004427194595336914, 0.00531768798828125, 0.006208181381225586, 0.007098674774169922, 0.007989168167114258, 0.008879661560058594, 0.00977015495300293, 0.010660648345947266, 0.011551141738891602, 0.012441635131835938, 0.013332128524780273, 0.01422262191772461, 0.015113115310668945, 0.01600360870361328, 0.016894102096557617, 0.017784595489501953, 0.01867508888244629, 0.019565582275390625, 0.02045607566833496, 0.021346569061279297, 0.022237062454223633, 0.02312755584716797, 0.024018049240112305, 0.02490854263305664, 0.025799036026000977, 0.026689529418945312, 0.02758002281188965, 0.028470516204833984, 0.02936100959777832, 0.030251502990722656, 0.031141996383666992, 0.03203248977661133, 0.032922983169555664, 0.0338134765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 1.0, 7.0, 9.0, 8.0, 26.0, 30.0, 38.0, 37.0, 54.0, 73.0, 66.0, 85.0, 85.0, 74.0, 82.0, 85.0, 54.0, 51.0, 36.0, 30.0, 15.0, 10.0, 3.0, 8.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021087646484375, -0.020461082458496094, -0.019834518432617188, -0.01920795440673828, -0.018581390380859375, -0.01795482635498047, -0.017328262329101562, -0.016701698303222656, -0.01607513427734375, -0.015448570251464844, -0.014822006225585938, -0.014195442199707031, -0.013568878173828125, -0.012942314147949219, -0.012315750122070312, -0.011689186096191406, -0.0110626220703125, -0.010436058044433594, -0.009809494018554688, -0.009182929992675781, -0.008556365966796875, -0.007929801940917969, -0.0073032379150390625, -0.006676673889160156, -0.00605010986328125, -0.005423545837402344, -0.0047969818115234375, -0.004170417785644531, -0.003543853759765625, -0.0029172897338867188, -0.0022907257080078125, -0.0016641616821289062, -0.00103759765625, -0.00041103363037109375, 0.0002155303955078125, 0.0008420944213867188, 0.001468658447265625, 0.0020952224731445312, 0.0027217864990234375, 0.0033483505249023438, 0.00397491455078125, 0.004601478576660156, 0.0052280426025390625, 0.005854606628417969, 0.006481170654296875, 0.007107734680175781, 0.0077342987060546875, 0.008360862731933594, 0.0089874267578125, 0.009613990783691406, 0.010240554809570312, 0.010867118835449219, 0.011493682861328125, 0.012120246887207031, 0.012746810913085938, 0.013373374938964844, 0.01399993896484375, 0.014626502990722656, 0.015253067016601562, 0.01587963104248047, 0.016506195068359375, 0.01713275909423828, 0.017759323120117188, 0.018385887145996094, 0.019012451171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 0.0, 7.0, 11.0, 3.0, 18.0, 12.0, 27.0, 30.0, 36.0, 49.0, 69.0, 93.0, 128.0, 177.0, 295.0, 526.0, 893.0, 1782.0, 3444.0, 9251.0, 37220.0, 456455.0, 3605461.0, 56946.0, 12163.0, 4396.0, 2034.0, 1107.0, 595.0, 311.0, 210.0, 141.0, 91.0, 64.0, 58.0, 38.0, 34.0, 27.0, 15.0, 13.0, 11.0, 10.0, 15.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0117034912109375, -0.011339068412780762, -0.010974645614624023, -0.010610222816467285, -0.010245800018310547, -0.009881377220153809, -0.00951695442199707, -0.009152531623840332, -0.008788108825683594, -0.008423686027526855, -0.008059263229370117, -0.007694840431213379, -0.007330417633056641, -0.006965994834899902, -0.006601572036743164, -0.006237149238586426, -0.0058727264404296875, -0.005508303642272949, -0.005143880844116211, -0.004779458045959473, -0.004415035247802734, -0.004050612449645996, -0.003686189651489258, -0.0033217668533325195, -0.0029573440551757812, -0.002592921257019043, -0.0022284984588623047, -0.0018640756607055664, -0.0014996528625488281, -0.0011352300643920898, -0.0007708072662353516, -0.0004063844680786133, -4.1961669921875e-05, 0.0003224611282348633, 0.0006868839263916016, 0.0010513067245483398, 0.0014157295227050781, 0.0017801523208618164, 0.0021445751190185547, 0.002508997917175293, 0.0028734207153320312, 0.0032378435134887695, 0.003602266311645508, 0.003966689109802246, 0.004331111907958984, 0.004695534706115723, 0.005059957504272461, 0.005424380302429199, 0.0057888031005859375, 0.006153225898742676, 0.006517648696899414, 0.006882071495056152, 0.007246494293212891, 0.007610917091369629, 0.007975339889526367, 0.008339762687683105, 0.008704185485839844, 0.009068608283996582, 0.00943303108215332, 0.009797453880310059, 0.010161876678466797, 0.010526299476623535, 0.010890722274780273, 0.011255145072937012, 0.01161956787109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 7.0, 10.0, 12.0, 17.0, 43.0, 89.0, 192.0, 2862.0, 518.0, 141.0, 72.0, 38.0, 12.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003871917724609375, -0.0037640929222106934, -0.0036562681198120117, -0.00354844331741333, -0.0034406185150146484, -0.003332793712615967, -0.003224968910217285, -0.0031171441078186035, -0.003009319305419922, -0.0029014945030212402, -0.0027936697006225586, -0.002685844898223877, -0.0025780200958251953, -0.0024701952934265137, -0.002362370491027832, -0.0022545456886291504, -0.0021467208862304688, -0.002038896083831787, -0.0019310712814331055, -0.0018232464790344238, -0.0017154216766357422, -0.0016075968742370605, -0.001499772071838379, -0.0013919472694396973, -0.0012841224670410156, -0.001176297664642334, -0.0010684728622436523, -0.0009606480598449707, -0.0008528232574462891, -0.0007449984550476074, -0.0006371736526489258, -0.0005293488502502441, -0.0004215240478515625, -0.00031369924545288086, -0.00020587444305419922, -9.804964065551758e-05, 9.775161743164062e-06, 0.0001175999641418457, 0.00022542476654052734, 0.000333249568939209, 0.0004410743713378906, 0.0005488991737365723, 0.0006567239761352539, 0.0007645487785339355, 0.0008723735809326172, 0.0009801983833312988, 0.0010880231857299805, 0.0011958479881286621, 0.0013036727905273438, 0.0014114975929260254, 0.001519322395324707, 0.0016271471977233887, 0.0017349720001220703, 0.001842796802520752, 0.0019506216049194336, 0.0020584464073181152, 0.002166271209716797, 0.0022740960121154785, 0.00238192081451416, 0.002489745616912842, 0.0025975704193115234, 0.002705395221710205, 0.0028132200241088867, 0.0029210448265075684, 0.00302886962890625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 14.0, 32.0, 168.0, 436.0, 287.0, 59.0, 12.0, 1.0, 1.0, 1.0], "bins": [-0.09188259392976761, -0.09029620885848999, -0.08870981633663177, -0.08712343126535416, -0.08553703874349594, -0.08395065367221832, -0.0823642686009407, -0.08077787607908249, -0.07919149100780487, -0.07760510593652725, -0.07601871341466904, -0.07443232834339142, -0.0728459358215332, -0.07125955075025558, -0.06967316567897797, -0.06808677315711975, -0.06650038808584213, -0.06491400301456451, -0.0633276104927063, -0.06174122542142868, -0.060154836624860764, -0.05856844782829285, -0.05698205903172493, -0.05539567023515701, -0.053809281438589096, -0.05222289264202118, -0.05063650384545326, -0.049050118774175644, -0.04746372997760773, -0.04587734118103981, -0.04429095238447189, -0.042704567313194275, -0.04111817851662636, -0.03953178972005844, -0.037945400923490524, -0.036359015852212906, -0.03477262705564499, -0.03318623825907707, -0.031599849462509155, -0.030013462528586388, -0.02842707559466362, -0.026840686798095703, -0.025254299864172935, -0.02366791106760502, -0.02208152413368225, -0.020495135337114334, -0.018908746540546417, -0.01732235960662365, -0.015735970810055733, -0.01414958294481039, -0.012563195079565048, -0.010976806282997131, -0.009390419349074364, -0.007804030552506447, -0.006217642687261105, -0.004631254822015762, -0.00304486695677042, -0.001458478975109756, 0.0001279090065509081, 0.001714297104626894, 0.0033006849698722363, 0.004887073300778866, 0.006473461166024208, 0.00805984903126955, 0.009646236896514893]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 2.0, 12.0, 8.0, 14.0, 16.0, 10.0, 16.0, 19.0, 24.0, 19.0, 36.0, 28.0, 31.0, 41.0, 28.0, 41.0, 39.0, 26.0, 33.0, 43.0, 39.0, 38.0, 37.0, 46.0, 31.0, 50.0, 38.0, 30.0, 19.0, 30.0, 28.0, 19.0, 17.0, 22.0, 12.0, 9.0, 14.0, 9.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.007353544235229492, -0.007127969525754452, -0.006902394816279411, -0.006676820106804371, -0.0064512453973293304, -0.00622567068785429, -0.00600009597837925, -0.005774521268904209, -0.005548946559429169, -0.005323371849954128, -0.005097797140479088, -0.004872222431004047, -0.004646647721529007, -0.0044210730120539665, -0.004195498302578926, -0.003969923593103886, -0.003744348883628845, -0.0035187741741538048, -0.0032931994646787643, -0.003067624755203724, -0.0028420500457286835, -0.002616475336253643, -0.0023909006267786026, -0.002165325917303562, -0.0019397512078285217, -0.0017141764983534813, -0.0014886017888784409, -0.0012630270794034004, -0.00103745236992836, -0.0008118776604533195, -0.0005863029509782791, -0.0003607282415032387, -0.00013515353202819824, 9.04211774468422e-05, 0.00031599588692188263, 0.0005415705963969231, 0.0007671453058719635, 0.000992720015347004, 0.0012182947248220444, 0.0014438694342970848, 0.0016694441437721252, 0.0018950188532471657, 0.002120593562722206, 0.0023461682721972466, 0.002571742981672287, 0.0027973176911473274, 0.003022892400622368, 0.0032484671100974083, 0.0034740418195724487, 0.003699616529047489, 0.00392519123852253, 0.00415076594799757, 0.0043763406574726105, 0.004601915366947651, 0.004827490076422691, 0.005053064785897732, 0.005278639495372772, 0.005504214204847813, 0.005729788914322853, 0.0059553636237978935, 0.006180938333272934, 0.006406513042747974, 0.006632087752223015, 0.006857662461698055, 0.007083237171173096]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 4.0, 6.0, 5.0, 12.0, 20.0, 30.0, 44.0, 75.0, 145.0, 298.0, 551.0, 1260.0, 3087.0, 8925.0, 32006.0, 157326.0, 530439.0, 247697.0, 47229.0, 12331.0, 4055.0, 1555.0, 697.0, 342.0, 171.0, 98.0, 53.0, 22.0, 19.0, 14.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.02239990234375, -0.0217134952545166, -0.021027088165283203, -0.020340681076049805, -0.019654273986816406, -0.018967866897583008, -0.01828145980834961, -0.01759505271911621, -0.016908645629882812, -0.016222238540649414, -0.015535831451416016, -0.014849424362182617, -0.014163017272949219, -0.01347661018371582, -0.012790203094482422, -0.012103796005249023, -0.011417388916015625, -0.010730981826782227, -0.010044574737548828, -0.00935816764831543, -0.008671760559082031, -0.007985353469848633, -0.007298946380615234, -0.006612539291381836, -0.0059261322021484375, -0.005239725112915039, -0.004553318023681641, -0.003866910934448242, -0.0031805038452148438, -0.0024940967559814453, -0.0018076896667480469, -0.0011212825775146484, -0.00043487548828125, 0.00025153160095214844, 0.0009379386901855469, 0.0016243457794189453, 0.0023107528686523438, 0.002997159957885742, 0.0036835670471191406, 0.004369974136352539, 0.0050563812255859375, 0.005742788314819336, 0.006429195404052734, 0.007115602493286133, 0.007802009582519531, 0.00848841667175293, 0.009174823760986328, 0.009861230850219727, 0.010547637939453125, 0.011234045028686523, 0.011920452117919922, 0.01260685920715332, 0.013293266296386719, 0.013979673385620117, 0.014666080474853516, 0.015352487564086914, 0.016038894653320312, 0.01672530174255371, 0.01741170883178711, 0.018098115921020508, 0.018784523010253906, 0.019470930099487305, 0.020157337188720703, 0.0208437442779541, 0.0215301513671875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 6.0, 3.0, 13.0, 11.0, 17.0, 33.0, 33.0, 39.0, 42.0, 69.0, 78.0, 78.0, 80.0, 80.0, 76.0, 72.0, 74.0, 55.0, 37.0, 33.0, 17.0, 13.0, 4.0, 8.0, 4.0, 7.0, 7.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02117919921875, -0.0205538272857666, -0.019928455352783203, -0.019303083419799805, -0.018677711486816406, -0.018052339553833008, -0.01742696762084961, -0.01680159568786621, -0.016176223754882812, -0.015550851821899414, -0.014925479888916016, -0.014300107955932617, -0.013674736022949219, -0.01304936408996582, -0.012423992156982422, -0.011798620223999023, -0.011173248291015625, -0.010547876358032227, -0.009922504425048828, -0.00929713249206543, -0.008671760559082031, -0.008046388626098633, -0.007421016693115234, -0.006795644760131836, -0.0061702728271484375, -0.005544900894165039, -0.004919528961181641, -0.004294157028198242, -0.0036687850952148438, -0.0030434131622314453, -0.002418041229248047, -0.0017926692962646484, -0.00116729736328125, -0.0005419254302978516, 8.344650268554688e-05, 0.0007088184356689453, 0.0013341903686523438, 0.001959562301635742, 0.0025849342346191406, 0.003210306167602539, 0.0038356781005859375, 0.004461050033569336, 0.005086421966552734, 0.005711793899536133, 0.006337165832519531, 0.00696253776550293, 0.007587909698486328, 0.008213281631469727, 0.008838653564453125, 0.009464025497436523, 0.010089397430419922, 0.01071476936340332, 0.011340141296386719, 0.011965513229370117, 0.012590885162353516, 0.013216257095336914, 0.013841629028320312, 0.014467000961303711, 0.01509237289428711, 0.015717744827270508, 0.016343116760253906, 0.016968488693237305, 0.017593860626220703, 0.0182192325592041, 0.0188446044921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 10.0, 20.0, 31.0, 44.0, 83.0, 144.0, 243.0, 522.0, 1657.0, 12867.0, 682002.0, 341039.0, 7474.0, 1318.0, 482.0, 246.0, 126.0, 74.0, 45.0, 43.0, 26.0, 14.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041290283203125, -0.03986167907714844, -0.038433074951171875, -0.03700447082519531, -0.03557586669921875, -0.03414726257324219, -0.032718658447265625, -0.03129005432128906, -0.0298614501953125, -0.028432846069335938, -0.027004241943359375, -0.025575637817382812, -0.02414703369140625, -0.022718429565429688, -0.021289825439453125, -0.019861221313476562, -0.0184326171875, -0.017004013061523438, -0.015575408935546875, -0.014146804809570312, -0.01271820068359375, -0.011289596557617188, -0.009860992431640625, -0.008432388305664062, -0.0070037841796875, -0.0055751800537109375, -0.004146575927734375, -0.0027179718017578125, -0.00128936767578125, 0.0001392364501953125, 0.001567840576171875, 0.0029964447021484375, 0.004425048828125, 0.0058536529541015625, 0.007282257080078125, 0.008710861206054688, 0.01013946533203125, 0.011568069458007812, 0.012996673583984375, 0.014425277709960938, 0.0158538818359375, 0.017282485961914062, 0.018711090087890625, 0.020139694213867188, 0.02156829833984375, 0.022996902465820312, 0.024425506591796875, 0.025854110717773438, 0.02728271484375, 0.028711318969726562, 0.030139923095703125, 0.03156852722167969, 0.03299713134765625, 0.03442573547363281, 0.035854339599609375, 0.03728294372558594, 0.0387115478515625, 0.04014015197753906, 0.041568756103515625, 0.04299736022949219, 0.04442596435546875, 0.04585456848144531, 0.047283172607421875, 0.04871177673339844, 0.050140380859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 17.0, 14.0, 15.0, 25.0, 27.0, 23.0, 26.0, 49.0, 51.0, 51.0, 72.0, 72.0, 47.0, 64.0, 57.0, 64.0, 49.0, 58.0, 42.0, 44.0, 32.0, 25.0, 13.0, 16.0, 18.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05078125, -0.049007415771484375, -0.04723358154296875, -0.045459747314453125, -0.0436859130859375, -0.041912078857421875, -0.04013824462890625, -0.038364410400390625, -0.036590576171875, -0.034816741943359375, -0.03304290771484375, -0.031269073486328125, -0.0294952392578125, -0.027721405029296875, -0.02594757080078125, -0.024173736572265625, -0.02239990234375, -0.020626068115234375, -0.01885223388671875, -0.017078399658203125, -0.0153045654296875, -0.013530731201171875, -0.01175689697265625, -0.009983062744140625, -0.008209228515625, -0.006435394287109375, -0.00466156005859375, -0.002887725830078125, -0.0011138916015625, 0.000659942626953125, 0.00243377685546875, 0.004207611083984375, 0.0059814453125, 0.007755279541015625, 0.00952911376953125, 0.011302947998046875, 0.0130767822265625, 0.014850616455078125, 0.01662445068359375, 0.018398284912109375, 0.020172119140625, 0.021945953369140625, 0.02371978759765625, 0.025493621826171875, 0.0272674560546875, 0.029041290283203125, 0.03081512451171875, 0.032588958740234375, 0.03436279296875, 0.036136627197265625, 0.03791046142578125, 0.039684295654296875, 0.0414581298828125, 0.043231964111328125, 0.04500579833984375, 0.046779632568359375, 0.048553466796875, 0.050327301025390625, 0.05210113525390625, 0.053874969482421875, 0.0556488037109375, 0.057422637939453125, 0.05919647216796875, 0.060970306396484375, 0.062744140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 38.0, 83.0, 231.0, 866.0, 18099.0, 1017896.0, 10319.0, 630.0, 204.0, 77.0, 38.0, 16.0, 6.0, 6.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.054351806640625, -0.05318140983581543, -0.05201101303100586, -0.05084061622619629, -0.04967021942138672, -0.04849982261657715, -0.04732942581176758, -0.04615902900695801, -0.04498863220214844, -0.04381823539733887, -0.0426478385925293, -0.04147744178771973, -0.040307044982910156, -0.039136648178100586, -0.037966251373291016, -0.036795854568481445, -0.035625457763671875, -0.034455060958862305, -0.033284664154052734, -0.032114267349243164, -0.030943870544433594, -0.029773473739624023, -0.028603076934814453, -0.027432680130004883, -0.026262283325195312, -0.025091886520385742, -0.023921489715576172, -0.0227510929107666, -0.02158069610595703, -0.02041029930114746, -0.01923990249633789, -0.01806950569152832, -0.01689910888671875, -0.01572871208190918, -0.01455831527709961, -0.013387918472290039, -0.012217521667480469, -0.011047124862670898, -0.009876728057861328, -0.008706331253051758, -0.0075359344482421875, -0.006365537643432617, -0.005195140838623047, -0.0040247440338134766, -0.0028543472290039062, -0.001683950424194336, -0.0005135536193847656, 0.0006568431854248047, 0.001827239990234375, 0.0029976367950439453, 0.004168033599853516, 0.005338430404663086, 0.006508827209472656, 0.0076792240142822266, 0.008849620819091797, 0.010020017623901367, 0.011190414428710938, 0.012360811233520508, 0.013531208038330078, 0.014701604843139648, 0.01587200164794922, 0.01704239845275879, 0.01821279525756836, 0.01938319206237793, 0.0205535888671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 14.0, 23.0, 48.0, 83.0, 144.0, 202.0, 206.0, 111.0, 75.0, 34.0, 15.0, 13.0, 13.0, 5.0, 6.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.00016641616821289062, -0.00016314350068569183, -0.00015987083315849304, -0.00015659816563129425, -0.00015332549810409546, -0.00015005283057689667, -0.00014678016304969788, -0.00014350749552249908, -0.0001402348279953003, -0.0001369621604681015, -0.0001336894929409027, -0.00013041682541370392, -0.00012714415788650513, -0.00012387149035930634, -0.00012059882283210754, -0.00011732615530490875, -0.00011405348777770996, -0.00011078082025051117, -0.00010750815272331238, -0.00010423548519611359, -0.0001009628176689148, -9.7690150141716e-05, -9.441748261451721e-05, -9.114481508731842e-05, -8.787214756011963e-05, -8.459948003292084e-05, -8.132681250572205e-05, -7.805414497852325e-05, -7.478147745132446e-05, -7.150880992412567e-05, -6.823614239692688e-05, -6.496347486972809e-05, -6.16908073425293e-05, -5.8418139815330505e-05, -5.5145472288131714e-05, -5.187280476093292e-05, -4.860013723373413e-05, -4.532746970653534e-05, -4.205480217933655e-05, -3.8782134652137756e-05, -3.5509467124938965e-05, -3.223679959774017e-05, -2.8964132070541382e-05, -2.569146454334259e-05, -2.24187970161438e-05, -1.9146129488945007e-05, -1.5873461961746216e-05, -1.2600794434547424e-05, -9.328126907348633e-06, -6.055459380149841e-06, -2.78279185295105e-06, 4.898756742477417e-07, 3.762543201446533e-06, 7.035210728645325e-06, 1.0307878255844116e-05, 1.3580545783042908e-05, 1.68532133102417e-05, 2.012588083744049e-05, 2.3398548364639282e-05, 2.6671215891838074e-05, 2.9943883419036865e-05, 3.321655094623566e-05, 3.648921847343445e-05, 3.976188600063324e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 10.0, 16.0, 18.0, 36.0, 68.0, 157.0, 298.0, 974.0, 5597.0, 325743.0, 705468.0, 8273.0, 1178.0, 358.0, 180.0, 88.0, 38.0, 16.0, 11.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02093505859375, -0.020189523696899414, -0.019443988800048828, -0.018698453903198242, -0.017952919006347656, -0.01720738410949707, -0.016461849212646484, -0.0157163143157959, -0.014970779418945312, -0.014225244522094727, -0.01347970962524414, -0.012734174728393555, -0.011988639831542969, -0.011243104934692383, -0.010497570037841797, -0.009752035140991211, -0.009006500244140625, -0.008260965347290039, -0.007515430450439453, -0.006769895553588867, -0.006024360656738281, -0.005278825759887695, -0.004533290863037109, -0.0037877559661865234, -0.0030422210693359375, -0.0022966861724853516, -0.0015511512756347656, -0.0008056163787841797, -6.008148193359375e-05, 0.0006854534149169922, 0.0014309883117675781, 0.002176523208618164, 0.00292205810546875, 0.003667593002319336, 0.004413127899169922, 0.005158662796020508, 0.005904197692871094, 0.00664973258972168, 0.007395267486572266, 0.008140802383422852, 0.008886337280273438, 0.009631872177124023, 0.01037740707397461, 0.011122941970825195, 0.011868476867675781, 0.012614011764526367, 0.013359546661376953, 0.014105081558227539, 0.014850616455078125, 0.015596151351928711, 0.016341686248779297, 0.017087221145629883, 0.01783275604248047, 0.018578290939331055, 0.01932382583618164, 0.020069360733032227, 0.020814895629882812, 0.0215604305267334, 0.022305965423583984, 0.02305150032043457, 0.023797035217285156, 0.024542570114135742, 0.025288105010986328, 0.026033639907836914, 0.0267791748046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 36.0, 128.0, 325.0, 329.0, 115.0, 32.0, 18.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036102294921875, -0.034714698791503906, -0.03332710266113281, -0.03193950653076172, -0.030551910400390625, -0.02916431427001953, -0.027776718139648438, -0.026389122009277344, -0.02500152587890625, -0.023613929748535156, -0.022226333618164062, -0.02083873748779297, -0.019451141357421875, -0.01806354522705078, -0.016675949096679688, -0.015288352966308594, -0.0139007568359375, -0.012513160705566406, -0.011125564575195312, -0.009737968444824219, -0.008350372314453125, -0.006962776184082031, -0.0055751800537109375, -0.004187583923339844, -0.00279998779296875, -0.0014123916625976562, -2.47955322265625e-05, 0.0013628005981445312, 0.002750396728515625, 0.004137992858886719, 0.0055255889892578125, 0.006913185119628906, 0.00830078125, 0.009688377380371094, 0.011075973510742188, 0.012463569641113281, 0.013851165771484375, 0.015238761901855469, 0.016626358032226562, 0.018013954162597656, 0.01940155029296875, 0.020789146423339844, 0.022176742553710938, 0.02356433868408203, 0.024951934814453125, 0.02633953094482422, 0.027727127075195312, 0.029114723205566406, 0.0305023193359375, 0.031889915466308594, 0.03327751159667969, 0.03466510772705078, 0.036052703857421875, 0.03744029998779297, 0.03882789611816406, 0.040215492248535156, 0.04160308837890625, 0.042990684509277344, 0.04437828063964844, 0.04576587677001953, 0.047153472900390625, 0.04854106903076172, 0.04992866516113281, 0.051316261291503906, 0.052703857421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 94.0, 316.0, 370.0, 132.0, 41.0, 14.0, 15.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42696258425712585, -0.4121873378753662, -0.39741209149360657, -0.3826368451118469, -0.3678615987300873, -0.35308635234832764, -0.338311105966568, -0.32353585958480835, -0.3087606132030487, -0.29398536682128906, -0.2792101204395294, -0.2644348740577698, -0.24965962767601013, -0.2348843812942505, -0.22010913491249084, -0.2053338885307312, -0.19055864214897156, -0.17578339576721191, -0.16100814938545227, -0.14623290300369263, -0.13145765662193298, -0.11668241024017334, -0.1019071638584137, -0.08713191747665405, -0.07235667109489441, -0.057581424713134766, -0.04280617833137512, -0.02803093194961548, -0.013255685567855835, 0.0015195608139038086, 0.016294807195663452, 0.031070053577423096, 0.04584532976150513, 0.06062057614326477, 0.07539582252502441, 0.09017106890678406, 0.1049463152885437, 0.11972156167030334, 0.134496808052063, 0.14927205443382263, 0.16404730081558228, 0.17882254719734192, 0.19359779357910156, 0.2083730399608612, 0.22314828634262085, 0.2379235327243805, 0.25269877910614014, 0.2674740254878998, 0.2822492718696594, 0.29702451825141907, 0.3117997646331787, 0.32657501101493835, 0.341350257396698, 0.35612550377845764, 0.3709007501602173, 0.38567599654197693, 0.4004512429237366, 0.4152264893054962, 0.43000173568725586, 0.4447769820690155, 0.45955222845077515, 0.4743274748325348, 0.48910272121429443, 0.5038779973983765, 0.5186532139778137]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 12.0, 9.0, 9.0, 15.0, 23.0, 28.0, 33.0, 39.0, 40.0, 61.0, 40.0, 68.0, 56.0, 58.0, 68.0, 58.0, 60.0, 51.0, 44.0, 41.0, 42.0, 24.0, 26.0, 16.0, 22.0, 16.0, 11.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.34668922424316406, -0.3384120464324951, -0.33013486862182617, -0.3218576908111572, -0.3135804831981659, -0.30530330538749695, -0.297026127576828, -0.28874894976615906, -0.2804717719554901, -0.27219459414482117, -0.2639174163341522, -0.2556402087211609, -0.24736304581165314, -0.239085853099823, -0.23080867528915405, -0.2225314974784851, -0.21425430476665497, -0.20597712695598602, -0.19769993424415588, -0.18942275643348694, -0.181145578622818, -0.17286840081214905, -0.1645912081003189, -0.15631403028964996, -0.14803683757781982, -0.13975965976715088, -0.13148246705532074, -0.1232052892446518, -0.11492811143398285, -0.1066509261727333, -0.09837374091148376, -0.09009656310081482, -0.08181938529014587, -0.07354220002889633, -0.06526502221822739, -0.056987836956977844, -0.0487106554210186, -0.04043347388505936, -0.032156288623809814, -0.02387910708785057, -0.015601925551891327, -0.0073247430846095085, 0.0009524393826723099, 0.009229622781276703, 0.017506804317235947, 0.02578398585319519, 0.03406117111444473, 0.042338352650403976, 0.05061553418636322, 0.058892715722322464, 0.06716989725828171, 0.07544708251953125, 0.0837242603302002, 0.09200144559144974, 0.10027863085269928, 0.10855580866336823, 0.11683299392461777, 0.1251101791858673, 0.13338735699653625, 0.1416645348072052, 0.14994172751903534, 0.15821890532970428, 0.16649609804153442, 0.17477327585220337, 0.18305045366287231]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 14.0, 28.0, 31.0, 43.0, 55.0, 67.0, 112.0, 182.0, 429.0, 1975.0, 229224.0, 3958835.0, 2248.0, 457.0, 206.0, 111.0, 87.0, 54.0, 43.0, 16.0, 29.0, 11.0, 9.0, 3.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08172607421875, -0.07939338684082031, -0.07706069946289062, -0.07472801208496094, -0.07239532470703125, -0.07006263732910156, -0.06772994995117188, -0.06539726257324219, -0.0630645751953125, -0.06073188781738281, -0.058399200439453125, -0.05606651306152344, -0.05373382568359375, -0.05140113830566406, -0.049068450927734375, -0.04673576354980469, -0.044403076171875, -0.04207038879394531, -0.039737701416015625, -0.03740501403808594, -0.03507232666015625, -0.03273963928222656, -0.030406951904296875, -0.028074264526367188, -0.0257415771484375, -0.023408889770507812, -0.021076202392578125, -0.018743515014648438, -0.01641082763671875, -0.014078140258789062, -0.011745452880859375, -0.009412765502929688, -0.007080078125, -0.0047473907470703125, -0.002414703369140625, -8.20159912109375e-05, 0.00225067138671875, 0.0045833587646484375, 0.006916046142578125, 0.009248733520507812, 0.0115814208984375, 0.013914108276367188, 0.016246795654296875, 0.018579483032226562, 0.02091217041015625, 0.023244857788085938, 0.025577545166015625, 0.027910232543945312, 0.030242919921875, 0.03257560729980469, 0.034908294677734375, 0.03724098205566406, 0.03957366943359375, 0.04190635681152344, 0.044239044189453125, 0.04657173156738281, 0.0489044189453125, 0.05123710632324219, 0.053569793701171875, 0.05590248107910156, 0.05823516845703125, 0.06056785583496094, 0.06290054321289062, 0.06523323059082031, 0.06756591796875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 4.0, 8.0, 14.0, 21.0, 19.0, 44.0, 39.0, 56.0, 62.0, 70.0, 71.0, 75.0, 82.0, 85.0, 72.0, 61.0, 50.0, 41.0, 25.0, 32.0, 11.0, 10.0, 12.0, 6.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213165283203125, -0.02068638801574707, -0.02005624771118164, -0.01942610740661621, -0.01879596710205078, -0.01816582679748535, -0.017535686492919922, -0.016905546188354492, -0.016275405883789062, -0.015645265579223633, -0.015015125274658203, -0.014384984970092773, -0.013754844665527344, -0.013124704360961914, -0.012494564056396484, -0.011864423751831055, -0.011234283447265625, -0.010604143142700195, -0.009974002838134766, -0.009343862533569336, -0.008713722229003906, -0.008083581924438477, -0.007453441619873047, -0.006823301315307617, -0.0061931610107421875, -0.005563020706176758, -0.004932880401611328, -0.0043027400970458984, -0.0036725997924804688, -0.003042459487915039, -0.0024123191833496094, -0.0017821788787841797, -0.00115203857421875, -0.0005218982696533203, 0.00010824203491210938, 0.0007383823394775391, 0.0013685226440429688, 0.0019986629486083984, 0.002628803253173828, 0.003258943557739258, 0.0038890838623046875, 0.004519224166870117, 0.005149364471435547, 0.0057795047760009766, 0.006409645080566406, 0.007039785385131836, 0.007669925689697266, 0.008300065994262695, 0.008930206298828125, 0.009560346603393555, 0.010190486907958984, 0.010820627212524414, 0.011450767517089844, 0.012080907821655273, 0.012711048126220703, 0.013341188430786133, 0.013971328735351562, 0.014601469039916992, 0.015231609344482422, 0.01586174964904785, 0.01649188995361328, 0.01712203025817871, 0.01775217056274414, 0.01838231086730957, 0.019012451171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 3.0, 10.0, 5.0, 12.0, 18.0, 29.0, 29.0, 38.0, 57.0, 54.0, 83.0, 98.0, 160.0, 230.0, 392.0, 752.0, 2036.0, 8744.0, 192843.0, 3968594.0, 15012.0, 2753.0, 976.0, 412.0, 268.0, 188.0, 119.0, 77.0, 60.0, 43.0, 41.0, 35.0, 29.0, 25.0, 15.0, 9.0, 6.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.025604248046875, -0.02478170394897461, -0.02395915985107422, -0.023136615753173828, -0.022314071655273438, -0.021491527557373047, -0.020668983459472656, -0.019846439361572266, -0.019023895263671875, -0.018201351165771484, -0.017378807067871094, -0.016556262969970703, -0.015733718872070312, -0.014911174774169922, -0.014088630676269531, -0.01326608657836914, -0.01244354248046875, -0.01162099838256836, -0.010798454284667969, -0.009975910186767578, -0.009153366088867188, -0.008330821990966797, -0.007508277893066406, -0.006685733795166016, -0.005863189697265625, -0.005040645599365234, -0.004218101501464844, -0.003395557403564453, -0.0025730133056640625, -0.0017504692077636719, -0.0009279251098632812, -0.00010538101196289062, 0.0007171630859375, 0.0015397071838378906, 0.0023622512817382812, 0.003184795379638672, 0.0040073394775390625, 0.004829883575439453, 0.005652427673339844, 0.006474971771240234, 0.007297515869140625, 0.008120059967041016, 0.008942604064941406, 0.009765148162841797, 0.010587692260742188, 0.011410236358642578, 0.012232780456542969, 0.01305532455444336, 0.01387786865234375, 0.01470041275024414, 0.015522956848144531, 0.016345500946044922, 0.017168045043945312, 0.017990589141845703, 0.018813133239746094, 0.019635677337646484, 0.020458221435546875, 0.021280765533447266, 0.022103309631347656, 0.022925853729248047, 0.023748397827148438, 0.024570941925048828, 0.02539348602294922, 0.02621603012084961, 0.02703857421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 22.0, 50.0, 219.0, 3615.0, 110.0, 25.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006000518798828125, -0.0057433247566223145, -0.005486130714416504, -0.005228936672210693, -0.004971742630004883, -0.004714548587799072, -0.004457354545593262, -0.004200160503387451, -0.003942966461181641, -0.00368577241897583, -0.0034285783767700195, -0.003171384334564209, -0.0029141902923583984, -0.002656996250152588, -0.0023998022079467773, -0.002142608165740967, -0.0018854141235351562, -0.0016282200813293457, -0.0013710260391235352, -0.0011138319969177246, -0.0008566379547119141, -0.0005994439125061035, -0.00034224987030029297, -8.505582809448242e-05, 0.00017213821411132812, 0.00042933225631713867, 0.0006865262985229492, 0.0009437203407287598, 0.0012009143829345703, 0.0014581084251403809, 0.0017153024673461914, 0.001972496509552002, 0.0022296905517578125, 0.002486884593963623, 0.0027440786361694336, 0.003001272678375244, 0.0032584667205810547, 0.0035156607627868652, 0.0037728548049926758, 0.004030048847198486, 0.004287242889404297, 0.004544436931610107, 0.004801630973815918, 0.0050588250160217285, 0.005316019058227539, 0.00557321310043335, 0.00583040714263916, 0.006087601184844971, 0.006344795227050781, 0.006601989269256592, 0.006859183311462402, 0.007116377353668213, 0.0073735713958740234, 0.007630765438079834, 0.007887959480285645, 0.008145153522491455, 0.008402347564697266, 0.008659541606903076, 0.008916735649108887, 0.009173929691314697, 0.009431123733520508, 0.009688317775726318, 0.009945511817932129, 0.01020270586013794, 0.01045989990234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 17.0, 29.0, 168.0, 386.0, 278.0, 86.0, 22.0, 11.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.08268772065639496, -0.08115063607692719, -0.07961354404687881, -0.07807645946741104, -0.07653936743736267, -0.0750022828578949, -0.07346519827842712, -0.07192810624837875, -0.07039102166891098, -0.0688539370894432, -0.06731684505939484, -0.06577976047992706, -0.06424266844987869, -0.06270558387041092, -0.06116849556565285, -0.059631407260894775, -0.058094315230846405, -0.05655722692608833, -0.05502013862133026, -0.05348305404186249, -0.051945965737104416, -0.050408877432346344, -0.04887178912758827, -0.0473347008228302, -0.04579761624336243, -0.044260527938604355, -0.04272343963384628, -0.04118635505437851, -0.03964926674962044, -0.038112178444862366, -0.036575090140104294, -0.03503800183534622, -0.03350091353058815, -0.03196382522583008, -0.030426738783717155, -0.028889650478959084, -0.02735256217420101, -0.02581547573208809, -0.024278387427330017, -0.022741299122571945, -0.021204210817813873, -0.0196671225130558, -0.01813003607094288, -0.016592947766184807, -0.015055859461426735, -0.013518772087991238, -0.01198168471455574, -0.010444596409797668, -0.008907509967684746, -0.007370422128587961, -0.005833334289491177, -0.004296246916055679, -0.0027591590769588947, -0.0012220712378621101, 0.00031501613557338715, 0.001852104440331459, 0.0033891918137669563, 0.004926279652863741, 0.0064633674919605255, 0.008000454865396023, 0.00953754223883152, 0.011074630543589592, 0.01261171791702509, 0.014148806221783161, 0.01568589359521866]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 10.0, 13.0, 12.0, 23.0, 19.0, 25.0, 21.0, 31.0, 44.0, 31.0, 32.0, 47.0, 54.0, 59.0, 36.0, 50.0, 48.0, 53.0, 48.0, 43.0, 38.0, 28.0, 42.0, 26.0, 20.0, 23.0, 18.0, 16.0, 15.0, 16.0, 9.0, 6.0, 5.0, 5.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00836944580078125, -0.00805980060249567, -0.007750155404210091, -0.007440510205924511, -0.007130865007638931, -0.006821219809353352, -0.006511574611067772, -0.006201929412782192, -0.0058922842144966125, -0.005582639016211033, -0.005272993817925453, -0.0049633486196398735, -0.004653703421354294, -0.004344058223068714, -0.0040344130247831345, -0.0037247678264975548, -0.003415122628211975, -0.0031054774299263954, -0.0027958322316408157, -0.002486187033355236, -0.0021765418350696564, -0.0018668966367840767, -0.001557251438498497, -0.0012476062402129173, -0.0009379610419273376, -0.000628315843641758, -0.0003186706453561783, -9.025447070598602e-06, 0.0003006197512149811, 0.0006102649495005608, 0.0009199101477861404, 0.0012295553460717201, 0.0015392005443572998, 0.0018488457426428795, 0.002158490940928459, 0.002468136139214039, 0.0027777813374996185, 0.003087426535785198, 0.003397071734070778, 0.0037067169323563576, 0.004016362130641937, 0.004326007328927517, 0.004635652527213097, 0.004945297725498676, 0.005254942923784256, 0.005564588122069836, 0.005874233320355415, 0.006183878518640995, 0.006493523716926575, 0.006803168915212154, 0.007112814113497734, 0.007422459311783314, 0.007732104510068893, 0.008041749708354473, 0.008351394906640053, 0.008661040104925632, 0.008970685303211212, 0.009280330501496792, 0.009589975699782372, 0.009899620898067951, 0.010209266096353531, 0.01051891129463911, 0.01082855649292469, 0.01113820169121027, 0.01144784688949585]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 1.0, 12.0, 11.0, 22.0, 44.0, 44.0, 80.0, 137.0, 282.0, 454.0, 911.0, 1822.0, 4261.0, 11260.0, 34344.0, 116819.0, 336060.0, 354587.0, 128848.0, 37602.0, 12302.0, 4552.0, 2056.0, 941.0, 457.0, 261.0, 151.0, 78.0, 54.0, 38.0, 17.0, 18.0, 11.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.015289306640625, -0.014796733856201172, -0.014304161071777344, -0.013811588287353516, -0.013319015502929688, -0.01282644271850586, -0.012333869934082031, -0.011841297149658203, -0.011348724365234375, -0.010856151580810547, -0.010363578796386719, -0.00987100601196289, -0.009378433227539062, -0.008885860443115234, -0.008393287658691406, -0.007900714874267578, -0.00740814208984375, -0.006915569305419922, -0.006422996520996094, -0.005930423736572266, -0.0054378509521484375, -0.004945278167724609, -0.004452705383300781, -0.003960132598876953, -0.003467559814453125, -0.002974987030029297, -0.0024824142456054688, -0.0019898414611816406, -0.0014972686767578125, -0.0010046958923339844, -0.0005121231079101562, -1.9550323486328125e-05, 0.0004730224609375, 0.0009655952453613281, 0.0014581680297851562, 0.0019507408142089844, 0.0024433135986328125, 0.0029358863830566406, 0.0034284591674804688, 0.003921031951904297, 0.004413604736328125, 0.004906177520751953, 0.005398750305175781, 0.005891323089599609, 0.0063838958740234375, 0.006876468658447266, 0.007369041442871094, 0.007861614227294922, 0.00835418701171875, 0.008846759796142578, 0.009339332580566406, 0.009831905364990234, 0.010324478149414062, 0.01081705093383789, 0.011309623718261719, 0.011802196502685547, 0.012294769287109375, 0.012787342071533203, 0.013279914855957031, 0.01377248764038086, 0.014265060424804688, 0.014757633209228516, 0.015250205993652344, 0.015742778778076172, 0.0162353515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 12.0, 14.0, 26.0, 29.0, 34.0, 50.0, 52.0, 76.0, 72.0, 69.0, 72.0, 92.0, 81.0, 66.0, 57.0, 41.0, 39.0, 30.0, 23.0, 10.0, 13.0, 3.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211334228515625, -0.02050161361694336, -0.01986980438232422, -0.019237995147705078, -0.018606185913085938, -0.017974376678466797, -0.017342567443847656, -0.016710758209228516, -0.016078948974609375, -0.015447139739990234, -0.014815330505371094, -0.014183521270751953, -0.013551712036132812, -0.012919902801513672, -0.012288093566894531, -0.01165628433227539, -0.01102447509765625, -0.01039266586303711, -0.009760856628417969, -0.009129047393798828, -0.008497238159179688, -0.007865428924560547, -0.007233619689941406, -0.006601810455322266, -0.005970001220703125, -0.005338191986083984, -0.004706382751464844, -0.004074573516845703, -0.0034427642822265625, -0.002810955047607422, -0.0021791458129882812, -0.0015473365783691406, -0.00091552734375, -0.0002837181091308594, 0.00034809112548828125, 0.0009799003601074219, 0.0016117095947265625, 0.002243518829345703, 0.0028753280639648438, 0.0035071372985839844, 0.004138946533203125, 0.004770755767822266, 0.005402565002441406, 0.006034374237060547, 0.0066661834716796875, 0.007297992706298828, 0.007929801940917969, 0.00856161117553711, 0.00919342041015625, 0.00982522964477539, 0.010457038879394531, 0.011088848114013672, 0.011720657348632812, 0.012352466583251953, 0.012984275817871094, 0.013616085052490234, 0.014247894287109375, 0.014879703521728516, 0.015511512756347656, 0.016143321990966797, 0.016775131225585938, 0.017406940460205078, 0.01803874969482422, 0.01867055892944336, 0.0193023681640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 7.0, 15.0, 13.0, 26.0, 25.0, 36.0, 31.0, 45.0, 75.0, 96.0, 145.0, 216.0, 324.0, 575.0, 1040.0, 2083.0, 4825.0, 16092.0, 102655.0, 645570.0, 232614.0, 29080.0, 6975.0, 2699.0, 1333.0, 697.0, 406.0, 218.0, 162.0, 123.0, 84.0, 63.0, 49.0, 38.0, 19.0, 23.0, 17.0, 10.0, 5.0, 11.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.0223388671875, -0.02165532112121582, -0.02097177505493164, -0.02028822898864746, -0.01960468292236328, -0.0189211368560791, -0.018237590789794922, -0.017554044723510742, -0.016870498657226562, -0.016186952590942383, -0.015503406524658203, -0.014819860458374023, -0.014136314392089844, -0.013452768325805664, -0.012769222259521484, -0.012085676193237305, -0.011402130126953125, -0.010718584060668945, -0.010035037994384766, -0.009351491928100586, -0.008667945861816406, -0.007984399795532227, -0.007300853729248047, -0.006617307662963867, -0.0059337615966796875, -0.005250215530395508, -0.004566669464111328, -0.0038831233978271484, -0.0031995773315429688, -0.002516031265258789, -0.0018324851989746094, -0.0011489391326904297, -0.00046539306640625, 0.0002181529998779297, 0.0009016990661621094, 0.001585245132446289, 0.0022687911987304688, 0.0029523372650146484, 0.003635883331298828, 0.004319429397583008, 0.0050029754638671875, 0.005686521530151367, 0.006370067596435547, 0.0070536136627197266, 0.007737159729003906, 0.008420705795288086, 0.009104251861572266, 0.009787797927856445, 0.010471343994140625, 0.011154890060424805, 0.011838436126708984, 0.012521982192993164, 0.013205528259277344, 0.013889074325561523, 0.014572620391845703, 0.015256166458129883, 0.015939712524414062, 0.016623258590698242, 0.017306804656982422, 0.0179903507232666, 0.01867389678955078, 0.01935744285583496, 0.02004098892211914, 0.02072453498840332, 0.0214080810546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 11.0, 7.0, 16.0, 14.0, 17.0, 29.0, 21.0, 40.0, 32.0, 39.0, 43.0, 40.0, 62.0, 65.0, 49.0, 44.0, 53.0, 60.0, 47.0, 56.0, 41.0, 38.0, 26.0, 22.0, 28.0, 16.0, 18.0, 11.0, 12.0, 7.0, 10.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055084228515625, -0.053281307220458984, -0.05147838592529297, -0.04967546463012695, -0.04787254333496094, -0.04606962203979492, -0.044266700744628906, -0.04246377944946289, -0.040660858154296875, -0.03885793685913086, -0.037055015563964844, -0.03525209426879883, -0.03344917297363281, -0.0316462516784668, -0.02984333038330078, -0.028040409088134766, -0.02623748779296875, -0.024434566497802734, -0.02263164520263672, -0.020828723907470703, -0.019025802612304688, -0.017222881317138672, -0.015419960021972656, -0.01361703872680664, -0.011814117431640625, -0.01001119613647461, -0.008208274841308594, -0.006405353546142578, -0.0046024322509765625, -0.002799510955810547, -0.0009965896606445312, 0.0008063316345214844, 0.0026092529296875, 0.004412174224853516, 0.006215095520019531, 0.008018016815185547, 0.009820938110351562, 0.011623859405517578, 0.013426780700683594, 0.01522970199584961, 0.017032623291015625, 0.01883554458618164, 0.020638465881347656, 0.022441387176513672, 0.024244308471679688, 0.026047229766845703, 0.02785015106201172, 0.029653072357177734, 0.03145599365234375, 0.033258914947509766, 0.03506183624267578, 0.0368647575378418, 0.03866767883300781, 0.04047060012817383, 0.042273521423339844, 0.04407644271850586, 0.045879364013671875, 0.04768228530883789, 0.049485206604003906, 0.05128812789916992, 0.05309104919433594, 0.05489397048950195, 0.05669689178466797, 0.058499813079833984, 0.060302734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 3.0, 4.0, 10.0, 12.0, 16.0, 16.0, 22.0, 35.0, 72.0, 87.0, 168.0, 353.0, 857.0, 2637.0, 12928.0, 956717.0, 66895.0, 5024.0, 1455.0, 563.0, 284.0, 120.0, 90.0, 56.0, 42.0, 20.0, 17.0, 14.0, 5.0, 7.0, 3.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0258636474609375, -0.02493119239807129, -0.023998737335205078, -0.023066282272338867, -0.022133827209472656, -0.021201372146606445, -0.020268917083740234, -0.019336462020874023, -0.018404006958007812, -0.0174715518951416, -0.01653909683227539, -0.01560664176940918, -0.014674186706542969, -0.013741731643676758, -0.012809276580810547, -0.011876821517944336, -0.010944366455078125, -0.010011911392211914, -0.009079456329345703, -0.008147001266479492, -0.007214546203613281, -0.00628209114074707, -0.005349636077880859, -0.0044171810150146484, -0.0034847259521484375, -0.0025522708892822266, -0.0016198158264160156, -0.0006873607635498047, 0.00024509429931640625, 0.0011775493621826172, 0.002110004425048828, 0.003042459487915039, 0.00397491455078125, 0.004907369613647461, 0.005839824676513672, 0.006772279739379883, 0.007704734802246094, 0.008637189865112305, 0.009569644927978516, 0.010502099990844727, 0.011434555053710938, 0.012367010116577148, 0.01329946517944336, 0.01423192024230957, 0.015164375305175781, 0.016096830368041992, 0.017029285430908203, 0.017961740493774414, 0.018894195556640625, 0.019826650619506836, 0.020759105682373047, 0.021691560745239258, 0.02262401580810547, 0.02355647087097168, 0.02448892593383789, 0.0254213809967041, 0.026353836059570312, 0.027286291122436523, 0.028218746185302734, 0.029151201248168945, 0.030083656311035156, 0.031016111373901367, 0.03194856643676758, 0.03288102149963379, 0.0338134765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 7.0, 4.0, 5.0, 14.0, 6.0, 10.0, 15.0, 24.0, 32.0, 38.0, 41.0, 46.0, 65.0, 74.0, 88.0, 87.0, 92.0, 61.0, 55.0, 35.0, 34.0, 28.0, 17.0, 13.0, 15.0, 13.0, 10.0, 11.0, 5.0, 9.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0], "bins": [-3.415346145629883e-05, -3.3204443752765656e-05, -3.225542604923248e-05, -3.130640834569931e-05, -3.0357390642166138e-05, -2.9408372938632965e-05, -2.8459355235099792e-05, -2.751033753156662e-05, -2.6561319828033447e-05, -2.5612302124500275e-05, -2.4663284420967102e-05, -2.371426671743393e-05, -2.2765249013900757e-05, -2.1816231310367584e-05, -2.086721360683441e-05, -1.991819590330124e-05, -1.8969178199768066e-05, -1.8020160496234894e-05, -1.707114279270172e-05, -1.612212508916855e-05, -1.5173107385635376e-05, -1.4224089682102203e-05, -1.327507197856903e-05, -1.2326054275035858e-05, -1.1377036571502686e-05, -1.0428018867969513e-05, -9.47900116443634e-06, -8.529983460903168e-06, -7.580965757369995e-06, -6.6319480538368225e-06, -5.68293035030365e-06, -4.733912646770477e-06, -3.7848949432373047e-06, -2.835877239704132e-06, -1.8868595361709595e-06, -9.378418326377869e-07, 1.1175870895385742e-08, 9.601935744285583e-07, 1.909211277961731e-06, 2.8582289814949036e-06, 3.807246685028076e-06, 4.756264388561249e-06, 5.705282092094421e-06, 6.654299795627594e-06, 7.603317499160767e-06, 8.55233520269394e-06, 9.501352906227112e-06, 1.0450370609760284e-05, 1.1399388313293457e-05, 1.234840601682663e-05, 1.3297423720359802e-05, 1.4246441423892975e-05, 1.5195459127426147e-05, 1.614447683095932e-05, 1.7093494534492493e-05, 1.8042512238025665e-05, 1.8991529941558838e-05, 1.994054764509201e-05, 2.0889565348625183e-05, 2.1838583052158356e-05, 2.278760075569153e-05, 2.37366184592247e-05, 2.4685636162757874e-05, 2.5634653866291046e-05, 2.658367156982422e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 9.0, 12.0, 8.0, 16.0, 20.0, 25.0, 38.0, 44.0, 76.0, 119.0, 199.0, 322.0, 537.0, 1029.0, 2171.0, 5521.0, 29212.0, 896666.0, 97984.0, 8549.0, 2874.0, 1321.0, 715.0, 400.0, 243.0, 152.0, 79.0, 56.0, 41.0, 23.0, 21.0, 19.0, 10.0, 5.0, 2.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01690673828125, -0.016317129135131836, -0.015727519989013672, -0.015137910842895508, -0.014548301696777344, -0.01395869255065918, -0.013369083404541016, -0.012779474258422852, -0.012189865112304688, -0.011600255966186523, -0.01101064682006836, -0.010421037673950195, -0.009831428527832031, -0.009241819381713867, -0.008652210235595703, -0.008062601089477539, -0.007472991943359375, -0.006883382797241211, -0.006293773651123047, -0.005704164505004883, -0.005114555358886719, -0.004524946212768555, -0.003935337066650391, -0.0033457279205322266, -0.0027561187744140625, -0.0021665096282958984, -0.0015769004821777344, -0.0009872913360595703, -0.00039768218994140625, 0.0001919269561767578, 0.0007815361022949219, 0.001371145248413086, 0.00196075439453125, 0.002550363540649414, 0.003139972686767578, 0.003729581832885742, 0.004319190979003906, 0.00490880012512207, 0.005498409271240234, 0.0060880184173583984, 0.0066776275634765625, 0.0072672367095947266, 0.00785684585571289, 0.008446455001831055, 0.009036064147949219, 0.009625673294067383, 0.010215282440185547, 0.010804891586303711, 0.011394500732421875, 0.011984109878540039, 0.012573719024658203, 0.013163328170776367, 0.013752937316894531, 0.014342546463012695, 0.01493215560913086, 0.015521764755249023, 0.016111373901367188, 0.01670098304748535, 0.017290592193603516, 0.01788020133972168, 0.018469810485839844, 0.019059419631958008, 0.019649028778076172, 0.020238637924194336, 0.0208282470703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 21.0, 43.0, 70.0, 159.0, 199.0, 190.0, 117.0, 55.0, 42.0, 15.0, 15.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.029052734375, -0.028322696685791016, -0.02759265899658203, -0.026862621307373047, -0.026132583618164062, -0.025402545928955078, -0.024672508239746094, -0.02394247055053711, -0.023212432861328125, -0.02248239517211914, -0.021752357482910156, -0.021022319793701172, -0.020292282104492188, -0.019562244415283203, -0.01883220672607422, -0.018102169036865234, -0.01737213134765625, -0.016642093658447266, -0.01591205596923828, -0.015182018280029297, -0.014451980590820312, -0.013721942901611328, -0.012991905212402344, -0.01226186752319336, -0.011531829833984375, -0.01080179214477539, -0.010071754455566406, -0.009341716766357422, -0.008611679077148438, -0.007881641387939453, -0.007151603698730469, -0.006421566009521484, -0.0056915283203125, -0.004961490631103516, -0.004231452941894531, -0.003501415252685547, -0.0027713775634765625, -0.002041339874267578, -0.0013113021850585938, -0.0005812644958496094, 0.000148773193359375, 0.0008788108825683594, 0.0016088485717773438, 0.002338886260986328, 0.0030689239501953125, 0.003798961639404297, 0.004528999328613281, 0.005259037017822266, 0.00598907470703125, 0.006719112396240234, 0.007449150085449219, 0.008179187774658203, 0.008909225463867188, 0.009639263153076172, 0.010369300842285156, 0.01109933853149414, 0.011829376220703125, 0.01255941390991211, 0.013289451599121094, 0.014019489288330078, 0.014749526977539062, 0.015479564666748047, 0.01620960235595703, 0.016939640045166016, 0.017669677734375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 8.0, 25.0, 87.0, 199.0, 301.0, 245.0, 80.0, 34.0, 17.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33140426874160767, -0.3185504376888275, -0.30569660663604736, -0.2928428053855896, -0.27998897433280945, -0.2671351432800293, -0.25428131222724915, -0.241427481174469, -0.22857366502285004, -0.21571983397006989, -0.20286601781845093, -0.19001218676567078, -0.17715835571289062, -0.16430453956127167, -0.15145070850849152, -0.13859689235687256, -0.1257430613040924, -0.11288923770189285, -0.1000354140996933, -0.08718158304691315, -0.07432775944471359, -0.06147393584251404, -0.04862010478973389, -0.03576628118753433, -0.022912457585334778, -0.010058632120490074, 0.0027951933443546295, 0.015649020671844482, 0.028502844274044037, 0.04135666787624359, 0.05421049892902374, 0.0670643225312233, 0.07991817593574524, 0.0927719995379448, 0.10562582314014435, 0.1184796541929245, 0.13133347034454346, 0.1441873013973236, 0.15704113245010376, 0.1698949635028839, 0.18274877965450287, 0.19560261070728302, 0.20845642685890198, 0.22131025791168213, 0.23416408896446228, 0.24701790511608124, 0.2598717212677002, 0.27272555232048035, 0.2855793833732605, 0.29843321442604065, 0.3112870454788208, 0.32414084672927856, 0.3369946777820587, 0.34984850883483887, 0.362702339887619, 0.37555617094039917, 0.38840997219085693, 0.4012638032436371, 0.41411763429641724, 0.426971435546875, 0.43982526659965515, 0.4526790976524353, 0.46553292870521545, 0.4783867597579956, 0.49124059081077576]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 2.0, 5.0, 7.0, 16.0, 7.0, 12.0, 17.0, 12.0, 21.0, 19.0, 30.0, 36.0, 32.0, 37.0, 41.0, 39.0, 41.0, 48.0, 38.0, 43.0, 40.0, 42.0, 52.0, 46.0, 30.0, 27.0, 27.0, 33.0, 24.0, 25.0, 22.0, 20.0, 12.0, 16.0, 12.0, 16.0, 15.0, 7.0, 3.0, 6.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.22798937559127808, -0.22182203829288483, -0.21565470099449158, -0.20948734879493713, -0.20332001149654388, -0.19715267419815063, -0.1909853219985962, -0.18481798470020294, -0.1786506474018097, -0.17248331010341644, -0.1663159728050232, -0.16014862060546875, -0.1539812833070755, -0.14781394600868225, -0.1416465938091278, -0.13547925651073456, -0.1293119192123413, -0.12314458191394806, -0.11697723716497421, -0.11080989241600037, -0.10464255511760712, -0.09847521781921387, -0.09230787307024002, -0.08614052832126617, -0.07997319102287292, -0.07380585372447968, -0.06763850897550583, -0.06147116795182228, -0.05530382692813873, -0.049136485904455185, -0.04296914488077164, -0.03680180385708809, -0.03063446283340454, -0.024467121809720993, -0.018299780786037445, -0.012132439762353897, -0.005965098738670349, 0.00020224228501319885, 0.006369583308696747, 0.012536924332380295, 0.018704265356063843, 0.02487160637974739, 0.03103894740343094, 0.03720628842711449, 0.043373629450798035, 0.04954097047448158, 0.05570831149816513, 0.06187565252184868, 0.06804299354553223, 0.07421033084392548, 0.08037767559289932, 0.08654502034187317, 0.09271235764026642, 0.09887969493865967, 0.10504703968763351, 0.11121438443660736, 0.11738172173500061, 0.12354905903339386, 0.1297163963317871, 0.13588374853134155, 0.1420510858297348, 0.14821842312812805, 0.1543857753276825, 0.16055311262607574, 0.166720449924469]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 5.0, 5.0, 20.0, 20.0, 39.0, 64.0, 68.0, 101.0, 167.0, 272.0, 511.0, 939.0, 2105.0, 5938.0, 32111.0, 3998030.0, 136628.0, 11089.0, 3199.0, 1308.0, 634.0, 343.0, 247.0, 142.0, 87.0, 59.0, 44.0, 33.0, 19.0, 7.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0267486572265625, -0.025878190994262695, -0.02500772476196289, -0.024137258529663086, -0.02326679229736328, -0.022396326065063477, -0.021525859832763672, -0.020655393600463867, -0.019784927368164062, -0.018914461135864258, -0.018043994903564453, -0.01717352867126465, -0.016303062438964844, -0.015432596206665039, -0.014562129974365234, -0.01369166374206543, -0.012821197509765625, -0.01195073127746582, -0.011080265045166016, -0.010209798812866211, -0.009339332580566406, -0.008468866348266602, -0.007598400115966797, -0.006727933883666992, -0.0058574676513671875, -0.004987001419067383, -0.004116535186767578, -0.0032460689544677734, -0.0023756027221679688, -0.001505136489868164, -0.0006346702575683594, 0.0002357959747314453, 0.00110626220703125, 0.0019767284393310547, 0.0028471946716308594, 0.003717660903930664, 0.004588127136230469, 0.0054585933685302734, 0.006329059600830078, 0.007199525833129883, 0.008069992065429688, 0.008940458297729492, 0.009810924530029297, 0.010681390762329102, 0.011551856994628906, 0.012422323226928711, 0.013292789459228516, 0.01416325569152832, 0.015033721923828125, 0.01590418815612793, 0.016774654388427734, 0.01764512062072754, 0.018515586853027344, 0.01938605308532715, 0.020256519317626953, 0.021126985549926758, 0.021997451782226562, 0.022867918014526367, 0.023738384246826172, 0.024608850479125977, 0.02547931671142578, 0.026349782943725586, 0.02722024917602539, 0.028090715408325195, 0.028961181640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 12.0, 18.0, 29.0, 27.0, 48.0, 47.0, 50.0, 79.0, 79.0, 74.0, 100.0, 92.0, 84.0, 61.0, 40.0, 41.0, 33.0, 23.0, 9.0, 11.0, 5.0, 2.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0227203369140625, -0.022068023681640625, -0.02141571044921875, -0.020763397216796875, -0.020111083984375, -0.019458770751953125, -0.01880645751953125, -0.018154144287109375, -0.0175018310546875, -0.016849517822265625, -0.01619720458984375, -0.015544891357421875, -0.014892578125, -0.014240264892578125, -0.01358795166015625, -0.012935638427734375, -0.0122833251953125, -0.011631011962890625, -0.01097869873046875, -0.010326385498046875, -0.009674072265625, -0.009021759033203125, -0.00836944580078125, -0.007717132568359375, -0.0070648193359375, -0.006412506103515625, -0.00576019287109375, -0.005107879638671875, -0.00445556640625, -0.003803253173828125, -0.00315093994140625, -0.002498626708984375, -0.0018463134765625, -0.001194000244140625, -0.00054168701171875, 0.000110626220703125, 0.000762939453125, 0.001415252685546875, 0.00206756591796875, 0.002719879150390625, 0.0033721923828125, 0.004024505615234375, 0.00467681884765625, 0.005329132080078125, 0.0059814453125, 0.006633758544921875, 0.00728607177734375, 0.007938385009765625, 0.0085906982421875, 0.009243011474609375, 0.00989532470703125, 0.010547637939453125, 0.011199951171875, 0.011852264404296875, 0.01250457763671875, 0.013156890869140625, 0.0138092041015625, 0.014461517333984375, 0.01511383056640625, 0.015766143798828125, 0.01641845703125, 0.017070770263671875, 0.01772308349609375, 0.018375396728515625, 0.0190277099609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 21.0, 23.0, 40.0, 65.0, 73.0, 110.0, 142.0, 203.0, 210.0, 294.0, 487.0, 1328.0, 32793.0, 4153126.0, 3163.0, 716.0, 434.0, 273.0, 210.0, 150.0, 116.0, 74.0, 72.0, 55.0, 26.0, 27.0, 17.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11514568328857422, -0.11133384704589844, -0.10752201080322266, -0.10371017456054688, -0.0998983383178711, -0.09608650207519531, -0.09227466583251953, -0.08846282958984375, -0.08465099334716797, -0.08083915710449219, -0.0770273208618164, -0.07321548461914062, -0.06940364837646484, -0.06559181213378906, -0.06177997589111328, -0.0579681396484375, -0.05415630340576172, -0.05034446716308594, -0.046532630920410156, -0.042720794677734375, -0.038908958435058594, -0.03509712219238281, -0.03128528594970703, -0.02747344970703125, -0.02366161346435547, -0.019849777221679688, -0.016037940979003906, -0.012226104736328125, -0.008414268493652344, -0.0046024322509765625, -0.0007905960083007812, 0.003021240234375, 0.006833076477050781, 0.010644912719726562, 0.014456748962402344, 0.018268585205078125, 0.022080421447753906, 0.025892257690429688, 0.02970409393310547, 0.03351593017578125, 0.03732776641845703, 0.04113960266113281, 0.044951438903808594, 0.048763275146484375, 0.052575111389160156, 0.05638694763183594, 0.06019878387451172, 0.0640106201171875, 0.06782245635986328, 0.07163429260253906, 0.07544612884521484, 0.07925796508789062, 0.0830698013305664, 0.08688163757324219, 0.09069347381591797, 0.09450531005859375, 0.09831714630126953, 0.10212898254394531, 0.1059408187866211, 0.10975265502929688, 0.11356449127197266, 0.11737632751464844, 0.12118816375732422, 0.125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 15.0, 359.0, 3670.0, 25.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046875, -0.04465484619140625, -0.0424346923828125, -0.04021453857421875, -0.037994384765625, -0.03577423095703125, -0.0335540771484375, -0.03133392333984375, -0.02911376953125, -0.02689361572265625, -0.0246734619140625, -0.02245330810546875, -0.020233154296875, -0.01801300048828125, -0.0157928466796875, -0.01357269287109375, -0.0113525390625, -0.00913238525390625, -0.0069122314453125, -0.00469207763671875, -0.002471923828125, -0.00025177001953125, 0.0019683837890625, 0.00418853759765625, 0.00640869140625, 0.00862884521484375, 0.0108489990234375, 0.01306915283203125, 0.015289306640625, 0.01750946044921875, 0.0197296142578125, 0.02194976806640625, 0.024169921875, 0.02639007568359375, 0.0286102294921875, 0.03083038330078125, 0.033050537109375, 0.03527069091796875, 0.0374908447265625, 0.03971099853515625, 0.04193115234375, 0.04415130615234375, 0.0463714599609375, 0.04859161376953125, 0.050811767578125, 0.05303192138671875, 0.0552520751953125, 0.05747222900390625, 0.0596923828125, 0.06191253662109375, 0.0641326904296875, 0.06635284423828125, 0.068572998046875, 0.07079315185546875, 0.0730133056640625, 0.07523345947265625, 0.07745361328125, 0.07967376708984375, 0.0818939208984375, 0.08411407470703125, 0.086334228515625, 0.08855438232421875, 0.0907745361328125, 0.09299468994140625, 0.09521484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 12.0, 29.0, 109.0, 359.0, 375.0, 96.0, 23.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15574894845485687, -0.1479724645614624, -0.14019599556922913, -0.13241951167583466, -0.12464303523302078, -0.11686655879020691, -0.10909007489681244, -0.10131359845399857, -0.09353712201118469, -0.08576064556837082, -0.07798416912555695, -0.07020768523216248, -0.0624312087893486, -0.05465473234653473, -0.04687825217843056, -0.039101772010326385, -0.03132529556751251, -0.02354881726205349, -0.015772338956594467, -0.007995860651135445, -0.00021938234567642212, 0.007557094097137451, 0.015333574265241623, 0.023110054433345795, 0.030886530876159668, 0.03866300731897354, 0.04643948748707771, 0.054215967655181885, 0.06199244409799576, 0.06976892054080963, 0.0775454044342041, 0.08532188087701797, 0.09309834241867065, 0.10087481886148453, 0.1086512953042984, 0.11642777919769287, 0.12420425564050674, 0.13198073208332062, 0.1397572159767151, 0.14753368496894836, 0.15531016886234283, 0.1630866527557373, 0.17086312174797058, 0.17863960564136505, 0.18641608953475952, 0.1941925585269928, 0.20196904242038727, 0.20974552631378174, 0.21752199530601501, 0.22529847919940948, 0.23307494819164276, 0.24085143208503723, 0.2486279010772705, 0.25640439987182617, 0.26418086886405945, 0.2719573378562927, 0.2797338366508484, 0.28751030564308167, 0.29528680443763733, 0.3030632734298706, 0.3108397424221039, 0.31861621141433716, 0.3263927102088928, 0.3341691792011261, 0.3419456481933594]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 6.0, 5.0, 13.0, 18.0, 23.0, 31.0, 40.0, 50.0, 77.0, 112.0, 118.0, 101.0, 103.0, 79.0, 72.0, 59.0, 28.0, 24.0, 19.0, 10.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15625214576721191, -0.15150687098503113, -0.14676161110401154, -0.14201635122299194, -0.13727107644081116, -0.13252580165863037, -0.12778054177761078, -0.12303527444601059, -0.1182900071144104, -0.11354473978281021, -0.10879947245121002, -0.10405420511960983, -0.09930893778800964, -0.09456367045640945, -0.08981840312480927, -0.08507313579320908, -0.08032786846160889, -0.0755826011300087, -0.07083733379840851, -0.06609206646680832, -0.06134679913520813, -0.05660153180360794, -0.05185626447200775, -0.04711099714040756, -0.04236572980880737, -0.037620462477207184, -0.032875195145606995, -0.028129927814006805, -0.023384660482406616, -0.018639393150806427, -0.013894125819206238, -0.009148858487606049, -0.004403591156005859, 0.00034167617559432983, 0.005086943507194519, 0.009832210838794708, 0.014577478170394897, 0.019322745501995087, 0.024068012833595276, 0.028813280165195465, 0.033558547496795654, 0.038303814828395844, 0.04304908215999603, 0.04779434949159622, 0.05253961682319641, 0.0572848841547966, 0.06203015148639679, 0.06677541881799698, 0.07152068614959717, 0.07626595348119736, 0.08101122081279755, 0.08575648814439774, 0.09050175547599792, 0.09524702280759811, 0.0999922901391983, 0.10473755747079849, 0.10948282480239868, 0.11422809213399887, 0.11897335946559906, 0.12371862679719925, 0.12846389412879944, 0.13320916891098022, 0.13795442879199982, 0.1426996886730194, 0.1474449634552002]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 20.0, 21.0, 24.0, 72.0, 104.0, 195.0, 418.0, 1136.0, 3616.0, 14175.0, 75503.0, 485147.0, 394254.0, 57793.0, 11268.0, 2979.0, 1030.0, 397.0, 169.0, 94.0, 45.0, 27.0, 21.0, 16.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02947998046875, -0.028526782989501953, -0.027573585510253906, -0.02662038803100586, -0.025667190551757812, -0.024713993072509766, -0.02376079559326172, -0.022807598114013672, -0.021854400634765625, -0.020901203155517578, -0.01994800567626953, -0.018994808197021484, -0.018041610717773438, -0.01708841323852539, -0.016135215759277344, -0.015182018280029297, -0.01422882080078125, -0.013275623321533203, -0.012322425842285156, -0.01136922836303711, -0.010416030883789062, -0.009462833404541016, -0.008509635925292969, -0.007556438446044922, -0.006603240966796875, -0.005650043487548828, -0.004696846008300781, -0.0037436485290527344, -0.0027904510498046875, -0.0018372535705566406, -0.0008840560913085938, 6.914138793945312e-05, 0.0010223388671875, 0.001975536346435547, 0.0029287338256835938, 0.0038819313049316406, 0.0048351287841796875, 0.005788326263427734, 0.006741523742675781, 0.007694721221923828, 0.008647918701171875, 0.009601116180419922, 0.010554313659667969, 0.011507511138916016, 0.012460708618164062, 0.01341390609741211, 0.014367103576660156, 0.015320301055908203, 0.01627349853515625, 0.017226696014404297, 0.018179893493652344, 0.01913309097290039, 0.020086288452148438, 0.021039485931396484, 0.02199268341064453, 0.022945880889892578, 0.023899078369140625, 0.024852275848388672, 0.02580547332763672, 0.026758670806884766, 0.027711868286132812, 0.02866506576538086, 0.029618263244628906, 0.030571460723876953, 0.031524658203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 4.0, 4.0, 8.0, 12.0, 21.0, 21.0, 31.0, 47.0, 49.0, 67.0, 64.0, 89.0, 82.0, 81.0, 76.0, 73.0, 62.0, 42.0, 43.0, 33.0, 28.0, 12.0, 12.0, 7.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02520751953125, -0.024524927139282227, -0.023842334747314453, -0.02315974235534668, -0.022477149963378906, -0.021794557571411133, -0.02111196517944336, -0.020429372787475586, -0.019746780395507812, -0.01906418800354004, -0.018381595611572266, -0.017699003219604492, -0.01701641082763672, -0.016333818435668945, -0.015651226043701172, -0.014968633651733398, -0.014286041259765625, -0.013603448867797852, -0.012920856475830078, -0.012238264083862305, -0.011555671691894531, -0.010873079299926758, -0.010190486907958984, -0.009507894515991211, -0.008825302124023438, -0.008142709732055664, -0.007460117340087891, -0.006777524948120117, -0.006094932556152344, -0.00541234016418457, -0.004729747772216797, -0.0040471553802490234, -0.00336456298828125, -0.0026819705963134766, -0.001999378204345703, -0.0013167858123779297, -0.0006341934204101562, 4.839897155761719e-05, 0.0007309913635253906, 0.001413583755493164, 0.0020961761474609375, 0.002778768539428711, 0.0034613609313964844, 0.004143953323364258, 0.004826545715332031, 0.005509138107299805, 0.006191730499267578, 0.0068743228912353516, 0.007556915283203125, 0.008239507675170898, 0.008922100067138672, 0.009604692459106445, 0.010287284851074219, 0.010969877243041992, 0.011652469635009766, 0.012335062026977539, 0.013017654418945312, 0.013700246810913086, 0.01438283920288086, 0.015065431594848633, 0.015748023986816406, 0.01643061637878418, 0.017113208770751953, 0.017795801162719727, 0.0184783935546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 15.0, 25.0, 58.0, 91.0, 251.0, 635.0, 1983.0, 19666.0, 934283.0, 86281.0, 3646.0, 964.0, 346.0, 147.0, 68.0, 32.0, 16.0, 9.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0780029296875, -0.07568645477294922, -0.07336997985839844, -0.07105350494384766, -0.06873703002929688, -0.0664205551147461, -0.06410408020019531, -0.06178760528564453, -0.05947113037109375, -0.05715465545654297, -0.05483818054199219, -0.052521705627441406, -0.050205230712890625, -0.047888755798339844, -0.04557228088378906, -0.04325580596923828, -0.0409393310546875, -0.03862285614013672, -0.03630638122558594, -0.033989906311035156, -0.031673431396484375, -0.029356956481933594, -0.027040481567382812, -0.02472400665283203, -0.02240753173828125, -0.02009105682373047, -0.017774581909179688, -0.015458106994628906, -0.013141632080078125, -0.010825157165527344, -0.008508682250976562, -0.006192207336425781, -0.003875732421875, -0.0015592575073242188, 0.0007572174072265625, 0.0030736923217773438, 0.005390167236328125, 0.007706642150878906, 0.010023117065429688, 0.012339591979980469, 0.01465606689453125, 0.01697254180908203, 0.019289016723632812, 0.021605491638183594, 0.023921966552734375, 0.026238441467285156, 0.028554916381835938, 0.03087139129638672, 0.0331878662109375, 0.03550434112548828, 0.03782081604003906, 0.040137290954589844, 0.042453765869140625, 0.044770240783691406, 0.04708671569824219, 0.04940319061279297, 0.05171966552734375, 0.05403614044189453, 0.05635261535644531, 0.058669090270996094, 0.060985565185546875, 0.06330204010009766, 0.06561851501464844, 0.06793498992919922, 0.07025146484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 9.0, 11.0, 27.0, 42.0, 39.0, 68.0, 79.0, 113.0, 87.0, 102.0, 86.0, 70.0, 80.0, 55.0, 58.0, 29.0, 25.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.075439453125, -0.07217597961425781, -0.06891250610351562, -0.06564903259277344, -0.06238555908203125, -0.05912208557128906, -0.055858612060546875, -0.05259513854980469, -0.0493316650390625, -0.04606819152832031, -0.042804718017578125, -0.03954124450683594, -0.03627777099609375, -0.03301429748535156, -0.029750823974609375, -0.026487350463867188, -0.023223876953125, -0.019960403442382812, -0.016696929931640625, -0.013433456420898438, -0.01016998291015625, -0.0069065093994140625, -0.003643035888671875, -0.0003795623779296875, 0.0028839111328125, 0.0061473846435546875, 0.009410858154296875, 0.012674331665039062, 0.01593780517578125, 0.019201278686523438, 0.022464752197265625, 0.025728225708007812, 0.02899169921875, 0.03225517272949219, 0.035518646240234375, 0.03878211975097656, 0.04204559326171875, 0.04530906677246094, 0.048572540283203125, 0.05183601379394531, 0.0550994873046875, 0.05836296081542969, 0.061626434326171875, 0.06488990783691406, 0.06815338134765625, 0.07141685485839844, 0.07468032836914062, 0.07794380187988281, 0.081207275390625, 0.08447074890136719, 0.08773422241210938, 0.09099769592285156, 0.09426116943359375, 0.09752464294433594, 0.10078811645507812, 0.10405158996582031, 0.1073150634765625, 0.11057853698730469, 0.11384201049804688, 0.11710548400878906, 0.12036895751953125, 0.12363243103027344, 0.12689590454101562, 0.1301593780517578, 0.1334228515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 20.0, 34.0, 64.0, 116.0, 360.0, 1359.0, 10121.0, 754580.0, 274024.0, 6221.0, 1046.0, 317.0, 150.0, 63.0, 23.0, 17.0, 9.0, 2.0, 8.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211181640625, -0.020270347595214844, -0.019422531127929688, -0.01857471466064453, -0.017726898193359375, -0.01687908172607422, -0.016031265258789062, -0.015183448791503906, -0.01433563232421875, -0.013487815856933594, -0.012639999389648438, -0.011792182922363281, -0.010944366455078125, -0.010096549987792969, -0.009248733520507812, -0.008400917053222656, -0.0075531005859375, -0.006705284118652344, -0.0058574676513671875, -0.005009651184082031, -0.004161834716796875, -0.0033140182495117188, -0.0024662017822265625, -0.0016183853149414062, -0.00077056884765625, 7.724761962890625e-05, 0.0009250640869140625, 0.0017728805541992188, 0.002620697021484375, 0.0034685134887695312, 0.0043163299560546875, 0.005164146423339844, 0.006011962890625, 0.006859779357910156, 0.0077075958251953125, 0.008555412292480469, 0.009403228759765625, 0.010251045227050781, 0.011098861694335938, 0.011946678161621094, 0.01279449462890625, 0.013642311096191406, 0.014490127563476562, 0.015337944030761719, 0.016185760498046875, 0.01703357696533203, 0.017881393432617188, 0.018729209899902344, 0.0195770263671875, 0.020424842834472656, 0.021272659301757812, 0.02212047576904297, 0.022968292236328125, 0.02381610870361328, 0.024663925170898438, 0.025511741638183594, 0.02635955810546875, 0.027207374572753906, 0.028055191040039062, 0.02890300750732422, 0.029750823974609375, 0.03059864044189453, 0.03144645690917969, 0.032294273376464844, 0.03314208984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 4.0, 9.0, 11.0, 16.0, 25.0, 33.0, 31.0, 52.0, 67.0, 94.0, 132.0, 133.0, 89.0, 60.0, 47.0, 41.0, 26.0, 20.0, 12.0, 15.0, 11.0, 2.0, 5.0, 8.0, 9.0, 5.0, 7.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.112720489501953e-05, -3.9880163967609406e-05, -3.863312304019928e-05, -3.7386082112789154e-05, -3.613904118537903e-05, -3.48920002579689e-05, -3.364495933055878e-05, -3.239791840314865e-05, -3.1150877475738525e-05, -2.99038365483284e-05, -2.8656795620918274e-05, -2.7409754693508148e-05, -2.6162713766098022e-05, -2.4915672838687897e-05, -2.366863191127777e-05, -2.2421590983867645e-05, -2.117455005645752e-05, -1.9927509129047394e-05, -1.8680468201637268e-05, -1.7433427274227142e-05, -1.6186386346817017e-05, -1.4939345419406891e-05, -1.3692304491996765e-05, -1.244526356458664e-05, -1.1198222637176514e-05, -9.951181709766388e-06, -8.704140782356262e-06, -7.4570998549461365e-06, -6.210058927536011e-06, -4.963018000125885e-06, -3.7159770727157593e-06, -2.4689361453056335e-06, -1.2218952178955078e-06, 2.514570951461792e-08, 1.2721866369247437e-06, 2.5192275643348694e-06, 3.766268491744995e-06, 5.013309419155121e-06, 6.260350346565247e-06, 7.507391273975372e-06, 8.754432201385498e-06, 1.0001473128795624e-05, 1.124851405620575e-05, 1.2495554983615875e-05, 1.3742595911026001e-05, 1.4989636838436127e-05, 1.6236677765846252e-05, 1.7483718693256378e-05, 1.8730759620666504e-05, 1.997780054807663e-05, 2.1224841475486755e-05, 2.247188240289688e-05, 2.3718923330307007e-05, 2.4965964257717133e-05, 2.6213005185127258e-05, 2.7460046112537384e-05, 2.870708703994751e-05, 2.9954127967357635e-05, 3.120116889476776e-05, 3.244820982217789e-05, 3.369525074958801e-05, 3.494229167699814e-05, 3.6189332604408264e-05, 3.743637353181839e-05, 3.8683414459228516e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 4.0, 10.0, 18.0, 31.0, 62.0, 101.0, 259.0, 825.0, 3794.0, 115181.0, 913414.0, 12651.0, 1464.0, 390.0, 181.0, 79.0, 38.0, 24.0, 4.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.02787041664123535, -0.026978015899658203, -0.026085615158081055, -0.025193214416503906, -0.024300813674926758, -0.02340841293334961, -0.02251601219177246, -0.021623611450195312, -0.020731210708618164, -0.019838809967041016, -0.018946409225463867, -0.01805400848388672, -0.01716160774230957, -0.016269207000732422, -0.015376806259155273, -0.014484405517578125, -0.013592004776000977, -0.012699604034423828, -0.01180720329284668, -0.010914802551269531, -0.010022401809692383, -0.009130001068115234, -0.008237600326538086, -0.0073451995849609375, -0.006452798843383789, -0.005560398101806641, -0.004667997360229492, -0.0037755966186523438, -0.0028831958770751953, -0.001990795135498047, -0.0010983943939208984, -0.00020599365234375, 0.0006864070892333984, 0.0015788078308105469, 0.0024712085723876953, 0.0033636093139648438, 0.004256010055541992, 0.005148410797119141, 0.006040811538696289, 0.0069332122802734375, 0.007825613021850586, 0.008718013763427734, 0.009610414505004883, 0.010502815246582031, 0.01139521598815918, 0.012287616729736328, 0.013180017471313477, 0.014072418212890625, 0.014964818954467773, 0.015857219696044922, 0.01674962043762207, 0.01764202117919922, 0.018534421920776367, 0.019426822662353516, 0.020319223403930664, 0.021211624145507812, 0.02210402488708496, 0.02299642562866211, 0.023888826370239258, 0.024781227111816406, 0.025673627853393555, 0.026566028594970703, 0.02745842933654785, 0.028350830078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 9.0, 10.0, 11.0, 25.0, 43.0, 57.0, 130.0, 177.0, 203.0, 153.0, 71.0, 41.0, 25.0, 21.0, 7.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297698974609375, -0.028970956802368164, -0.028172016143798828, -0.027373075485229492, -0.026574134826660156, -0.02577519416809082, -0.024976253509521484, -0.02417731285095215, -0.023378372192382812, -0.022579431533813477, -0.02178049087524414, -0.020981550216674805, -0.02018260955810547, -0.019383668899536133, -0.018584728240966797, -0.01778578758239746, -0.016986846923828125, -0.01618790626525879, -0.015388965606689453, -0.014590024948120117, -0.013791084289550781, -0.012992143630981445, -0.01219320297241211, -0.011394262313842773, -0.010595321655273438, -0.009796380996704102, -0.008997440338134766, -0.00819849967956543, -0.007399559020996094, -0.006600618362426758, -0.005801677703857422, -0.005002737045288086, -0.00420379638671875, -0.003404855728149414, -0.002605915069580078, -0.0018069744110107422, -0.0010080337524414062, -0.0002090930938720703, 0.0005898475646972656, 0.0013887882232666016, 0.0021877288818359375, 0.0029866695404052734, 0.0037856101989746094, 0.004584550857543945, 0.005383491516113281, 0.006182432174682617, 0.006981372833251953, 0.007780313491821289, 0.008579254150390625, 0.009378194808959961, 0.010177135467529297, 0.010976076126098633, 0.011775016784667969, 0.012573957443237305, 0.01337289810180664, 0.014171838760375977, 0.014970779418945312, 0.01576972007751465, 0.016568660736083984, 0.01736760139465332, 0.018166542053222656, 0.018965482711791992, 0.019764423370361328, 0.020563364028930664, 0.0213623046875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 12.0, 31.0, 90.0, 259.0, 304.0, 176.0, 75.0, 27.0, 15.0, 0.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36147540807724, -0.3451583683490753, -0.32884132862091064, -0.31252431869506836, -0.2962072789669037, -0.279890239238739, -0.26357322931289673, -0.24725618958473206, -0.23093914985656738, -0.2146221101284027, -0.19830508530139923, -0.18198806047439575, -0.16567102074623108, -0.1493539810180664, -0.13303695619106293, -0.11671992391347885, -0.10040289163589478, -0.0840858593583107, -0.06776882708072662, -0.05145179480314255, -0.03513476252555847, -0.018817730247974396, -0.00250069797039032, 0.013816334307193756, 0.030133366584777832, 0.04645039886236191, 0.06276743113994598, 0.07908446341753006, 0.09540149569511414, 0.11171852797269821, 0.1280355602502823, 0.14435258507728577, 0.16066968441009521, 0.1769867241382599, 0.19330374896526337, 0.20962077379226685, 0.22593781352043152, 0.2422548532485962, 0.2585718631744385, 0.27488890290260315, 0.2912059426307678, 0.3075229823589325, 0.32384002208709717, 0.34015703201293945, 0.3564740717411041, 0.3727911114692688, 0.3891081213951111, 0.40542516112327576, 0.42174220085144043, 0.4380592405796051, 0.4543762803077698, 0.47069329023361206, 0.48701032996177673, 0.5033273696899414, 0.5196443796157837, 0.5359614491462708, 0.552278459072113, 0.5685954689979553, 0.5849125385284424, 0.6012295484542847, 0.617546558380127, 0.633863627910614, 0.6501806378364563, 0.6664977073669434, 0.6828147172927856]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 11.0, 8.0, 12.0, 16.0, 17.0, 13.0, 22.0, 22.0, 30.0, 29.0, 28.0, 37.0, 38.0, 35.0, 38.0, 40.0, 44.0, 56.0, 53.0, 41.0, 48.0, 35.0, 31.0, 31.0, 26.0, 31.0, 25.0, 23.0, 28.0, 21.0, 15.0, 15.0, 15.0, 7.0, 9.0, 9.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.2416272759437561, -0.23407693207263947, -0.22652658820152283, -0.218976229429245, -0.21142588555812836, -0.20387554168701172, -0.1963251829147339, -0.18877483904361725, -0.1812244951725006, -0.17367415130138397, -0.16612380743026733, -0.1585734486579895, -0.15102310478687286, -0.14347276091575623, -0.1359224021434784, -0.12837205827236176, -0.12082171440124512, -0.11327137053012848, -0.10572101920843124, -0.09817066788673401, -0.09062032401561737, -0.08306998014450073, -0.0755196288228035, -0.06796927750110626, -0.060418933629989624, -0.05286858603358269, -0.04531823843717575, -0.037767890840768814, -0.030217543244361877, -0.02266719564795494, -0.015116848051548004, -0.0075665004551410675, -1.615285873413086e-05, 0.007534194737672806, 0.015084542334079742, 0.02263488993048668, 0.030185237526893616, 0.03773558512330055, 0.04528593271970749, 0.052836280316114426, 0.06038662791252136, 0.067936971783638, 0.07548732310533524, 0.08303767442703247, 0.09058801829814911, 0.09813836216926575, 0.10568871349096298, 0.11323906481266022, 0.12078940868377686, 0.1283397525548935, 0.13589009642601013, 0.14344045519828796, 0.1509907990694046, 0.15854114294052124, 0.16609150171279907, 0.1736418455839157, 0.18119218945503235, 0.188742533326149, 0.19629287719726562, 0.20384323596954346, 0.2113935798406601, 0.21894392371177673, 0.22649428248405457, 0.2340446263551712, 0.24159497022628784]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 11.0, 10.0, 10.0, 21.0, 55.0, 115.0, 289.0, 773.0, 2277.0, 9447.0, 72115.0, 3946684.0, 144253.0, 13516.0, 3010.0, 976.0, 403.0, 154.0, 80.0, 43.0, 16.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017425537109375, -0.01614522933959961, -0.014864921569824219, -0.013584613800048828, -0.012304306030273438, -0.011023998260498047, -0.009743690490722656, -0.008463382720947266, -0.007183074951171875, -0.005902767181396484, -0.004622459411621094, -0.003342151641845703, -0.0020618438720703125, -0.0007815361022949219, 0.0004987716674804688, 0.0017790794372558594, 0.00305938720703125, 0.004339694976806641, 0.005620002746582031, 0.006900310516357422, 0.008180618286132812, 0.009460926055908203, 0.010741233825683594, 0.012021541595458984, 0.013301849365234375, 0.014582157135009766, 0.015862464904785156, 0.017142772674560547, 0.018423080444335938, 0.019703388214111328, 0.02098369598388672, 0.02226400375366211, 0.0235443115234375, 0.02482461929321289, 0.02610492706298828, 0.027385234832763672, 0.028665542602539062, 0.029945850372314453, 0.031226158142089844, 0.032506465911865234, 0.033786773681640625, 0.035067081451416016, 0.036347389221191406, 0.0376276969909668, 0.03890800476074219, 0.04018831253051758, 0.04146862030029297, 0.04274892807006836, 0.04402923583984375, 0.04530954360961914, 0.04658985137939453, 0.04787015914916992, 0.04915046691894531, 0.0504307746887207, 0.051711082458496094, 0.052991390228271484, 0.054271697998046875, 0.055552005767822266, 0.056832313537597656, 0.05811262130737305, 0.05939292907714844, 0.06067323684692383, 0.06195354461669922, 0.06323385238647461, 0.06451416015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 15.0, 25.0, 29.0, 37.0, 48.0, 51.0, 60.0, 79.0, 69.0, 80.0, 85.0, 66.0, 62.0, 68.0, 56.0, 45.0, 23.0, 23.0, 15.0, 6.0, 10.0, 3.0, 6.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019195556640625, -0.018589019775390625, -0.01798248291015625, -0.017375946044921875, -0.0167694091796875, -0.016162872314453125, -0.01555633544921875, -0.014949798583984375, -0.01434326171875, -0.013736724853515625, -0.01313018798828125, -0.012523651123046875, -0.0119171142578125, -0.011310577392578125, -0.01070404052734375, -0.010097503662109375, -0.009490966796875, -0.008884429931640625, -0.00827789306640625, -0.007671356201171875, -0.0070648193359375, -0.006458282470703125, -0.00585174560546875, -0.005245208740234375, -0.004638671875, -0.004032135009765625, -0.00342559814453125, -0.002819061279296875, -0.0022125244140625, -0.001605987548828125, -0.00099945068359375, -0.000392913818359375, 0.000213623046875, 0.000820159912109375, 0.00142669677734375, 0.002033233642578125, 0.0026397705078125, 0.003246307373046875, 0.00385284423828125, 0.004459381103515625, 0.00506591796875, 0.005672454833984375, 0.00627899169921875, 0.006885528564453125, 0.0074920654296875, 0.008098602294921875, 0.00870513916015625, 0.009311676025390625, 0.009918212890625, 0.010524749755859375, 0.01113128662109375, 0.011737823486328125, 0.0123443603515625, 0.012950897216796875, 0.01355743408203125, 0.014163970947265625, 0.0147705078125, 0.015377044677734375, 0.01598358154296875, 0.016590118408203125, 0.0171966552734375, 0.017803192138671875, 0.01840972900390625, 0.019016265869140625, 0.019622802734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 4.0, 1.0, 9.0, 6.0, 15.0, 9.0, 21.0, 24.0, 31.0, 44.0, 79.0, 131.0, 258.0, 666.0, 2056.0, 9421.0, 78209.0, 3935771.0, 148080.0, 14792.0, 2904.0, 932.0, 355.0, 171.0, 84.0, 65.0, 49.0, 24.0, 15.0, 13.0, 9.0, 6.0, 3.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.044219970703125, -0.04294252395629883, -0.041665077209472656, -0.040387630462646484, -0.03911018371582031, -0.03783273696899414, -0.03655529022216797, -0.0352778434753418, -0.034000396728515625, -0.03272294998168945, -0.03144550323486328, -0.03016805648803711, -0.028890609741210938, -0.027613162994384766, -0.026335716247558594, -0.025058269500732422, -0.02378082275390625, -0.022503376007080078, -0.021225929260253906, -0.019948482513427734, -0.018671035766601562, -0.01739358901977539, -0.01611614227294922, -0.014838695526123047, -0.013561248779296875, -0.012283802032470703, -0.011006355285644531, -0.00972890853881836, -0.008451461791992188, -0.007174015045166016, -0.005896568298339844, -0.004619121551513672, -0.0033416748046875, -0.002064228057861328, -0.0007867813110351562, 0.0004906654357910156, 0.0017681121826171875, 0.0030455589294433594, 0.004323005676269531, 0.005600452423095703, 0.006877899169921875, 0.008155345916748047, 0.009432792663574219, 0.01071023941040039, 0.011987686157226562, 0.013265132904052734, 0.014542579650878906, 0.015820026397705078, 0.01709747314453125, 0.018374919891357422, 0.019652366638183594, 0.020929813385009766, 0.022207260131835938, 0.02348470687866211, 0.02476215362548828, 0.026039600372314453, 0.027317047119140625, 0.028594493865966797, 0.02987194061279297, 0.03114938735961914, 0.03242683410644531, 0.033704280853271484, 0.034981727600097656, 0.03625917434692383, 0.03753662109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 4.0, 7.0, 16.0, 31.0, 25.0, 33.0, 66.0, 93.0, 369.0, 1580.0, 1324.0, 251.0, 80.0, 46.0, 34.0, 29.0, 22.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.03645467758178711, -0.03531169891357422, -0.03416872024536133, -0.03302574157714844, -0.03188276290893555, -0.030739784240722656, -0.029596805572509766, -0.028453826904296875, -0.027310848236083984, -0.026167869567871094, -0.025024890899658203, -0.023881912231445312, -0.022738933563232422, -0.02159595489501953, -0.02045297622680664, -0.01930999755859375, -0.01816701889038086, -0.01702404022216797, -0.015881061553955078, -0.014738082885742188, -0.013595104217529297, -0.012452125549316406, -0.011309146881103516, -0.010166168212890625, -0.009023189544677734, -0.007880210876464844, -0.006737232208251953, -0.0055942535400390625, -0.004451274871826172, -0.0033082962036132812, -0.0021653175354003906, -0.0010223388671875, 0.00012063980102539062, 0.0012636184692382812, 0.002406597137451172, 0.0035495758056640625, 0.004692554473876953, 0.005835533142089844, 0.006978511810302734, 0.008121490478515625, 0.009264469146728516, 0.010407447814941406, 0.011550426483154297, 0.012693405151367188, 0.013836383819580078, 0.014979362487792969, 0.01612234115600586, 0.01726531982421875, 0.01840829849243164, 0.01955127716064453, 0.020694255828857422, 0.021837234497070312, 0.022980213165283203, 0.024123191833496094, 0.025266170501708984, 0.026409149169921875, 0.027552127838134766, 0.028695106506347656, 0.029838085174560547, 0.030981063842773438, 0.03212404251098633, 0.03326702117919922, 0.03440999984741211, 0.035552978515625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 8.0, 5.0, 7.0, 24.0, 49.0, 111.0, 187.0, 240.0, 204.0, 93.0, 42.0, 12.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27881789207458496, -0.27002912759780884, -0.2612403929233551, -0.252451628446579, -0.24366287887096405, -0.23487412929534912, -0.226085364818573, -0.21729661524295807, -0.20850786566734314, -0.1997191160917282, -0.19093036651611328, -0.18214160203933716, -0.17335285246372223, -0.1645641028881073, -0.15577533841133118, -0.14698658883571625, -0.13819783926010132, -0.1294090896844864, -0.12062033265829086, -0.11183157563209534, -0.10304282605648041, -0.09425407648086548, -0.08546531945466995, -0.07667656242847443, -0.0678878128528595, -0.05909905955195427, -0.05031030625104904, -0.041521552950143814, -0.032732799649238586, -0.02394404634833336, -0.015155293047428131, -0.0063665397465229034, 0.0024221837520599365, 0.011210937052965164, 0.019999690353870392, 0.02878844365477562, 0.03757719695568085, 0.046365950256586075, 0.0551547035574913, 0.06394346058368683, 0.07273221015930176, 0.08152095973491669, 0.09030971676111221, 0.09909847378730774, 0.10788722336292267, 0.1166759729385376, 0.12546473741531372, 0.13425348699092865, 0.14304223656654358, 0.1518309861421585, 0.16061973571777344, 0.16940850019454956, 0.1781972497701645, 0.18698599934577942, 0.19577476382255554, 0.20456351339817047, 0.2133522629737854, 0.22214101254940033, 0.23092976212501526, 0.23971852660179138, 0.2485072761774063, 0.25729602575302124, 0.26608479022979736, 0.2748735249042511, 0.2836622893810272]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 10.0, 7.0, 10.0, 6.0, 6.0, 10.0, 16.0, 23.0, 18.0, 20.0, 21.0, 25.0, 19.0, 28.0, 32.0, 38.0, 34.0, 40.0, 40.0, 39.0, 54.0, 43.0, 48.0, 32.0, 41.0, 38.0, 30.0, 26.0, 22.0, 25.0, 27.0, 19.0, 23.0, 20.0, 13.0, 13.0, 7.0, 13.0, 10.0, 7.0, 7.0, 9.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.09588378667831421, -0.09298962354660034, -0.09009545296430588, -0.08720128983259201, -0.08430711925029755, -0.08141295611858368, -0.07851879298686981, -0.07562462985515594, -0.07273045927286148, -0.06983629614114761, -0.06694212555885315, -0.06404796242713928, -0.06115379557013512, -0.05825962871313095, -0.055365465581417084, -0.05247129872441292, -0.04957713186740875, -0.04668296501040459, -0.04378879815340042, -0.040894635021686554, -0.03800046816468239, -0.03510630130767822, -0.032212138175964355, -0.02931797131896019, -0.026423804461956024, -0.02352963760495186, -0.020635472610592842, -0.017741307616233826, -0.01484714075922966, -0.011952974833548069, -0.009058808907866478, -0.0061646439135074615, -0.003270477056503296, -0.00037631113082170486, 0.002517854794859886, 0.005412020720541477, 0.008306186646223068, 0.01120035257190466, 0.01409451849758625, 0.016988683491945267, 0.019882850348949432, 0.022777017205953598, 0.025671182200312614, 0.02856534719467163, 0.031459514051675797, 0.03435368090867996, 0.03724784404039383, 0.040142010897397995, 0.04303617775440216, 0.045930344611406326, 0.04882451146841049, 0.05171867460012436, 0.054612841457128525, 0.05750700831413269, 0.06040117144584656, 0.06329533457756042, 0.06618950515985489, 0.06908366829156876, 0.07197783887386322, 0.07487200200557709, 0.07776616513729095, 0.08066033571958542, 0.08355449885129929, 0.08644866943359375, 0.08934283256530762]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 0.0, 4.0, 3.0, 7.0, 25.0, 30.0, 40.0, 54.0, 95.0, 176.0, 395.0, 749.0, 1573.0, 3981.0, 10523.0, 34137.0, 125714.0, 390202.0, 338802.0, 99493.0, 27643.0, 8780.0, 3323.0, 1418.0, 659.0, 317.0, 169.0, 94.0, 54.0, 29.0, 28.0, 13.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0197906494140625, -0.019129037857055664, -0.018467426300048828, -0.017805814743041992, -0.017144203186035156, -0.01648259162902832, -0.015820980072021484, -0.015159368515014648, -0.014497756958007812, -0.013836145401000977, -0.01317453384399414, -0.012512922286987305, -0.011851310729980469, -0.011189699172973633, -0.010528087615966797, -0.009866476058959961, -0.009204864501953125, -0.008543252944946289, -0.007881641387939453, -0.007220029830932617, -0.006558418273925781, -0.005896806716918945, -0.005235195159912109, -0.0045735836029052734, -0.0039119720458984375, -0.0032503604888916016, -0.0025887489318847656, -0.0019271373748779297, -0.0012655258178710938, -0.0006039142608642578, 5.7697296142578125e-05, 0.0007193088531494141, 0.00138092041015625, 0.002042531967163086, 0.002704143524169922, 0.003365755081176758, 0.004027366638183594, 0.00468897819519043, 0.005350589752197266, 0.0060122013092041016, 0.0066738128662109375, 0.0073354244232177734, 0.00799703598022461, 0.008658647537231445, 0.009320259094238281, 0.009981870651245117, 0.010643482208251953, 0.011305093765258789, 0.011966705322265625, 0.012628316879272461, 0.013289928436279297, 0.013951539993286133, 0.014613151550292969, 0.015274763107299805, 0.01593637466430664, 0.016597986221313477, 0.017259597778320312, 0.01792120933532715, 0.018582820892333984, 0.01924443244934082, 0.019906044006347656, 0.020567655563354492, 0.021229267120361328, 0.021890878677368164, 0.022552490234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 15.0, 16.0, 23.0, 33.0, 51.0, 59.0, 66.0, 57.0, 79.0, 93.0, 70.0, 74.0, 69.0, 54.0, 64.0, 45.0, 38.0, 15.0, 20.0, 8.0, 8.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01953125, -0.01890110969543457, -0.01827096939086914, -0.01764082908630371, -0.01701068878173828, -0.01638054847717285, -0.015750408172607422, -0.015120267868041992, -0.014490127563476562, -0.013859987258911133, -0.013229846954345703, -0.012599706649780273, -0.011969566345214844, -0.011339426040649414, -0.010709285736083984, -0.010079145431518555, -0.009449005126953125, -0.008818864822387695, -0.008188724517822266, -0.007558584213256836, -0.006928443908691406, -0.0062983036041259766, -0.005668163299560547, -0.005038022994995117, -0.0044078826904296875, -0.003777742385864258, -0.003147602081298828, -0.0025174617767333984, -0.0018873214721679688, -0.001257181167602539, -0.0006270408630371094, 3.0994415283203125e-06, 0.00063323974609375, 0.0012633800506591797, 0.0018935203552246094, 0.002523660659790039, 0.0031538009643554688, 0.0037839412689208984, 0.004414081573486328, 0.005044221878051758, 0.0056743621826171875, 0.006304502487182617, 0.006934642791748047, 0.0075647830963134766, 0.008194923400878906, 0.008825063705444336, 0.009455204010009766, 0.010085344314575195, 0.010715484619140625, 0.011345624923706055, 0.011975765228271484, 0.012605905532836914, 0.013236045837402344, 0.013866186141967773, 0.014496326446533203, 0.015126466751098633, 0.015756607055664062, 0.016386747360229492, 0.017016887664794922, 0.01764702796936035, 0.01827716827392578, 0.01890730857849121, 0.01953744888305664, 0.02016758918762207, 0.0207977294921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 14.0, 29.0, 32.0, 70.0, 107.0, 168.0, 247.0, 436.0, 757.0, 1537.0, 3961.0, 18352.0, 243002.0, 714140.0, 53562.0, 7240.0, 2262.0, 1043.0, 578.0, 361.0, 205.0, 156.0, 96.0, 50.0, 54.0, 23.0, 16.0, 15.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03839111328125, -0.037199974060058594, -0.03600883483886719, -0.03481769561767578, -0.033626556396484375, -0.03243541717529297, -0.031244277954101562, -0.030053138732910156, -0.02886199951171875, -0.027670860290527344, -0.026479721069335938, -0.02528858184814453, -0.024097442626953125, -0.02290630340576172, -0.021715164184570312, -0.020524024963378906, -0.0193328857421875, -0.018141746520996094, -0.016950607299804688, -0.01575946807861328, -0.014568328857421875, -0.013377189636230469, -0.012186050415039062, -0.010994911193847656, -0.00980377197265625, -0.008612632751464844, -0.0074214935302734375, -0.006230354309082031, -0.005039215087890625, -0.0038480758666992188, -0.0026569366455078125, -0.0014657974243164062, -0.000274658203125, 0.0009164810180664062, 0.0021076202392578125, 0.0032987594604492188, 0.004489898681640625, 0.005681037902832031, 0.0068721771240234375, 0.008063316345214844, 0.00925445556640625, 0.010445594787597656, 0.011636734008789062, 0.012827873229980469, 0.014019012451171875, 0.015210151672363281, 0.016401290893554688, 0.017592430114746094, 0.0187835693359375, 0.019974708557128906, 0.021165847778320312, 0.02235698699951172, 0.023548126220703125, 0.02473926544189453, 0.025930404663085938, 0.027121543884277344, 0.02831268310546875, 0.029503822326660156, 0.030694961547851562, 0.03188610076904297, 0.033077239990234375, 0.03426837921142578, 0.03545951843261719, 0.036650657653808594, 0.037841796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 8.0, 5.0, 11.0, 6.0, 11.0, 19.0, 13.0, 23.0, 28.0, 27.0, 23.0, 28.0, 30.0, 46.0, 40.0, 44.0, 48.0, 34.0, 50.0, 51.0, 46.0, 34.0, 35.0, 42.0, 39.0, 35.0, 30.0, 25.0, 28.0, 26.0, 12.0, 18.0, 23.0, 13.0, 15.0, 6.0, 5.0, 8.0, 6.0, 0.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03802490234375, -0.03664731979370117, -0.035269737243652344, -0.033892154693603516, -0.03251457214355469, -0.03113698959350586, -0.02975940704345703, -0.028381824493408203, -0.027004241943359375, -0.025626659393310547, -0.02424907684326172, -0.02287149429321289, -0.021493911743164062, -0.020116329193115234, -0.018738746643066406, -0.017361164093017578, -0.01598358154296875, -0.014605998992919922, -0.013228416442871094, -0.011850833892822266, -0.010473251342773438, -0.00909566879272461, -0.007718086242675781, -0.006340503692626953, -0.004962921142578125, -0.003585338592529297, -0.0022077560424804688, -0.0008301734924316406, 0.0005474090576171875, 0.0019249916076660156, 0.0033025741577148438, 0.004680156707763672, 0.0060577392578125, 0.007435321807861328, 0.008812904357910156, 0.010190486907958984, 0.011568069458007812, 0.01294565200805664, 0.014323234558105469, 0.015700817108154297, 0.017078399658203125, 0.018455982208251953, 0.01983356475830078, 0.02121114730834961, 0.022588729858398438, 0.023966312408447266, 0.025343894958496094, 0.026721477508544922, 0.02809906005859375, 0.029476642608642578, 0.030854225158691406, 0.032231807708740234, 0.03360939025878906, 0.03498697280883789, 0.03636455535888672, 0.03774213790893555, 0.039119720458984375, 0.0404973030090332, 0.04187488555908203, 0.04325246810913086, 0.04463005065917969, 0.046007633209228516, 0.047385215759277344, 0.04876279830932617, 0.050140380859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 1.0, 9.0, 5.0, 6.0, 9.0, 18.0, 48.0, 72.0, 141.0, 213.0, 486.0, 1025.0, 2792.0, 12670.0, 996288.0, 28395.0, 3958.0, 1274.0, 544.0, 249.0, 145.0, 97.0, 46.0, 21.0, 8.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0731201171875, -0.07112503051757812, -0.06912994384765625, -0.06713485717773438, -0.0651397705078125, -0.06314468383789062, -0.06114959716796875, -0.059154510498046875, -0.057159423828125, -0.055164337158203125, -0.05316925048828125, -0.051174163818359375, -0.0491790771484375, -0.047183990478515625, -0.04518890380859375, -0.043193817138671875, -0.04119873046875, -0.039203643798828125, -0.03720855712890625, -0.035213470458984375, -0.0332183837890625, -0.031223297119140625, -0.02922821044921875, -0.027233123779296875, -0.025238037109375, -0.023242950439453125, -0.02124786376953125, -0.019252777099609375, -0.0172576904296875, -0.015262603759765625, -0.01326751708984375, -0.011272430419921875, -0.00927734375, -0.007282257080078125, -0.00528717041015625, -0.003292083740234375, -0.0012969970703125, 0.000698089599609375, 0.00269317626953125, 0.004688262939453125, 0.006683349609375, 0.008678436279296875, 0.01067352294921875, 0.012668609619140625, 0.0146636962890625, 0.016658782958984375, 0.01865386962890625, 0.020648956298828125, 0.02264404296875, 0.024639129638671875, 0.02663421630859375, 0.028629302978515625, 0.0306243896484375, 0.032619476318359375, 0.03461456298828125, 0.036609649658203125, 0.038604736328125, 0.040599822998046875, 0.04259490966796875, 0.044589996337890625, 0.0465850830078125, 0.048580169677734375, 0.05057525634765625, 0.052570343017578125, 0.0545654296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 12.0, 7.0, 11.0, 23.0, 23.0, 23.0, 26.0, 67.0, 89.0, 139.0, 159.0, 142.0, 67.0, 39.0, 39.0, 25.0, 20.0, 17.0, 18.0, 6.0, 13.0, 10.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.684925079345703e-05, -4.5000575482845306e-05, -4.315190017223358e-05, -4.130322486162186e-05, -3.945454955101013e-05, -3.760587424039841e-05, -3.575719892978668e-05, -3.390852361917496e-05, -3.205984830856323e-05, -3.0211172997951508e-05, -2.8362497687339783e-05, -2.6513822376728058e-05, -2.4665147066116333e-05, -2.2816471755504608e-05, -2.0967796444892883e-05, -1.911912113428116e-05, -1.7270445823669434e-05, -1.542177051305771e-05, -1.3573095202445984e-05, -1.1724419891834259e-05, -9.875744581222534e-06, -8.02706927061081e-06, -6.1783939599990845e-06, -4.32971864938736e-06, -2.4810433387756348e-06, -6.323680281639099e-07, 1.216307282447815e-06, 3.06498259305954e-06, 4.913657903671265e-06, 6.7623332142829895e-06, 8.611008524894714e-06, 1.045968383550644e-05, 1.2308359146118164e-05, 1.4157034456729889e-05, 1.6005709767341614e-05, 1.785438507795334e-05, 1.9703060388565063e-05, 2.155173569917679e-05, 2.3400411009788513e-05, 2.5249086320400238e-05, 2.7097761631011963e-05, 2.8946436941623688e-05, 3.079511225223541e-05, 3.264378756284714e-05, 3.449246287345886e-05, 3.634113818407059e-05, 3.818981349468231e-05, 4.003848880529404e-05, 4.188716411590576e-05, 4.3735839426517487e-05, 4.558451473712921e-05, 4.7433190047740936e-05, 4.928186535835266e-05, 5.1130540668964386e-05, 5.297921597957611e-05, 5.4827891290187836e-05, 5.667656660079956e-05, 5.8525241911411285e-05, 6.037391722202301e-05, 6.222259253263474e-05, 6.407126784324646e-05, 6.591994315385818e-05, 6.776861846446991e-05, 6.961729377508163e-05, 7.146596908569336e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 11.0, 8.0, 9.0, 11.0, 18.0, 19.0, 24.0, 57.0, 92.0, 152.0, 298.0, 570.0, 1404.0, 3558.0, 11947.0, 366618.0, 643448.0, 13425.0, 3805.0, 1545.0, 702.0, 332.0, 179.0, 94.0, 61.0, 43.0, 30.0, 17.0, 10.0, 8.0, 11.0, 7.0, 4.0, 7.0, 6.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.036712646484375, -0.03563404083251953, -0.03455543518066406, -0.033476829528808594, -0.032398223876953125, -0.031319618225097656, -0.030241012573242188, -0.02916240692138672, -0.02808380126953125, -0.02700519561767578, -0.025926589965820312, -0.024847984313964844, -0.023769378662109375, -0.022690773010253906, -0.021612167358398438, -0.02053356170654297, -0.0194549560546875, -0.01837635040283203, -0.017297744750976562, -0.016219139099121094, -0.015140533447265625, -0.014061927795410156, -0.012983322143554688, -0.011904716491699219, -0.01082611083984375, -0.009747505187988281, -0.008668899536132812, -0.007590293884277344, -0.006511688232421875, -0.005433082580566406, -0.0043544769287109375, -0.0032758712768554688, -0.002197265625, -0.0011186599731445312, -4.00543212890625e-05, 0.0010385513305664062, 0.002117156982421875, 0.0031957626342773438, 0.0042743682861328125, 0.005352973937988281, 0.00643157958984375, 0.007510185241699219, 0.008588790893554688, 0.009667396545410156, 0.010746002197265625, 0.011824607849121094, 0.012903213500976562, 0.013981819152832031, 0.0150604248046875, 0.01613903045654297, 0.017217636108398438, 0.018296241760253906, 0.019374847412109375, 0.020453453063964844, 0.021532058715820312, 0.02261066436767578, 0.02368927001953125, 0.02476787567138672, 0.025846481323242188, 0.026925086975097656, 0.028003692626953125, 0.029082298278808594, 0.030160903930664062, 0.03123950958251953, 0.032318115234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 6.0, 18.0, 21.0, 52.0, 65.0, 117.0, 152.0, 190.0, 149.0, 80.0, 39.0, 34.0, 21.0, 12.0, 13.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.024169921875, -0.023463964462280273, -0.022758007049560547, -0.02205204963684082, -0.021346092224121094, -0.020640134811401367, -0.01993417739868164, -0.019228219985961914, -0.018522262573242188, -0.01781630516052246, -0.017110347747802734, -0.016404390335083008, -0.01569843292236328, -0.014992475509643555, -0.014286518096923828, -0.013580560684204102, -0.012874603271484375, -0.012168645858764648, -0.011462688446044922, -0.010756731033325195, -0.010050773620605469, -0.009344816207885742, -0.008638858795166016, -0.007932901382446289, -0.0072269439697265625, -0.006520986557006836, -0.005815029144287109, -0.005109071731567383, -0.004403114318847656, -0.0036971569061279297, -0.002991199493408203, -0.0022852420806884766, -0.00157928466796875, -0.0008733272552490234, -0.00016736984252929688, 0.0005385875701904297, 0.0012445449829101562, 0.0019505023956298828, 0.0026564598083496094, 0.003362417221069336, 0.0040683746337890625, 0.004774332046508789, 0.005480289459228516, 0.006186246871948242, 0.006892204284667969, 0.007598161697387695, 0.008304119110107422, 0.009010076522827148, 0.009716033935546875, 0.010421991348266602, 0.011127948760986328, 0.011833906173706055, 0.012539863586425781, 0.013245820999145508, 0.013951778411865234, 0.014657735824584961, 0.015363693237304688, 0.016069650650024414, 0.01677560806274414, 0.017481565475463867, 0.018187522888183594, 0.01889348030090332, 0.019599437713623047, 0.020305395126342773, 0.0210113525390625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 5.0, 12.0, 33.0, 125.0, 432.0, 310.0, 68.0, 16.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21322138607501984, -0.18608735501766205, -0.15895330905914307, -0.13181927800178528, -0.1046852394938469, -0.07755120098590851, -0.05041716992855072, -0.02328312397003174, 0.00385090708732605, 0.030984943732619286, 0.05811898037791252, 0.08525301516056061, 0.11238705366849899, 0.13952109217643738, 0.16665512323379517, 0.19378916919231415, 0.22092320024967194, 0.24805723130702972, 0.2751912772655487, 0.3023253083229065, 0.3294593393802643, 0.35659337043762207, 0.38372743129730225, 0.41086146235466003, 0.4379954934120178, 0.4651295244693756, 0.4922635555267334, 0.5193976163864136, 0.546531617641449, 0.5736656785011292, 0.6007996797561646, 0.6279337406158447, 0.6550677418708801, 0.6822018027305603, 0.7093358039855957, 0.7364698648452759, 0.7636038661003113, 0.7907379269599915, 0.8178719282150269, 0.845005989074707, 0.8721400499343872, 0.8992741107940674, 0.9264081120491028, 0.953542172908783, 0.9806761741638184, 1.0078102350234985, 1.0349442958831787, 1.0620783567428589, 1.0892122983932495, 1.1163463592529297, 1.1434804201126099, 1.1706143617630005, 1.1977484226226807, 1.2248824834823608, 1.252016544342041, 1.2791506052017212, 1.3062846660614014, 1.3334187269210815, 1.3605527877807617, 1.3876867294311523, 1.4148207902908325, 1.4419548511505127, 1.4690889120101929, 1.496222972869873, 1.5233569145202637]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 11.0, 12.0, 17.0, 18.0, 23.0, 17.0, 26.0, 39.0, 41.0, 36.0, 47.0, 43.0, 44.0, 60.0, 55.0, 65.0, 63.0, 55.0, 41.0, 42.0, 36.0, 37.0, 31.0, 21.0, 26.0, 14.0, 11.0, 15.0, 9.0, 7.0, 10.0, 6.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17495495080947876, -0.16816669702529907, -0.16137844324111938, -0.1545901745557785, -0.14780192077159882, -0.14101366698741913, -0.13422539830207825, -0.12743714451789856, -0.12064889073371887, -0.11386063694953918, -0.1070723757147789, -0.10028411448001862, -0.09349586069583893, -0.08670760691165924, -0.07991934567689896, -0.07313108444213867, -0.06634283065795898, -0.059554573148489, -0.05276631563901901, -0.045978058129549026, -0.03918980062007904, -0.032401543110609055, -0.02561328560113907, -0.018825028091669083, -0.012036770582199097, -0.005248513072729111, 0.0015397444367408752, 0.008328001946210861, 0.015116259455680847, 0.021904516965150833, 0.02869277447462082, 0.035481031984090805, 0.04226928949356079, 0.04905754700303078, 0.05584580451250076, 0.06263406574726105, 0.06942231953144073, 0.07621057331562042, 0.0829988345503807, 0.08978709578514099, 0.09657534956932068, 0.10336360335350037, 0.11015186458826065, 0.11694012582302094, 0.12372837960720062, 0.1305166333913803, 0.1373049020767212, 0.14409315586090088, 0.15088140964508057, 0.15766966342926025, 0.16445791721343994, 0.17124618589878082, 0.1780344396829605, 0.1848226934671402, 0.19161096215248108, 0.19839921593666077, 0.20518746972084045, 0.21197572350502014, 0.21876397728919983, 0.2255522459745407, 0.2323404997587204, 0.23912875354290009, 0.24591702222824097, 0.25270527601242065, 0.25949352979660034]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 11.0, 39.0, 119.0, 352.0, 1820487.0, 2372818.0, 315.0, 90.0, 32.0, 17.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2320556640625, -0.20627403259277344, -0.18049240112304688, -0.1547107696533203, -0.12892913818359375, -0.10314750671386719, -0.07736587524414062, -0.05158424377441406, -0.0258026123046875, -2.09808349609375e-05, 0.025760650634765625, 0.05154228210449219, 0.07732391357421875, 0.10310554504394531, 0.12888717651367188, 0.15466880798339844, 0.180450439453125, 0.20623207092285156, 0.23201370239257812, 0.2577953338623047, 0.28357696533203125, 0.3093585968017578, 0.3351402282714844, 0.36092185974121094, 0.3867034912109375, 0.41248512268066406, 0.4382667541503906, 0.4640483856201172, 0.48983001708984375, 0.5156116485595703, 0.5413932800292969, 0.5671749114990234, 0.59295654296875, 0.6187381744384766, 0.6445198059082031, 0.6703014373779297, 0.6960830688476562, 0.7218647003173828, 0.7476463317871094, 0.7734279632568359, 0.7992095947265625, 0.8249912261962891, 0.8507728576660156, 0.8765544891357422, 0.9023361206054688, 0.9281177520751953, 0.9538993835449219, 0.9796810150146484, 1.005462646484375, 1.0312442779541016, 1.0570259094238281, 1.0828075408935547, 1.1085891723632812, 1.1343708038330078, 1.1601524353027344, 1.185934066772461, 1.2117156982421875, 1.237497329711914, 1.2632789611816406, 1.2890605926513672, 1.3148422241210938, 1.3406238555908203, 1.3664054870605469, 1.3921871185302734, 1.41796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 1.0, 10.0, 14.0, 25.0, 36.0, 50.0, 64.0, 63.0, 77.0, 80.0, 76.0, 85.0, 72.0, 77.0, 78.0, 45.0, 39.0, 32.0, 22.0, 11.0, 9.0, 7.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184478759765625, -0.017790555953979492, -0.017133235931396484, -0.016475915908813477, -0.01581859588623047, -0.015161275863647461, -0.014503955841064453, -0.013846635818481445, -0.013189315795898438, -0.01253199577331543, -0.011874675750732422, -0.011217355728149414, -0.010560035705566406, -0.009902715682983398, -0.00924539566040039, -0.008588075637817383, -0.007930755615234375, -0.007273435592651367, -0.006616115570068359, -0.0059587955474853516, -0.005301475524902344, -0.004644155502319336, -0.003986835479736328, -0.0033295154571533203, -0.0026721954345703125, -0.0020148754119873047, -0.0013575553894042969, -0.0007002353668212891, -4.291534423828125e-05, 0.0006144046783447266, 0.0012717247009277344, 0.0019290447235107422, 0.00258636474609375, 0.003243684768676758, 0.0039010047912597656, 0.0045583248138427734, 0.005215644836425781, 0.005872964859008789, 0.006530284881591797, 0.007187604904174805, 0.007844924926757812, 0.00850224494934082, 0.009159564971923828, 0.009816884994506836, 0.010474205017089844, 0.011131525039672852, 0.01178884506225586, 0.012446165084838867, 0.013103485107421875, 0.013760805130004883, 0.01441812515258789, 0.015075445175170898, 0.015732765197753906, 0.016390085220336914, 0.017047405242919922, 0.01770472526550293, 0.018362045288085938, 0.019019365310668945, 0.019676685333251953, 0.02033400535583496, 0.02099132537841797, 0.021648645401000977, 0.022305965423583984, 0.022963285446166992, 0.02362060546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 15.0, 24.0, 39.0, 93.0, 183.0, 426.0, 934.0, 2701.0, 12927.0, 174290.0, 3940919.0, 52533.0, 6475.0, 1663.0, 551.0, 262.0, 115.0, 42.0, 34.0, 16.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05572509765625, -0.05405235290527344, -0.052379608154296875, -0.05070686340332031, -0.04903411865234375, -0.04736137390136719, -0.045688629150390625, -0.04401588439941406, -0.0423431396484375, -0.04067039489746094, -0.038997650146484375, -0.03732490539550781, -0.03565216064453125, -0.03397941589355469, -0.032306671142578125, -0.030633926391601562, -0.028961181640625, -0.027288436889648438, -0.025615692138671875, -0.023942947387695312, -0.02227020263671875, -0.020597457885742188, -0.018924713134765625, -0.017251968383789062, -0.0155792236328125, -0.013906478881835938, -0.012233734130859375, -0.010560989379882812, -0.00888824462890625, -0.0072154998779296875, -0.005542755126953125, -0.0038700103759765625, -0.002197265625, -0.0005245208740234375, 0.001148223876953125, 0.0028209686279296875, 0.00449371337890625, 0.0061664581298828125, 0.007839202880859375, 0.009511947631835938, 0.0111846923828125, 0.012857437133789062, 0.014530181884765625, 0.016202926635742188, 0.01787567138671875, 0.019548416137695312, 0.021221160888671875, 0.022893905639648438, 0.024566650390625, 0.026239395141601562, 0.027912139892578125, 0.029584884643554688, 0.03125762939453125, 0.03293037414550781, 0.034603118896484375, 0.03627586364746094, 0.0379486083984375, 0.03962135314941406, 0.041294097900390625, 0.04296684265136719, 0.04463958740234375, 0.04631233215332031, 0.047985076904296875, 0.04965782165527344, 0.05133056640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 21.0, 19.0, 37.0, 69.0, 88.0, 321.0, 1417.0, 1413.0, 368.0, 109.0, 75.0, 39.0, 24.0, 16.0, 7.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.047454833984375, -0.04623866081237793, -0.04502248764038086, -0.04380631446838379, -0.04259014129638672, -0.04137396812438965, -0.04015779495239258, -0.03894162178039551, -0.03772544860839844, -0.03650927543640137, -0.0352931022644043, -0.03407692909240723, -0.032860755920410156, -0.031644582748413086, -0.030428409576416016, -0.029212236404418945, -0.027996063232421875, -0.026779890060424805, -0.025563716888427734, -0.024347543716430664, -0.023131370544433594, -0.021915197372436523, -0.020699024200439453, -0.019482851028442383, -0.018266677856445312, -0.017050504684448242, -0.015834331512451172, -0.014618158340454102, -0.013401985168457031, -0.012185811996459961, -0.01096963882446289, -0.00975346565246582, -0.00853729248046875, -0.00732111930847168, -0.006104946136474609, -0.004888772964477539, -0.0036725997924804688, -0.0024564266204833984, -0.0012402534484863281, -2.4080276489257812e-05, 0.0011920928955078125, 0.002408266067504883, 0.003624439239501953, 0.0048406124114990234, 0.006056785583496094, 0.007272958755493164, 0.008489131927490234, 0.009705305099487305, 0.010921478271484375, 0.012137651443481445, 0.013353824615478516, 0.014569997787475586, 0.015786170959472656, 0.017002344131469727, 0.018218517303466797, 0.019434690475463867, 0.020650863647460938, 0.021867036819458008, 0.023083209991455078, 0.02429938316345215, 0.02551555633544922, 0.02673172950744629, 0.02794790267944336, 0.02916407585144043, 0.0303802490234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 14.0, 31.0, 63.0, 131.0, 230.0, 250.0, 147.0, 85.0, 18.0, 4.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46390947699546814, -0.4539170265197754, -0.44392457604408264, -0.4339321553707123, -0.42393970489501953, -0.4139472544193268, -0.40395480394363403, -0.3939623534679413, -0.38396990299224854, -0.3739774525165558, -0.36398500204086304, -0.3539925813674927, -0.3440001308917999, -0.3340076804161072, -0.32401522994041443, -0.3140227794647217, -0.3040303587913513, -0.29403790831565857, -0.2840454578399658, -0.27405303716659546, -0.2640605866909027, -0.25406813621520996, -0.2440756857395172, -0.23408323526382446, -0.2240907996892929, -0.21409834921360016, -0.2041059136390686, -0.19411346316337585, -0.1841210126876831, -0.17412857711315155, -0.1641361266374588, -0.15414369106292725, -0.1441512554883957, -0.13415880501270294, -0.12416636943817139, -0.11417391896247864, -0.10418147593736649, -0.09418903291225433, -0.08419658243656158, -0.07420413941144943, -0.06421169638633728, -0.05421925336122513, -0.04422680661082268, -0.03423435986042023, -0.024241916835308075, -0.014249473810195923, -0.004257027059793472, 0.005735419690608978, 0.01572786271572113, 0.02572030760347843, 0.03571275249123573, 0.045705199241638184, 0.055697642266750336, 0.06569008529186249, 0.07568253576755524, 0.08567497879266739, 0.09566742181777954, 0.1056598648428917, 0.11565230786800385, 0.1256447583436966, 0.13563719391822815, 0.1456296443939209, 0.15562209486961365, 0.1656145453453064, 0.17560698091983795]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 12.0, 22.0, 16.0, 25.0, 27.0, 32.0, 50.0, 42.0, 45.0, 57.0, 51.0, 60.0, 54.0, 52.0, 65.0, 63.0, 52.0, 50.0, 35.0, 40.0, 20.0, 19.0, 28.0, 19.0, 7.0, 14.0, 6.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14072805643081665, -0.1366768777370453, -0.13262568414211273, -0.12857449054718018, -0.12452331185340881, -0.12047212570905685, -0.1164209395647049, -0.11236975342035294, -0.10831856727600098, -0.10426738113164902, -0.10021619498729706, -0.0961650088429451, -0.09211382269859314, -0.08806263655424118, -0.08401145040988922, -0.07996026426553726, -0.0759090781211853, -0.07185789197683334, -0.06780670583248138, -0.06375551968812943, -0.059704333543777466, -0.05565314739942551, -0.05160196125507355, -0.04755077511072159, -0.04349958896636963, -0.03944840282201767, -0.03539721667766571, -0.03134603053331375, -0.027294844388961792, -0.023243658244609833, -0.019192472100257874, -0.015141285955905914, -0.011090099811553955, -0.007038913667201996, -0.0029877275228500366, 0.0010634586215019226, 0.005114644765853882, 0.009165830910205841, 0.0132170170545578, 0.01726820319890976, 0.02131938934326172, 0.025370575487613678, 0.029421761631965637, 0.033472947776317596, 0.037524133920669556, 0.041575320065021515, 0.045626506209373474, 0.04967769235372543, 0.05372887849807739, 0.05778006464242935, 0.06183125078678131, 0.06588243693113327, 0.06993362307548523, 0.07398480921983719, 0.07803599536418915, 0.08208718150854111, 0.08613836765289307, 0.09018955379724503, 0.09424073994159698, 0.09829192608594894, 0.1023431122303009, 0.10639429837465286, 0.11044548451900482, 0.11449667066335678, 0.11854785680770874]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 11.0, 22.0, 24.0, 48.0, 162.0, 429.0, 1871.0, 12830.0, 322268.0, 680551.0, 26403.0, 2952.0, 586.0, 212.0, 78.0, 32.0, 20.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06427001953125, -0.062064170837402344, -0.05985832214355469, -0.05765247344970703, -0.055446624755859375, -0.05324077606201172, -0.05103492736816406, -0.048829078674316406, -0.04662322998046875, -0.044417381286621094, -0.04221153259277344, -0.04000568389892578, -0.037799835205078125, -0.03559398651123047, -0.03338813781738281, -0.031182289123535156, -0.0289764404296875, -0.026770591735839844, -0.024564743041992188, -0.02235889434814453, -0.020153045654296875, -0.01794719696044922, -0.015741348266601562, -0.013535499572753906, -0.01132965087890625, -0.009123802185058594, -0.0069179534912109375, -0.004712104797363281, -0.002506256103515625, -0.00030040740966796875, 0.0019054412841796875, 0.004111289978027344, 0.006317138671875, 0.008522987365722656, 0.010728836059570312, 0.012934684753417969, 0.015140533447265625, 0.01734638214111328, 0.019552230834960938, 0.021758079528808594, 0.02396392822265625, 0.026169776916503906, 0.028375625610351562, 0.03058147430419922, 0.032787322998046875, 0.03499317169189453, 0.03719902038574219, 0.039404869079589844, 0.0416107177734375, 0.043816566467285156, 0.04602241516113281, 0.04822826385498047, 0.050434112548828125, 0.05263996124267578, 0.05484580993652344, 0.057051658630371094, 0.05925750732421875, 0.061463356018066406, 0.06366920471191406, 0.06587505340576172, 0.06808090209960938, 0.07028675079345703, 0.07249259948730469, 0.07469844818115234, 0.076904296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 22.0, 20.0, 31.0, 51.0, 61.0, 55.0, 70.0, 52.0, 86.0, 69.0, 90.0, 66.0, 62.0, 64.0, 48.0, 39.0, 18.0, 17.0, 15.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019500732421875, -0.018875837326049805, -0.01825094223022461, -0.017626047134399414, -0.01700115203857422, -0.016376256942749023, -0.015751361846923828, -0.015126466751098633, -0.014501571655273438, -0.013876676559448242, -0.013251781463623047, -0.012626886367797852, -0.012001991271972656, -0.011377096176147461, -0.010752201080322266, -0.01012730598449707, -0.009502410888671875, -0.00887751579284668, -0.008252620697021484, -0.007627725601196289, -0.007002830505371094, -0.0063779354095458984, -0.005753040313720703, -0.005128145217895508, -0.0045032501220703125, -0.003878355026245117, -0.003253459930419922, -0.0026285648345947266, -0.0020036697387695312, -0.001378774642944336, -0.0007538795471191406, -0.0001289844512939453, 0.00049591064453125, 0.0011208057403564453, 0.0017457008361816406, 0.002370595932006836, 0.0029954910278320312, 0.0036203861236572266, 0.004245281219482422, 0.004870176315307617, 0.0054950714111328125, 0.006119966506958008, 0.006744861602783203, 0.0073697566986083984, 0.007994651794433594, 0.008619546890258789, 0.009244441986083984, 0.00986933708190918, 0.010494232177734375, 0.01111912727355957, 0.011744022369384766, 0.012368917465209961, 0.012993812561035156, 0.013618707656860352, 0.014243602752685547, 0.014868497848510742, 0.015493392944335938, 0.016118288040161133, 0.016743183135986328, 0.017368078231811523, 0.01799297332763672, 0.018617868423461914, 0.01924276351928711, 0.019867658615112305, 0.0204925537109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 6.0, 13.0, 17.0, 32.0, 35.0, 85.0, 90.0, 154.0, 201.0, 384.0, 677.0, 1309.0, 3284.0, 10966.0, 59671.0, 569746.0, 348340.0, 40038.0, 8262.0, 2690.0, 1068.0, 556.0, 308.0, 208.0, 139.0, 79.0, 50.0, 35.0, 16.0, 16.0, 22.0, 9.0, 8.0, 8.0, 1.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.037139892578125, -0.03593778610229492, -0.034735679626464844, -0.033533573150634766, -0.03233146667480469, -0.03112936019897461, -0.02992725372314453, -0.028725147247314453, -0.027523040771484375, -0.026320934295654297, -0.02511882781982422, -0.02391672134399414, -0.022714614868164062, -0.021512508392333984, -0.020310401916503906, -0.019108295440673828, -0.01790618896484375, -0.016704082489013672, -0.015501976013183594, -0.014299869537353516, -0.013097763061523438, -0.01189565658569336, -0.010693550109863281, -0.009491443634033203, -0.008289337158203125, -0.007087230682373047, -0.005885124206542969, -0.004683017730712891, -0.0034809112548828125, -0.0022788047790527344, -0.0010766983032226562, 0.00012540817260742188, 0.0013275146484375, 0.002529621124267578, 0.0037317276000976562, 0.004933834075927734, 0.0061359405517578125, 0.007338047027587891, 0.008540153503417969, 0.009742259979248047, 0.010944366455078125, 0.012146472930908203, 0.013348579406738281, 0.01455068588256836, 0.015752792358398438, 0.016954898834228516, 0.018157005310058594, 0.019359111785888672, 0.02056121826171875, 0.021763324737548828, 0.022965431213378906, 0.024167537689208984, 0.025369644165039062, 0.02657175064086914, 0.02777385711669922, 0.028975963592529297, 0.030178070068359375, 0.03138017654418945, 0.03258228302001953, 0.03378438949584961, 0.03498649597167969, 0.036188602447509766, 0.037390708923339844, 0.03859281539916992, 0.039794921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 14.0, 10.0, 15.0, 17.0, 15.0, 19.0, 33.0, 22.0, 35.0, 50.0, 47.0, 51.0, 56.0, 53.0, 45.0, 55.0, 59.0, 52.0, 54.0, 48.0, 44.0, 31.0, 37.0, 32.0, 20.0, 17.0, 13.0, 8.0, 6.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04840087890625, -0.0467371940612793, -0.045073509216308594, -0.04340982437133789, -0.04174613952636719, -0.040082454681396484, -0.03841876983642578, -0.03675508499145508, -0.035091400146484375, -0.03342771530151367, -0.03176403045654297, -0.030100345611572266, -0.028436660766601562, -0.02677297592163086, -0.025109291076660156, -0.023445606231689453, -0.02178192138671875, -0.020118236541748047, -0.018454551696777344, -0.01679086685180664, -0.015127182006835938, -0.013463497161865234, -0.011799812316894531, -0.010136127471923828, -0.008472442626953125, -0.006808757781982422, -0.005145072937011719, -0.0034813880920410156, -0.0018177032470703125, -0.00015401840209960938, 0.0015096664428710938, 0.003173351287841797, 0.0048370361328125, 0.006500720977783203, 0.008164405822753906, 0.00982809066772461, 0.011491775512695312, 0.013155460357666016, 0.014819145202636719, 0.016482830047607422, 0.018146514892578125, 0.019810199737548828, 0.02147388458251953, 0.023137569427490234, 0.024801254272460938, 0.02646493911743164, 0.028128623962402344, 0.029792308807373047, 0.03145599365234375, 0.03311967849731445, 0.034783363342285156, 0.03644704818725586, 0.03811073303222656, 0.039774417877197266, 0.04143810272216797, 0.04310178756713867, 0.044765472412109375, 0.04642915725708008, 0.04809284210205078, 0.049756526947021484, 0.05142021179199219, 0.05308389663696289, 0.054747581481933594, 0.0564112663269043, 0.058074951171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 4.0, 2.0, 8.0, 9.0, 14.0, 11.0, 29.0, 36.0, 76.0, 123.0, 170.0, 288.0, 569.0, 1153.0, 2681.0, 9104.0, 508395.0, 511600.0, 9208.0, 2680.0, 1062.0, 528.0, 307.0, 183.0, 100.0, 48.0, 44.0, 34.0, 19.0, 13.0, 6.0, 9.0, 4.0, 9.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07330322265625, -0.07101249694824219, -0.06872177124023438, -0.06643104553222656, -0.06414031982421875, -0.06184959411621094, -0.059558868408203125, -0.05726814270019531, -0.0549774169921875, -0.05268669128417969, -0.050395965576171875, -0.04810523986816406, -0.04581451416015625, -0.04352378845214844, -0.041233062744140625, -0.03894233703613281, -0.036651611328125, -0.03436088562011719, -0.032070159912109375, -0.029779434204101562, -0.02748870849609375, -0.025197982788085938, -0.022907257080078125, -0.020616531372070312, -0.0183258056640625, -0.016035079956054688, -0.013744354248046875, -0.011453628540039062, -0.00916290283203125, -0.0068721771240234375, -0.004581451416015625, -0.0022907257080078125, 0.0, 0.0022907257080078125, 0.004581451416015625, 0.0068721771240234375, 0.00916290283203125, 0.011453628540039062, 0.013744354248046875, 0.016035079956054688, 0.0183258056640625, 0.020616531372070312, 0.022907257080078125, 0.025197982788085938, 0.02748870849609375, 0.029779434204101562, 0.032070159912109375, 0.03436088562011719, 0.036651611328125, 0.03894233703613281, 0.041233062744140625, 0.04352378845214844, 0.04581451416015625, 0.04810523986816406, 0.050395965576171875, 0.05268669128417969, 0.0549774169921875, 0.05726814270019531, 0.059558868408203125, 0.06184959411621094, 0.06414031982421875, 0.06643104553222656, 0.06872177124023438, 0.07101249694824219, 0.07330322265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 13.0, 4.0, 4.0, 15.0, 15.0, 16.0, 19.0, 24.0, 36.0, 60.0, 94.0, 134.0, 157.0, 116.0, 83.0, 55.0, 23.0, 32.0, 14.0, 16.0, 11.0, 10.0, 5.0, 5.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.8770179748535156e-05, -5.723442882299423e-05, -5.569867789745331e-05, -5.4162926971912384e-05, -5.262717604637146e-05, -5.1091425120830536e-05, -4.955567419528961e-05, -4.801992326974869e-05, -4.6484172344207764e-05, -4.494842141866684e-05, -4.3412670493125916e-05, -4.187691956758499e-05, -4.034116864204407e-05, -3.880541771650314e-05, -3.726966679096222e-05, -3.5733915865421295e-05, -3.419816493988037e-05, -3.266241401433945e-05, -3.112666308879852e-05, -2.95909121632576e-05, -2.8055161237716675e-05, -2.651941031217575e-05, -2.4983659386634827e-05, -2.3447908461093903e-05, -2.191215753555298e-05, -2.0376406610012054e-05, -1.884065568447113e-05, -1.7304904758930206e-05, -1.5769153833389282e-05, -1.4233402907848358e-05, -1.2697651982307434e-05, -1.116190105676651e-05, -9.626150131225586e-06, -8.090399205684662e-06, -6.554648280143738e-06, -5.018897354602814e-06, -3.4831464290618896e-06, -1.9473955035209656e-06, -4.116445779800415e-07, 1.1241063475608826e-06, 2.6598572731018066e-06, 4.195608198642731e-06, 5.731359124183655e-06, 7.267110049724579e-06, 8.802860975265503e-06, 1.0338611900806427e-05, 1.1874362826347351e-05, 1.3410113751888275e-05, 1.49458646774292e-05, 1.6481615602970123e-05, 1.8017366528511047e-05, 1.955311745405197e-05, 2.1088868379592896e-05, 2.262461930513382e-05, 2.4160370230674744e-05, 2.5696121156215668e-05, 2.7231872081756592e-05, 2.8767623007297516e-05, 3.030337393283844e-05, 3.1839124858379364e-05, 3.337487578392029e-05, 3.491062670946121e-05, 3.6446377635002136e-05, 3.798212856054306e-05, 3.9517879486083984e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 10.0, 8.0, 7.0, 12.0, 19.0, 23.0, 20.0, 43.0, 68.0, 90.0, 177.0, 351.0, 690.0, 1521.0, 3946.0, 14294.0, 148026.0, 818587.0, 47611.0, 7927.0, 2686.0, 1187.0, 555.0, 276.0, 143.0, 103.0, 43.0, 33.0, 23.0, 16.0, 15.0, 8.0, 3.0, 8.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0341796875, -0.033121585845947266, -0.03206348419189453, -0.031005382537841797, -0.029947280883789062, -0.028889179229736328, -0.027831077575683594, -0.02677297592163086, -0.025714874267578125, -0.02465677261352539, -0.023598670959472656, -0.022540569305419922, -0.021482467651367188, -0.020424365997314453, -0.01936626434326172, -0.018308162689208984, -0.01725006103515625, -0.016191959381103516, -0.015133857727050781, -0.014075756072998047, -0.013017654418945312, -0.011959552764892578, -0.010901451110839844, -0.00984334945678711, -0.008785247802734375, -0.007727146148681641, -0.006669044494628906, -0.005610942840576172, -0.0045528411865234375, -0.003494739532470703, -0.0024366378784179688, -0.0013785362243652344, -0.0003204345703125, 0.0007376670837402344, 0.0017957687377929688, 0.002853870391845703, 0.0039119720458984375, 0.004970073699951172, 0.006028175354003906, 0.007086277008056641, 0.008144378662109375, 0.00920248031616211, 0.010260581970214844, 0.011318683624267578, 0.012376785278320312, 0.013434886932373047, 0.014492988586425781, 0.015551090240478516, 0.01660919189453125, 0.017667293548583984, 0.01872539520263672, 0.019783496856689453, 0.020841598510742188, 0.021899700164794922, 0.022957801818847656, 0.02401590347290039, 0.025074005126953125, 0.02613210678100586, 0.027190208435058594, 0.028248310089111328, 0.029306411743164062, 0.030364513397216797, 0.03142261505126953, 0.032480716705322266, 0.033538818359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 7.0, 8.0, 16.0, 21.0, 19.0, 40.0, 49.0, 51.0, 79.0, 99.0, 96.0, 99.0, 89.0, 70.0, 68.0, 45.0, 27.0, 26.0, 16.0, 13.0, 11.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.020294189453125, -0.019695281982421875, -0.01909637451171875, -0.018497467041015625, -0.0178985595703125, -0.017299652099609375, -0.01670074462890625, -0.016101837158203125, -0.0155029296875, -0.014904022216796875, -0.01430511474609375, -0.013706207275390625, -0.0131072998046875, -0.012508392333984375, -0.01190948486328125, -0.011310577392578125, -0.010711669921875, -0.010112762451171875, -0.00951385498046875, -0.008914947509765625, -0.0083160400390625, -0.007717132568359375, -0.00711822509765625, -0.006519317626953125, -0.00592041015625, -0.005321502685546875, -0.00472259521484375, -0.004123687744140625, -0.0035247802734375, -0.002925872802734375, -0.00232696533203125, -0.001728057861328125, -0.001129150390625, -0.000530242919921875, 6.866455078125e-05, 0.000667572021484375, 0.0012664794921875, 0.001865386962890625, 0.00246429443359375, 0.003063201904296875, 0.003662109375, 0.004261016845703125, 0.00485992431640625, 0.005458831787109375, 0.0060577392578125, 0.006656646728515625, 0.00725555419921875, 0.007854461669921875, 0.008453369140625, 0.009052276611328125, 0.00965118408203125, 0.010250091552734375, 0.0108489990234375, 0.011447906494140625, 0.01204681396484375, 0.012645721435546875, 0.01324462890625, 0.013843536376953125, 0.01444244384765625, 0.015041351318359375, 0.0156402587890625, 0.016239166259765625, 0.01683807373046875, 0.017436981201171875, 0.018035888671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 29.0, 101.0, 571.0, 261.0, 30.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6955938339233398, -1.6507084369659424, -1.6058229207992554, -1.560937523841858, -1.516052007675171, -1.4711666107177734, -1.426281213760376, -1.3813958168029785, -1.3365103006362915, -1.291624903678894, -1.246739387512207, -1.2018539905548096, -1.156968593597412, -1.112083077430725, -1.0671976804733276, -1.0223121643066406, -0.9774267673492432, -0.9325413107872009, -0.8876558542251587, -0.8427704572677612, -0.797885000705719, -0.7529995441436768, -0.7081141471862793, -0.6632286906242371, -0.6183432340621948, -0.5734577775001526, -0.5285723209381104, -0.4836869239807129, -0.43880146741867065, -0.3939160108566284, -0.34903058409690857, -0.3041451573371887, -0.2592597007751465, -0.21437425911426544, -0.1694888174533844, -0.12460337579250336, -0.07971793413162231, -0.03483249247074127, 0.01005294919013977, 0.05493837594985962, 0.09982383251190186, 0.1447092741727829, 0.18959471583366394, 0.23448015749454498, 0.279365599155426, 0.32425105571746826, 0.3691364824771881, 0.41402190923690796, 0.4589073657989502, 0.5037928223609924, 0.5486782789230347, 0.5935636758804321, 0.6384491324424744, 0.6833345890045166, 0.7282199859619141, 0.7731054425239563, 0.8179908990859985, 0.8628763556480408, 0.907761812210083, 0.9526472091674805, 0.9975326657295227, 1.042418122291565, 1.0873035192489624, 1.1321890354156494, 1.1770744323730469]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 10.0, 5.0, 5.0, 6.0, 11.0, 10.0, 22.0, 17.0, 24.0, 26.0, 28.0, 32.0, 30.0, 23.0, 41.0, 51.0, 57.0, 66.0, 65.0, 51.0, 50.0, 28.0, 41.0, 48.0, 34.0, 33.0, 27.0, 24.0, 27.0, 19.0, 13.0, 17.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.226351797580719, -0.21975180506706238, -0.21315181255340576, -0.20655182003974915, -0.19995182752609253, -0.1933518350124359, -0.1867518573999405, -0.18015186488628387, -0.17355187237262726, -0.16695187985897064, -0.16035188734531403, -0.1537518948316574, -0.147151917219162, -0.14055192470550537, -0.13395193219184875, -0.12735193967819214, -0.12075194716453552, -0.1141519546508789, -0.10755196213722229, -0.10095197707414627, -0.09435198456048965, -0.08775199204683304, -0.08115200698375702, -0.0745520144701004, -0.06795202195644379, -0.06135202944278717, -0.05475204065442085, -0.048152051866054535, -0.04155205935239792, -0.0349520668387413, -0.028352078050374985, -0.021752089262008667, -0.01515209674835205, -0.008552106097340584, -0.0019521154463291168, 0.00464787520468235, 0.011247865855693817, 0.017847858369350433, 0.02444784715771675, 0.03104783594608307, 0.037647828459739685, 0.0442478209733963, 0.05084780976176262, 0.05744779855012894, 0.06404779106378555, 0.07064778357744217, 0.07724776864051819, 0.0838477611541748, 0.09044775366783142, 0.09704774618148804, 0.10364773869514465, 0.11024772375822067, 0.11684771627187729, 0.1234477087855339, 0.13004769384860992, 0.13664768636226654, 0.14324767887592316, 0.14984767138957977, 0.1564476639032364, 0.163047656416893, 0.16964763402938843, 0.17624762654304504, 0.18284761905670166, 0.18944761157035828, 0.1960476040840149]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 12.0, 20.0, 33.0, 57.0, 108.0, 342.0, 2243.0, 649141.0, 3538292.0, 3303.0, 383.0, 145.0, 75.0, 52.0, 34.0, 14.0, 8.0, 8.0, 10.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050872802734375, -0.04665803909301758, -0.042443275451660156, -0.038228511810302734, -0.03401374816894531, -0.02979898452758789, -0.02558422088623047, -0.021369457244873047, -0.017154693603515625, -0.012939929962158203, -0.008725166320800781, -0.004510402679443359, -0.0002956390380859375, 0.003919124603271484, 0.008133888244628906, 0.012348651885986328, 0.01656341552734375, 0.020778179168701172, 0.024992942810058594, 0.029207706451416016, 0.03342247009277344, 0.03763723373413086, 0.04185199737548828, 0.0460667610168457, 0.050281524658203125, 0.05449628829956055, 0.05871105194091797, 0.06292581558227539, 0.06714057922363281, 0.07135534286499023, 0.07557010650634766, 0.07978487014770508, 0.0839996337890625, 0.08821439743041992, 0.09242916107177734, 0.09664392471313477, 0.10085868835449219, 0.10507345199584961, 0.10928821563720703, 0.11350297927856445, 0.11771774291992188, 0.1219325065612793, 0.12614727020263672, 0.13036203384399414, 0.13457679748535156, 0.13879156112670898, 0.1430063247680664, 0.14722108840942383, 0.15143585205078125, 0.15565061569213867, 0.1598653793334961, 0.16408014297485352, 0.16829490661621094, 0.17250967025756836, 0.17672443389892578, 0.1809391975402832, 0.18515396118164062, 0.18936872482299805, 0.19358348846435547, 0.1977982521057129, 0.2020130157470703, 0.20622777938842773, 0.21044254302978516, 0.21465730667114258, 0.2188720703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 14.0, 18.0, 30.0, 27.0, 41.0, 50.0, 73.0, 68.0, 70.0, 95.0, 84.0, 77.0, 65.0, 64.0, 46.0, 44.0, 40.0, 22.0, 18.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0237274169921875, -0.023083925247192383, -0.022440433502197266, -0.02179694175720215, -0.02115345001220703, -0.020509958267211914, -0.019866466522216797, -0.01922297477722168, -0.018579483032226562, -0.017935991287231445, -0.017292499542236328, -0.01664900779724121, -0.016005516052246094, -0.015362024307250977, -0.01471853256225586, -0.014075040817260742, -0.013431549072265625, -0.012788057327270508, -0.01214456558227539, -0.011501073837280273, -0.010857582092285156, -0.010214090347290039, -0.009570598602294922, -0.008927106857299805, -0.008283615112304688, -0.00764012336730957, -0.006996631622314453, -0.006353139877319336, -0.005709648132324219, -0.0050661563873291016, -0.004422664642333984, -0.003779172897338867, -0.00313568115234375, -0.002492189407348633, -0.0018486976623535156, -0.0012052059173583984, -0.0005617141723632812, 8.177757263183594e-05, 0.0007252693176269531, 0.0013687610626220703, 0.0020122528076171875, 0.0026557445526123047, 0.003299236297607422, 0.003942728042602539, 0.004586219787597656, 0.0052297115325927734, 0.005873203277587891, 0.006516695022583008, 0.007160186767578125, 0.007803678512573242, 0.00844717025756836, 0.009090662002563477, 0.009734153747558594, 0.010377645492553711, 0.011021137237548828, 0.011664628982543945, 0.012308120727539062, 0.01295161247253418, 0.013595104217529297, 0.014238595962524414, 0.014882087707519531, 0.015525579452514648, 0.016169071197509766, 0.016812562942504883, 0.0174560546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 15.0, 10.0, 18.0, 21.0, 26.0, 53.0, 68.0, 81.0, 192.0, 434.0, 1425.0, 8271.0, 129836.0, 3949546.0, 93662.0, 7759.0, 1648.0, 550.0, 248.0, 112.0, 74.0, 56.0, 46.0, 33.0, 32.0, 17.0, 11.0, 10.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0782470703125, -0.07609987258911133, -0.07395267486572266, -0.07180547714233398, -0.06965827941894531, -0.06751108169555664, -0.06536388397216797, -0.0632166862487793, -0.061069488525390625, -0.05892229080200195, -0.05677509307861328, -0.05462789535522461, -0.05248069763183594, -0.050333499908447266, -0.048186302185058594, -0.04603910446166992, -0.04389190673828125, -0.04174470901489258, -0.039597511291503906, -0.037450313568115234, -0.03530311584472656, -0.03315591812133789, -0.03100872039794922, -0.028861522674560547, -0.026714324951171875, -0.024567127227783203, -0.02241992950439453, -0.02027273178100586, -0.018125534057617188, -0.015978336334228516, -0.013831138610839844, -0.011683940887451172, -0.0095367431640625, -0.007389545440673828, -0.005242347717285156, -0.0030951499938964844, -0.0009479522705078125, 0.0011992454528808594, 0.0033464431762695312, 0.005493640899658203, 0.007640838623046875, 0.009788036346435547, 0.011935234069824219, 0.01408243179321289, 0.016229629516601562, 0.018376827239990234, 0.020524024963378906, 0.022671222686767578, 0.02481842041015625, 0.026965618133544922, 0.029112815856933594, 0.031260013580322266, 0.03340721130371094, 0.03555440902709961, 0.03770160675048828, 0.03984880447387695, 0.041996002197265625, 0.0441431999206543, 0.04629039764404297, 0.04843759536743164, 0.05058479309082031, 0.052731990814208984, 0.054879188537597656, 0.05702638626098633, 0.059173583984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 10.0, 5.0, 10.0, 18.0, 20.0, 27.0, 42.0, 46.0, 68.0, 130.0, 249.0, 635.0, 1053.0, 840.0, 351.0, 165.0, 111.0, 66.0, 51.0, 36.0, 30.0, 31.0, 11.0, 9.0, 13.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.031982421875, -0.030908584594726562, -0.029834747314453125, -0.028760910034179688, -0.02768707275390625, -0.026613235473632812, -0.025539398193359375, -0.024465560913085938, -0.0233917236328125, -0.022317886352539062, -0.021244049072265625, -0.020170211791992188, -0.01909637451171875, -0.018022537231445312, -0.016948699951171875, -0.015874862670898438, -0.014801025390625, -0.013727188110351562, -0.012653350830078125, -0.011579513549804688, -0.01050567626953125, -0.009431838989257812, -0.008358001708984375, -0.0072841644287109375, -0.0062103271484375, -0.0051364898681640625, -0.004062652587890625, -0.0029888153076171875, -0.00191497802734375, -0.0008411407470703125, 0.000232696533203125, 0.0013065338134765625, 0.00238037109375, 0.0034542083740234375, 0.004528045654296875, 0.0056018829345703125, 0.00667572021484375, 0.0077495574951171875, 0.008823394775390625, 0.009897232055664062, 0.0109710693359375, 0.012044906616210938, 0.013118743896484375, 0.014192581176757812, 0.01526641845703125, 0.016340255737304688, 0.017414093017578125, 0.018487930297851562, 0.019561767578125, 0.020635604858398438, 0.021709442138671875, 0.022783279418945312, 0.02385711669921875, 0.024930953979492188, 0.026004791259765625, 0.027078628540039062, 0.0281524658203125, 0.029226303100585938, 0.030300140380859375, 0.03137397766113281, 0.03244781494140625, 0.03352165222167969, 0.034595489501953125, 0.03566932678222656, 0.0367431640625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 5.0, 11.0, 12.0, 39.0, 58.0, 167.0, 235.0, 249.0, 119.0, 44.0, 24.0, 18.0, 10.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5413346290588379, -0.5231657028198242, -0.5049967765808105, -0.4868278503417969, -0.4686588943004608, -0.45048996806144714, -0.43232104182243347, -0.4141520857810974, -0.39598315954208374, -0.37781423330307007, -0.3596453070640564, -0.3414763808250427, -0.32330742478370667, -0.305138498544693, -0.2869695723056793, -0.26880061626434326, -0.250631719827652, -0.2324627935886383, -0.21429385244846344, -0.19612492620944977, -0.1779559850692749, -0.15978705883026123, -0.14161813259124756, -0.12344919145107269, -0.10528026521205902, -0.08711133152246475, -0.06894239783287048, -0.05077347159385681, -0.03260453790426254, -0.014435604214668274, 0.003733322024345398, 0.021902263164520264, 0.040071189403533936, 0.058240123093128204, 0.07640905678272247, 0.09457798302173615, 0.11274691671133041, 0.13091585040092468, 0.14908477663993835, 0.16725371778011322, 0.1854226440191269, 0.20359157025814056, 0.22176051139831543, 0.2399294376373291, 0.2580983638763428, 0.27626729011535645, 0.2944362163543701, 0.3126051723957062, 0.33077409863471985, 0.3489430248737335, 0.3671119511127472, 0.38528090715408325, 0.4034498333930969, 0.4216187596321106, 0.43978768587112427, 0.45795661211013794, 0.4761255383491516, 0.4942944645881653, 0.512463390827179, 0.5306323170661926, 0.5488012433052063, 0.5669702291488647, 0.5851391553878784, 0.6033080816268921, 0.6214770078659058]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 2.0, 5.0, 7.0, 12.0, 11.0, 11.0, 17.0, 12.0, 29.0, 28.0, 24.0, 56.0, 35.0, 48.0, 57.0, 39.0, 52.0, 53.0, 38.0, 57.0, 56.0, 44.0, 45.0, 27.0, 32.0, 21.0, 30.0, 24.0, 23.0, 23.0, 15.0, 20.0, 13.0, 5.0, 5.0, 4.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15900921821594238, -0.15388479828834534, -0.1487603783607483, -0.14363594353199005, -0.138511523604393, -0.13338710367679596, -0.12826266884803772, -0.12313824892044067, -0.11801382899284363, -0.11288940906524658, -0.10776498168706894, -0.1026405543088913, -0.09751613438129425, -0.0923917144536972, -0.08726728707551956, -0.08214285969734192, -0.07701843976974487, -0.07189401984214783, -0.06676959246397018, -0.06164516881108284, -0.056520745158195496, -0.05139632150530815, -0.04627189785242081, -0.04114747419953346, -0.03602305054664612, -0.030898626893758774, -0.02577420324087143, -0.020649779587984085, -0.01552535593509674, -0.010400932282209396, -0.005276508629322052, -0.00015208497643470764, 0.004972338676452637, 0.010096762329339981, 0.015221185982227325, 0.02034560963511467, 0.025470033288002014, 0.03059445694088936, 0.0357188805937767, 0.04084330424666405, 0.04596772789955139, 0.051092151552438736, 0.05621657520532608, 0.061340998858213425, 0.06646542251110077, 0.07158984243869781, 0.07671426981687546, 0.0818386971950531, 0.08696311712265015, 0.09208753705024719, 0.09721196442842484, 0.10233639180660248, 0.10746081173419952, 0.11258523166179657, 0.11770965903997421, 0.12283408641815186, 0.1279585063457489, 0.13308292627334595, 0.138207346200943, 0.14333178102970123, 0.14845620095729828, 0.15358062088489532, 0.15870505571365356, 0.1638294756412506, 0.16895389556884766]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 7.0, 8.0, 9.0, 10.0, 23.0, 21.0, 30.0, 75.0, 145.0, 252.0, 523.0, 1409.0, 3740.0, 11525.0, 42212.0, 169236.0, 458044.0, 266281.0, 68443.0, 17936.0, 5316.0, 1867.0, 729.0, 328.0, 176.0, 87.0, 40.0, 25.0, 13.0, 14.0, 11.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0272369384765625, -0.026215791702270508, -0.025194644927978516, -0.024173498153686523, -0.02315235137939453, -0.02213120460510254, -0.021110057830810547, -0.020088911056518555, -0.019067764282226562, -0.01804661750793457, -0.017025470733642578, -0.016004323959350586, -0.014983177185058594, -0.013962030410766602, -0.01294088363647461, -0.011919736862182617, -0.010898590087890625, -0.009877443313598633, -0.00885629653930664, -0.007835149765014648, -0.006814002990722656, -0.005792856216430664, -0.004771709442138672, -0.0037505626678466797, -0.0027294158935546875, -0.0017082691192626953, -0.0006871223449707031, 0.00033402442932128906, 0.0013551712036132812, 0.0023763179779052734, 0.0033974647521972656, 0.004418611526489258, 0.00543975830078125, 0.006460905075073242, 0.007482051849365234, 0.008503198623657227, 0.009524345397949219, 0.010545492172241211, 0.011566638946533203, 0.012587785720825195, 0.013608932495117188, 0.01463007926940918, 0.015651226043701172, 0.016672372817993164, 0.017693519592285156, 0.01871466636657715, 0.01973581314086914, 0.020756959915161133, 0.021778106689453125, 0.022799253463745117, 0.02382040023803711, 0.0248415470123291, 0.025862693786621094, 0.026883840560913086, 0.027904987335205078, 0.02892613410949707, 0.029947280883789062, 0.030968427658081055, 0.03198957443237305, 0.03301072120666504, 0.03403186798095703, 0.03505301475524902, 0.036074161529541016, 0.03709530830383301, 0.038116455078125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 18.0, 17.0, 33.0, 29.0, 35.0, 51.0, 65.0, 58.0, 66.0, 75.0, 70.0, 70.0, 61.0, 63.0, 51.0, 45.0, 43.0, 24.0, 22.0, 23.0, 12.0, 15.0, 11.0, 6.0, 6.0, 2.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0211944580078125, -0.020598173141479492, -0.020001888275146484, -0.019405603408813477, -0.01880931854248047, -0.01821303367614746, -0.017616748809814453, -0.017020463943481445, -0.016424179077148438, -0.01582789421081543, -0.015231609344482422, -0.014635324478149414, -0.014039039611816406, -0.013442754745483398, -0.01284646987915039, -0.012250185012817383, -0.011653900146484375, -0.011057615280151367, -0.01046133041381836, -0.009865045547485352, -0.009268760681152344, -0.008672475814819336, -0.008076190948486328, -0.00747990608215332, -0.0068836212158203125, -0.006287336349487305, -0.005691051483154297, -0.005094766616821289, -0.004498481750488281, -0.0039021968841552734, -0.0033059120178222656, -0.002709627151489258, -0.00211334228515625, -0.0015170574188232422, -0.0009207725524902344, -0.00032448768615722656, 0.00027179718017578125, 0.0008680820465087891, 0.0014643669128417969, 0.0020606517791748047, 0.0026569366455078125, 0.0032532215118408203, 0.003849506378173828, 0.004445791244506836, 0.005042076110839844, 0.0056383609771728516, 0.006234645843505859, 0.006830930709838867, 0.007427215576171875, 0.008023500442504883, 0.00861978530883789, 0.009216070175170898, 0.009812355041503906, 0.010408639907836914, 0.011004924774169922, 0.01160120964050293, 0.012197494506835938, 0.012793779373168945, 0.013390064239501953, 0.013986349105834961, 0.014582633972167969, 0.015178918838500977, 0.015775203704833984, 0.016371488571166992, 0.0169677734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 7.0, 16.0, 7.0, 16.0, 23.0, 18.0, 34.0, 59.0, 61.0, 135.0, 192.0, 291.0, 478.0, 932.0, 1773.0, 4521.0, 17330.0, 166408.0, 771772.0, 67857.0, 10104.0, 3187.0, 1399.0, 739.0, 442.0, 242.0, 152.0, 100.0, 70.0, 55.0, 32.0, 23.0, 14.0, 10.0, 7.0, 8.0, 9.0, 4.0, 4.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06573486328125, -0.06370162963867188, -0.06166839599609375, -0.059635162353515625, -0.0576019287109375, -0.055568695068359375, -0.05353546142578125, -0.051502227783203125, -0.049468994140625, -0.047435760498046875, -0.04540252685546875, -0.043369293212890625, -0.0413360595703125, -0.039302825927734375, -0.03726959228515625, -0.035236358642578125, -0.033203125, -0.031169891357421875, -0.02913665771484375, -0.027103424072265625, -0.0250701904296875, -0.023036956787109375, -0.02100372314453125, -0.018970489501953125, -0.016937255859375, -0.014904022216796875, -0.01287078857421875, -0.010837554931640625, -0.0088043212890625, -0.006771087646484375, -0.00473785400390625, -0.002704620361328125, -0.00067138671875, 0.001361846923828125, 0.00339508056640625, 0.005428314208984375, 0.0074615478515625, 0.009494781494140625, 0.01152801513671875, 0.013561248779296875, 0.015594482421875, 0.017627716064453125, 0.01966094970703125, 0.021694183349609375, 0.0237274169921875, 0.025760650634765625, 0.02779388427734375, 0.029827117919921875, 0.0318603515625, 0.033893585205078125, 0.03592681884765625, 0.037960052490234375, 0.0399932861328125, 0.042026519775390625, 0.04405975341796875, 0.046092987060546875, 0.048126220703125, 0.050159454345703125, 0.05219268798828125, 0.054225921630859375, 0.0562591552734375, 0.058292388916015625, 0.06032562255859375, 0.062358856201171875, 0.06439208984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 6.0, 6.0, 10.0, 12.0, 21.0, 14.0, 17.0, 30.0, 28.0, 38.0, 41.0, 37.0, 46.0, 54.0, 51.0, 45.0, 50.0, 53.0, 64.0, 51.0, 55.0, 39.0, 27.0, 36.0, 22.0, 28.0, 28.0, 16.0, 15.0, 9.0, 3.0, 12.0, 10.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0634765625, -0.061443328857421875, -0.05941009521484375, -0.057376861572265625, -0.0553436279296875, -0.053310394287109375, -0.05127716064453125, -0.049243927001953125, -0.047210693359375, -0.045177459716796875, -0.04314422607421875, -0.041110992431640625, -0.0390777587890625, -0.037044525146484375, -0.03501129150390625, -0.032978057861328125, -0.03094482421875, -0.028911590576171875, -0.02687835693359375, -0.024845123291015625, -0.0228118896484375, -0.020778656005859375, -0.01874542236328125, -0.016712188720703125, -0.014678955078125, -0.012645721435546875, -0.01061248779296875, -0.008579254150390625, -0.0065460205078125, -0.004512786865234375, -0.00247955322265625, -0.000446319580078125, 0.0015869140625, 0.003620147705078125, 0.00565338134765625, 0.007686614990234375, 0.0097198486328125, 0.011753082275390625, 0.01378631591796875, 0.015819549560546875, 0.017852783203125, 0.019886016845703125, 0.02191925048828125, 0.023952484130859375, 0.0259857177734375, 0.028018951416015625, 0.03005218505859375, 0.032085418701171875, 0.03411865234375, 0.036151885986328125, 0.03818511962890625, 0.040218353271484375, 0.0422515869140625, 0.044284820556640625, 0.04631805419921875, 0.048351287841796875, 0.050384521484375, 0.052417755126953125, 0.05445098876953125, 0.056484222412109375, 0.0585174560546875, 0.060550689697265625, 0.06258392333984375, 0.06461715698242188, 0.066650390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 5.0, 17.0, 18.0, 29.0, 28.0, 51.0, 66.0, 101.0, 150.0, 239.0, 438.0, 722.0, 1157.0, 2135.0, 4280.0, 10792.0, 49205.0, 919576.0, 40746.0, 9907.0, 4026.0, 2007.0, 1083.0, 632.0, 401.0, 250.0, 145.0, 110.0, 69.0, 49.0, 33.0, 21.0, 15.0, 10.0, 6.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0], "bins": [-0.07757568359375, -0.07560968399047852, -0.07364368438720703, -0.07167768478393555, -0.06971168518066406, -0.06774568557739258, -0.0657796859741211, -0.06381368637084961, -0.061847686767578125, -0.05988168716430664, -0.057915687561035156, -0.05594968795776367, -0.05398368835449219, -0.0520176887512207, -0.05005168914794922, -0.048085689544677734, -0.04611968994140625, -0.044153690338134766, -0.04218769073486328, -0.0402216911315918, -0.03825569152832031, -0.03628969192504883, -0.034323692321777344, -0.03235769271850586, -0.030391693115234375, -0.02842569351196289, -0.026459693908691406, -0.024493694305419922, -0.022527694702148438, -0.020561695098876953, -0.01859569549560547, -0.016629695892333984, -0.0146636962890625, -0.012697696685791016, -0.010731697082519531, -0.008765697479248047, -0.0067996978759765625, -0.004833698272705078, -0.0028676986694335938, -0.0009016990661621094, 0.001064300537109375, 0.0030303001403808594, 0.004996299743652344, 0.006962299346923828, 0.008928298950195312, 0.010894298553466797, 0.012860298156738281, 0.014826297760009766, 0.01679229736328125, 0.018758296966552734, 0.02072429656982422, 0.022690296173095703, 0.024656295776367188, 0.026622295379638672, 0.028588294982910156, 0.03055429458618164, 0.032520294189453125, 0.03448629379272461, 0.036452293395996094, 0.03841829299926758, 0.04038429260253906, 0.04235029220581055, 0.04431629180908203, 0.046282291412353516, 0.048248291015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 12.0, 7.0, 13.0, 14.0, 16.0, 15.0, 26.0, 32.0, 45.0, 58.0, 73.0, 123.0, 138.0, 101.0, 71.0, 47.0, 35.0, 26.0, 24.0, 19.0, 9.0, 16.0, 15.0, 7.0, 11.0, 7.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.704164505004883e-05, -5.546770989894867e-05, -5.389377474784851e-05, -5.231983959674835e-05, -5.074590444564819e-05, -4.9171969294548035e-05, -4.7598034143447876e-05, -4.602409899234772e-05, -4.445016384124756e-05, -4.28762286901474e-05, -4.130229353904724e-05, -3.972835838794708e-05, -3.8154423236846924e-05, -3.6580488085746765e-05, -3.5006552934646606e-05, -3.343261778354645e-05, -3.185868263244629e-05, -3.028474748134613e-05, -2.871081233024597e-05, -2.7136877179145813e-05, -2.5562942028045654e-05, -2.3989006876945496e-05, -2.2415071725845337e-05, -2.0841136574745178e-05, -1.926720142364502e-05, -1.769326627254486e-05, -1.6119331121444702e-05, -1.4545395970344543e-05, -1.2971460819244385e-05, -1.1397525668144226e-05, -9.823590517044067e-06, -8.249655365943909e-06, -6.67572021484375e-06, -5.101785063743591e-06, -3.5278499126434326e-06, -1.953914761543274e-06, -3.7997961044311523e-07, 1.1939555406570435e-06, 2.767890691757202e-06, 4.341825842857361e-06, 5.9157609939575195e-06, 7.489696145057678e-06, 9.063631296157837e-06, 1.0637566447257996e-05, 1.2211501598358154e-05, 1.3785436749458313e-05, 1.535937190055847e-05, 1.693330705165863e-05, 1.850724220275879e-05, 2.0081177353858948e-05, 2.1655112504959106e-05, 2.3229047656059265e-05, 2.4802982807159424e-05, 2.6376917958259583e-05, 2.795085310935974e-05, 2.95247882604599e-05, 3.109872341156006e-05, 3.267265856266022e-05, 3.4246593713760376e-05, 3.5820528864860535e-05, 3.739446401596069e-05, 3.896839916706085e-05, 4.054233431816101e-05, 4.211626946926117e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 7.0, 11.0, 16.0, 34.0, 43.0, 77.0, 133.0, 286.0, 609.0, 1598.0, 5101.0, 31058.0, 976125.0, 26047.0, 4674.0, 1473.0, 642.0, 284.0, 136.0, 69.0, 42.0, 23.0, 23.0, 14.0, 11.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096923828125, -0.09363460540771484, -0.09034538269042969, -0.08705615997314453, -0.08376693725585938, -0.08047771453857422, -0.07718849182128906, -0.0738992691040039, -0.07061004638671875, -0.0673208236694336, -0.06403160095214844, -0.06074237823486328, -0.057453155517578125, -0.05416393280029297, -0.05087471008300781, -0.047585487365722656, -0.0442962646484375, -0.041007041931152344, -0.03771781921386719, -0.03442859649658203, -0.031139373779296875, -0.02785015106201172, -0.024560928344726562, -0.021271705627441406, -0.01798248291015625, -0.014693260192871094, -0.011404037475585938, -0.008114814758300781, -0.004825592041015625, -0.0015363693237304688, 0.0017528533935546875, 0.005042076110839844, 0.008331298828125, 0.011620521545410156, 0.014909744262695312, 0.01819896697998047, 0.021488189697265625, 0.02477741241455078, 0.028066635131835938, 0.031355857849121094, 0.03464508056640625, 0.037934303283691406, 0.04122352600097656, 0.04451274871826172, 0.047801971435546875, 0.05109119415283203, 0.05438041687011719, 0.057669639587402344, 0.0609588623046875, 0.06424808502197266, 0.06753730773925781, 0.07082653045654297, 0.07411575317382812, 0.07740497589111328, 0.08069419860839844, 0.0839834213256836, 0.08727264404296875, 0.0905618667602539, 0.09385108947753906, 0.09714031219482422, 0.10042953491210938, 0.10371875762939453, 0.10700798034667969, 0.11029720306396484, 0.11358642578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 10.0, 14.0, 26.0, 81.0, 277.0, 357.0, 136.0, 37.0, 19.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10443115234375, -0.10169124603271484, -0.09895133972167969, -0.09621143341064453, -0.09347152709960938, -0.09073162078857422, -0.08799171447753906, -0.0852518081665039, -0.08251190185546875, -0.0797719955444336, -0.07703208923339844, -0.07429218292236328, -0.07155227661132812, -0.06881237030029297, -0.06607246398925781, -0.06333255767822266, -0.0605926513671875, -0.057852745056152344, -0.05511283874511719, -0.05237293243408203, -0.049633026123046875, -0.04689311981201172, -0.04415321350097656, -0.041413307189941406, -0.03867340087890625, -0.035933494567871094, -0.03319358825683594, -0.03045368194580078, -0.027713775634765625, -0.02497386932373047, -0.022233963012695312, -0.019494056701660156, -0.016754150390625, -0.014014244079589844, -0.011274337768554688, -0.008534431457519531, -0.005794525146484375, -0.0030546188354492188, -0.0003147125244140625, 0.0024251937866210938, 0.00516510009765625, 0.007905006408691406, 0.010644912719726562, 0.013384819030761719, 0.016124725341796875, 0.01886463165283203, 0.021604537963867188, 0.024344444274902344, 0.0270843505859375, 0.029824256896972656, 0.03256416320800781, 0.03530406951904297, 0.038043975830078125, 0.04078388214111328, 0.04352378845214844, 0.046263694763183594, 0.04900360107421875, 0.051743507385253906, 0.05448341369628906, 0.05722332000732422, 0.059963226318359375, 0.06270313262939453, 0.06544303894042969, 0.06818294525146484, 0.0709228515625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 29.0, 75.0, 234.0, 377.0, 159.0, 64.0, 36.0, 4.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7154682874679565, -0.6739500761032104, -0.6324318051338196, -0.5909135937690735, -0.5493953227996826, -0.5078771114349365, -0.46635890007019043, -0.42484065890312195, -0.38332241773605347, -0.341804176568985, -0.3002859354019165, -0.2587677240371704, -0.21724948287010193, -0.17573124170303345, -0.13421301543712616, -0.09269478917121887, -0.05117654800415039, -0.009658314287662506, 0.03185991942882538, 0.07337815314531326, 0.11489638686180115, 0.15641462802886963, 0.19793285429477692, 0.2394510805606842, 0.2809693217277527, 0.32248756289482117, 0.36400580406188965, 0.40552401542663574, 0.4470422565937042, 0.4885604977607727, 0.5300787091255188, 0.5715969800949097, 0.6131151914596558, 0.6546334028244019, 0.6961516737937927, 0.7376698851585388, 0.7791881561279297, 0.8207063674926758, 0.8622245788574219, 0.903742790222168, 0.9452610611915588, 0.9867792725563049, 1.0282975435256958, 1.069815754890442, 1.111333966255188, 1.1528522968292236, 1.1943705081939697, 1.2358887195587158, 1.277406930923462, 1.318925142288208, 1.360443353652954, 1.4019616842269897, 1.4434798955917358, 1.484998106956482, 1.526516318321228, 1.5680345296859741, 1.6095528602600098, 1.6510710716247559, 1.692589282989502, 1.7341076135635376, 1.7756258249282837, 1.8171440362930298, 1.8586622476577759, 1.900180459022522, 1.941698670387268]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 5.0, 13.0, 14.0, 17.0, 14.0, 17.0, 22.0, 28.0, 21.0, 18.0, 42.0, 30.0, 38.0, 27.0, 39.0, 62.0, 75.0, 66.0, 46.0, 59.0, 38.0, 32.0, 28.0, 23.0, 26.0, 21.0, 20.0, 14.0, 14.0, 16.0, 19.0, 19.0, 10.0, 8.0, 10.0, 5.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22172784805297852, -0.21322104334831238, -0.20471423864364624, -0.1962074339389801, -0.18770062923431396, -0.17919382452964783, -0.1706870198249817, -0.16218021512031555, -0.15367341041564941, -0.14516660571098328, -0.13665980100631714, -0.128152996301651, -0.11964619159698486, -0.11113938689231873, -0.10263258963823318, -0.09412578493356705, -0.0856189876794815, -0.07711218297481537, -0.06860537827014923, -0.06009857729077339, -0.051591772586107254, -0.043084967881441116, -0.03457816690206528, -0.02607136219739914, -0.017564557492733, -0.009057753719389439, -0.0005509499460458755, 0.007955852895975113, 0.01646265760064125, 0.02496946230530739, 0.03347626328468323, 0.041983067989349365, 0.0504898726940155, 0.05899667739868164, 0.06750348210334778, 0.07601028680801392, 0.08451709151268005, 0.09302389621734619, 0.10153069347143173, 0.11003749817609787, 0.11854430288076401, 0.12705110013484955, 0.13555790483951569, 0.14406470954418182, 0.15257151424884796, 0.1610783189535141, 0.16958512365818024, 0.17809192836284637, 0.1865987330675125, 0.19510553777217865, 0.2036123424768448, 0.21211914718151093, 0.22062595188617706, 0.2291327565908432, 0.23763954639434814, 0.24614635109901428, 0.2546531558036804, 0.26315996050834656, 0.2716667652130127, 0.28017356991767883, 0.28868037462234497, 0.2971871793270111, 0.30569398403167725, 0.3142007887363434, 0.3227075934410095]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 12.0, 15.0, 15.0, 29.0, 30.0, 33.0, 61.0, 76.0, 158.0, 300.0, 585.0, 2074.0, 11646.0, 195826.0, 3858760.0, 113232.0, 8500.0, 1570.0, 597.0, 255.0, 161.0, 103.0, 55.0, 42.0, 39.0, 18.0, 12.0, 19.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06439208984375, -0.06240653991699219, -0.060420989990234375, -0.05843544006347656, -0.05644989013671875, -0.05446434020996094, -0.052478790283203125, -0.05049324035644531, -0.0485076904296875, -0.04652214050292969, -0.044536590576171875, -0.04255104064941406, -0.04056549072265625, -0.03857994079589844, -0.036594390869140625, -0.03460884094238281, -0.032623291015625, -0.030637741088867188, -0.028652191162109375, -0.026666641235351562, -0.02468109130859375, -0.022695541381835938, -0.020709991455078125, -0.018724441528320312, -0.0167388916015625, -0.014753341674804688, -0.012767791748046875, -0.010782241821289062, -0.00879669189453125, -0.0068111419677734375, -0.004825592041015625, -0.0028400421142578125, -0.0008544921875, 0.0011310577392578125, 0.003116607666015625, 0.0051021575927734375, 0.00708770751953125, 0.009073257446289062, 0.011058807373046875, 0.013044357299804688, 0.0150299072265625, 0.017015457153320312, 0.019001007080078125, 0.020986557006835938, 0.02297210693359375, 0.024957656860351562, 0.026943206787109375, 0.028928756713867188, 0.030914306640625, 0.03289985656738281, 0.034885406494140625, 0.03687095642089844, 0.03885650634765625, 0.04084205627441406, 0.042827606201171875, 0.04481315612792969, 0.0467987060546875, 0.04878425598144531, 0.050769805908203125, 0.05275535583496094, 0.05474090576171875, 0.05672645568847656, 0.058712005615234375, 0.06069755554199219, 0.06268310546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 8.0, 12.0, 15.0, 15.0, 34.0, 27.0, 30.0, 31.0, 42.0, 38.0, 50.0, 57.0, 72.0, 54.0, 65.0, 53.0, 47.0, 66.0, 49.0, 43.0, 33.0, 28.0, 28.0, 11.0, 18.0, 11.0, 15.0, 7.0, 10.0, 6.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018096923828125, -0.017548799514770508, -0.017000675201416016, -0.016452550888061523, -0.01590442657470703, -0.015356302261352539, -0.014808177947998047, -0.014260053634643555, -0.013711929321289062, -0.01316380500793457, -0.012615680694580078, -0.012067556381225586, -0.011519432067871094, -0.010971307754516602, -0.01042318344116211, -0.009875059127807617, -0.009326934814453125, -0.008778810501098633, -0.00823068618774414, -0.0076825618743896484, -0.007134437561035156, -0.006586313247680664, -0.006038188934326172, -0.00549006462097168, -0.0049419403076171875, -0.004393815994262695, -0.003845691680908203, -0.003297567367553711, -0.0027494430541992188, -0.0022013187408447266, -0.0016531944274902344, -0.0011050701141357422, -0.00055694580078125, -8.821487426757812e-06, 0.0005393028259277344, 0.0010874271392822266, 0.0016355514526367188, 0.002183675765991211, 0.002731800079345703, 0.0032799243927001953, 0.0038280487060546875, 0.00437617301940918, 0.004924297332763672, 0.005472421646118164, 0.006020545959472656, 0.0065686702728271484, 0.007116794586181641, 0.007664918899536133, 0.008213043212890625, 0.008761167526245117, 0.00930929183959961, 0.009857416152954102, 0.010405540466308594, 0.010953664779663086, 0.011501789093017578, 0.01204991340637207, 0.012598037719726562, 0.013146162033081055, 0.013694286346435547, 0.014242410659790039, 0.014790534973144531, 0.015338659286499023, 0.015886783599853516, 0.016434907913208008, 0.0169830322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 3.0, 18.0, 22.0, 23.0, 34.0, 59.0, 69.0, 94.0, 188.0, 352.0, 1307.0, 79285.0, 4106489.0, 5081.0, 461.0, 225.0, 155.0, 100.0, 76.0, 60.0, 44.0, 45.0, 22.0, 14.0, 19.0, 14.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212890625, -0.205352783203125, -0.19781494140625, -0.190277099609375, -0.1827392578125, -0.175201416015625, -0.16766357421875, -0.160125732421875, -0.152587890625, -0.145050048828125, -0.13751220703125, -0.129974365234375, -0.1224365234375, -0.114898681640625, -0.10736083984375, -0.099822998046875, -0.09228515625, -0.084747314453125, -0.07720947265625, -0.069671630859375, -0.0621337890625, -0.054595947265625, -0.04705810546875, -0.039520263671875, -0.031982421875, -0.024444580078125, -0.01690673828125, -0.009368896484375, -0.0018310546875, 0.005706787109375, 0.01324462890625, 0.020782470703125, 0.0283203125, 0.035858154296875, 0.04339599609375, 0.050933837890625, 0.0584716796875, 0.066009521484375, 0.07354736328125, 0.081085205078125, 0.088623046875, 0.096160888671875, 0.10369873046875, 0.111236572265625, 0.1187744140625, 0.126312255859375, 0.13385009765625, 0.141387939453125, 0.14892578125, 0.156463623046875, 0.16400146484375, 0.171539306640625, 0.1790771484375, 0.186614990234375, 0.19415283203125, 0.201690673828125, 0.209228515625, 0.216766357421875, 0.22430419921875, 0.231842041015625, 0.2393798828125, 0.246917724609375, 0.25445556640625, 0.261993408203125, 0.26953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 18.0, 38.0, 98.0, 300.0, 2105.0, 1159.0, 215.0, 81.0, 36.0, 8.0, 14.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076904296875, -0.0725860595703125, -0.068267822265625, -0.0639495849609375, -0.05963134765625, -0.0553131103515625, -0.050994873046875, -0.0466766357421875, -0.0423583984375, -0.0380401611328125, -0.033721923828125, -0.0294036865234375, -0.02508544921875, -0.0207672119140625, -0.016448974609375, -0.0121307373046875, -0.0078125, -0.0034942626953125, 0.000823974609375, 0.0051422119140625, 0.00946044921875, 0.0137786865234375, 0.018096923828125, 0.0224151611328125, 0.0267333984375, 0.0310516357421875, 0.035369873046875, 0.0396881103515625, 0.04400634765625, 0.0483245849609375, 0.052642822265625, 0.0569610595703125, 0.061279296875, 0.0655975341796875, 0.069915771484375, 0.0742340087890625, 0.07855224609375, 0.0828704833984375, 0.087188720703125, 0.0915069580078125, 0.0958251953125, 0.1001434326171875, 0.104461669921875, 0.1087799072265625, 0.11309814453125, 0.1174163818359375, 0.121734619140625, 0.1260528564453125, 0.13037109375, 0.1346893310546875, 0.139007568359375, 0.1433258056640625, 0.14764404296875, 0.1519622802734375, 0.156280517578125, 0.1605987548828125, 0.1649169921875, 0.1692352294921875, 0.173553466796875, 0.1778717041015625, 0.18218994140625, 0.1865081787109375, 0.190826416015625, 0.1951446533203125, 0.199462890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 7.0, 10.0, 12.0, 16.0, 49.0, 106.0, 188.0, 288.0, 163.0, 69.0, 40.0, 19.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7050898671150208, -0.6719392538070679, -0.638788640499115, -0.6056380271911621, -0.5724873542785645, -0.5393368005752563, -0.5061861276626587, -0.4730355143547058, -0.43988490104675293, -0.40673428773880005, -0.37358367443084717, -0.3404330313205719, -0.307282418012619, -0.27413180470466614, -0.24098117649555206, -0.207830548286438, -0.1746799349784851, -0.14152932167053223, -0.10837869346141815, -0.07522807270288467, -0.042077451944351196, -0.008926838636398315, 0.02422378957271576, 0.057374417781829834, 0.09052503108978271, 0.12367565184831619, 0.15682627260684967, 0.18997690081596375, 0.22312751412391663, 0.2562781274318695, 0.2894287705421448, 0.32257938385009766, 0.3557300567626953, 0.3888806700706482, 0.4220312833786011, 0.45518192648887634, 0.4883325397968292, 0.5214831829071045, 0.5546337962150574, 0.5877844095230103, 0.6209350228309631, 0.654085636138916, 0.6872362494468689, 0.7203868627548218, 0.7535375356674194, 0.7866880893707275, 0.8198387622833252, 0.8529893755912781, 0.886139988899231, 0.9192906022071838, 0.9524412155151367, 0.9855918288230896, 1.0187424421310425, 1.0518931150436401, 1.0850436687469482, 1.118194341659546, 1.1513450145721436, 1.1844956874847412, 1.2176462411880493, 1.250796914100647, 1.283947467803955, 1.3170981407165527, 1.3502486944198608, 1.3833993673324585, 1.4165499210357666]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 2.0, 6.0, 14.0, 19.0, 11.0, 16.0, 28.0, 28.0, 31.0, 36.0, 36.0, 42.0, 48.0, 77.0, 46.0, 56.0, 54.0, 51.0, 46.0, 60.0, 53.0, 33.0, 33.0, 32.0, 33.0, 28.0, 20.0, 19.0, 3.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.34015971422195435, -0.3299034535884857, -0.3196471929550171, -0.30939093232154846, -0.29913467168807983, -0.2888784110546112, -0.2786221504211426, -0.26836588978767395, -0.2581096291542053, -0.2478533685207367, -0.23759710788726807, -0.22734084725379944, -0.2170845866203308, -0.20682832598686218, -0.19657206535339355, -0.18631580471992493, -0.1760595440864563, -0.16580328345298767, -0.15554702281951904, -0.14529076218605042, -0.1350345015525818, -0.12477824091911316, -0.11452198028564453, -0.1042657196521759, -0.09400945901870728, -0.08375319838523865, -0.07349693775177002, -0.06324067711830139, -0.052984416484832764, -0.042728155851364136, -0.03247189521789551, -0.02221563458442688, -0.011959373950958252, -0.001703113317489624, 0.008553147315979004, 0.018809407949447632, 0.02906566858291626, 0.03932192921638489, 0.049578189849853516, 0.059834450483322144, 0.07009071111679077, 0.0803469717502594, 0.09060323238372803, 0.10085949301719666, 0.11111575365066528, 0.12137201428413391, 0.13162827491760254, 0.14188453555107117, 0.1521407961845398, 0.16239705681800842, 0.17265331745147705, 0.18290957808494568, 0.1931658387184143, 0.20342209935188293, 0.21367835998535156, 0.2239346206188202, 0.23419088125228882, 0.24444714188575745, 0.2547034025192261, 0.2649596631526947, 0.27521592378616333, 0.28547218441963196, 0.2957284450531006, 0.3059847056865692, 0.31624096632003784]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 7.0, 9.0, 13.0, 10.0, 17.0, 23.0, 38.0, 53.0, 69.0, 96.0, 168.0, 303.0, 435.0, 773.0, 1488.0, 2583.0, 5126.0, 11004.0, 25096.0, 67444.0, 199555.0, 406474.0, 208224.0, 70522.0, 26361.0, 11317.0, 5173.0, 2667.0, 1362.0, 808.0, 496.0, 296.0, 178.0, 125.0, 65.0, 54.0, 27.0, 24.0, 20.0, 14.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.039093017578125, -0.03785276412963867, -0.036612510681152344, -0.035372257232666016, -0.03413200378417969, -0.03289175033569336, -0.03165149688720703, -0.030411243438720703, -0.029170989990234375, -0.027930736541748047, -0.02669048309326172, -0.02545022964477539, -0.024209976196289062, -0.022969722747802734, -0.021729469299316406, -0.020489215850830078, -0.01924896240234375, -0.018008708953857422, -0.016768455505371094, -0.015528202056884766, -0.014287948608398438, -0.01304769515991211, -0.011807441711425781, -0.010567188262939453, -0.009326934814453125, -0.008086681365966797, -0.006846427917480469, -0.005606174468994141, -0.0043659210205078125, -0.0031256675720214844, -0.0018854141235351562, -0.0006451606750488281, 0.0005950927734375, 0.0018353462219238281, 0.0030755996704101562, 0.004315853118896484, 0.0055561065673828125, 0.006796360015869141, 0.008036613464355469, 0.009276866912841797, 0.010517120361328125, 0.011757373809814453, 0.012997627258300781, 0.01423788070678711, 0.015478134155273438, 0.016718387603759766, 0.017958641052246094, 0.019198894500732422, 0.02043914794921875, 0.021679401397705078, 0.022919654846191406, 0.024159908294677734, 0.025400161743164062, 0.02664041519165039, 0.02788066864013672, 0.029120922088623047, 0.030361175537109375, 0.0316014289855957, 0.03284168243408203, 0.03408193588256836, 0.03532218933105469, 0.036562442779541016, 0.037802696228027344, 0.03904294967651367, 0.040283203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 9.0, 7.0, 7.0, 10.0, 15.0, 19.0, 15.0, 27.0, 17.0, 24.0, 26.0, 42.0, 42.0, 47.0, 53.0, 46.0, 47.0, 58.0, 50.0, 47.0, 44.0, 58.0, 47.0, 35.0, 38.0, 34.0, 23.0, 17.0, 14.0, 15.0, 11.0, 7.0, 6.0, 7.0, 6.0, 4.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.02191162109375, -0.021276235580444336, -0.020640850067138672, -0.020005464553833008, -0.019370079040527344, -0.01873469352722168, -0.018099308013916016, -0.01746392250061035, -0.016828536987304688, -0.016193151473999023, -0.01555776596069336, -0.014922380447387695, -0.014286994934082031, -0.013651609420776367, -0.013016223907470703, -0.012380838394165039, -0.011745452880859375, -0.011110067367553711, -0.010474681854248047, -0.009839296340942383, -0.009203910827636719, -0.008568525314331055, -0.00793313980102539, -0.0072977542877197266, -0.0066623687744140625, -0.0060269832611083984, -0.005391597747802734, -0.00475621223449707, -0.004120826721191406, -0.003485441207885742, -0.002850055694580078, -0.002214670181274414, -0.00157928466796875, -0.0009438991546630859, -0.0003085136413574219, 0.0003268718719482422, 0.0009622573852539062, 0.0015976428985595703, 0.0022330284118652344, 0.0028684139251708984, 0.0035037994384765625, 0.0041391849517822266, 0.004774570465087891, 0.005409955978393555, 0.006045341491699219, 0.006680727005004883, 0.007316112518310547, 0.007951498031616211, 0.008586883544921875, 0.009222269058227539, 0.009857654571533203, 0.010493040084838867, 0.011128425598144531, 0.011763811111450195, 0.01239919662475586, 0.013034582138061523, 0.013669967651367188, 0.014305353164672852, 0.014940738677978516, 0.01557612419128418, 0.016211509704589844, 0.016846895217895508, 0.017482280731201172, 0.018117666244506836, 0.0187530517578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 8.0, 10.0, 7.0, 15.0, 24.0, 32.0, 62.0, 108.0, 110.0, 156.0, 303.0, 444.0, 915.0, 1777.0, 4803.0, 18422.0, 207047.0, 759642.0, 41326.0, 7885.0, 2630.0, 1220.0, 629.0, 340.0, 220.0, 108.0, 78.0, 59.0, 45.0, 37.0, 23.0, 20.0, 7.0, 7.0, 8.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12347602844238281, -0.11938858032226562, -0.11530113220214844, -0.11121368408203125, -0.10712623596191406, -0.10303878784179688, -0.09895133972167969, -0.0948638916015625, -0.09077644348144531, -0.08668899536132812, -0.08260154724121094, -0.07851409912109375, -0.07442665100097656, -0.07033920288085938, -0.06625175476074219, -0.062164306640625, -0.05807685852050781, -0.053989410400390625, -0.04990196228027344, -0.04581451416015625, -0.04172706604003906, -0.037639617919921875, -0.03355216979980469, -0.0294647216796875, -0.025377273559570312, -0.021289825439453125, -0.017202377319335938, -0.01311492919921875, -0.009027481079101562, -0.004940032958984375, -0.0008525848388671875, 0.00323486328125, 0.0073223114013671875, 0.011409759521484375, 0.015497207641601562, 0.01958465576171875, 0.023672103881835938, 0.027759552001953125, 0.03184700012207031, 0.0359344482421875, 0.04002189636230469, 0.044109344482421875, 0.04819679260253906, 0.05228424072265625, 0.05637168884277344, 0.060459136962890625, 0.06454658508300781, 0.068634033203125, 0.07272148132324219, 0.07680892944335938, 0.08089637756347656, 0.08498382568359375, 0.08907127380371094, 0.09315872192382812, 0.09724617004394531, 0.1013336181640625, 0.10542106628417969, 0.10950851440429688, 0.11359596252441406, 0.11768341064453125, 0.12177085876464844, 0.12585830688476562, 0.1299457550048828, 0.134033203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 4.0, 4.0, 7.0, 14.0, 5.0, 19.0, 20.0, 18.0, 33.0, 31.0, 30.0, 34.0, 37.0, 42.0, 50.0, 46.0, 58.0, 64.0, 55.0, 43.0, 59.0, 42.0, 42.0, 36.0, 32.0, 43.0, 28.0, 25.0, 21.0, 14.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08096694946289062, -0.07758331298828125, -0.07419967651367188, -0.0708160400390625, -0.06743240356445312, -0.06404876708984375, -0.060665130615234375, -0.057281494140625, -0.053897857666015625, -0.05051422119140625, -0.047130584716796875, -0.0437469482421875, -0.040363311767578125, -0.03697967529296875, -0.033596038818359375, -0.03021240234375, -0.026828765869140625, -0.02344512939453125, -0.020061492919921875, -0.0166778564453125, -0.013294219970703125, -0.00991058349609375, -0.006526947021484375, -0.003143310546875, 0.000240325927734375, 0.00362396240234375, 0.007007598876953125, 0.0103912353515625, 0.013774871826171875, 0.01715850830078125, 0.020542144775390625, 0.02392578125, 0.027309417724609375, 0.03069305419921875, 0.034076690673828125, 0.0374603271484375, 0.040843963623046875, 0.04422760009765625, 0.047611236572265625, 0.050994873046875, 0.054378509521484375, 0.05776214599609375, 0.061145782470703125, 0.0645294189453125, 0.06791305541992188, 0.07129669189453125, 0.07468032836914062, 0.07806396484375, 0.08144760131835938, 0.08483123779296875, 0.08821487426757812, 0.0915985107421875, 0.09498214721679688, 0.09836578369140625, 0.10174942016601562, 0.105133056640625, 0.10851669311523438, 0.11190032958984375, 0.11528396606445312, 0.1186676025390625, 0.12205123901367188, 0.12543487548828125, 0.12881851196289062, 0.1322021484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 19.0, 30.0, 43.0, 80.0, 143.0, 157.0, 352.0, 628.0, 1370.0, 2918.0, 7228.0, 22541.0, 193075.0, 766722.0, 35757.0, 10187.0, 3850.0, 1643.0, 811.0, 409.0, 246.0, 147.0, 72.0, 49.0, 19.0, 11.0, 14.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07342529296875, -0.07106876373291016, -0.06871223449707031, -0.06635570526123047, -0.06399917602539062, -0.06164264678955078, -0.05928611755371094, -0.056929588317871094, -0.05457305908203125, -0.052216529846191406, -0.04986000061035156, -0.04750347137451172, -0.045146942138671875, -0.04279041290283203, -0.04043388366699219, -0.038077354431152344, -0.0357208251953125, -0.033364295959472656, -0.031007766723632812, -0.02865123748779297, -0.026294708251953125, -0.02393817901611328, -0.021581649780273438, -0.019225120544433594, -0.01686859130859375, -0.014512062072753906, -0.012155532836914062, -0.009799003601074219, -0.007442474365234375, -0.005085945129394531, -0.0027294158935546875, -0.00037288665771484375, 0.001983642578125, 0.004340171813964844, 0.0066967010498046875, 0.009053230285644531, 0.011409759521484375, 0.013766288757324219, 0.016122817993164062, 0.018479347229003906, 0.02083587646484375, 0.023192405700683594, 0.025548934936523438, 0.02790546417236328, 0.030261993408203125, 0.03261852264404297, 0.03497505187988281, 0.037331581115722656, 0.0396881103515625, 0.042044639587402344, 0.04440116882324219, 0.04675769805908203, 0.049114227294921875, 0.05147075653076172, 0.05382728576660156, 0.056183815002441406, 0.05854034423828125, 0.060896873474121094, 0.06325340270996094, 0.06560993194580078, 0.06796646118164062, 0.07032299041748047, 0.07267951965332031, 0.07503604888916016, 0.077392578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 7.0, 4.0, 6.0, 7.0, 9.0, 10.0, 4.0, 12.0, 21.0, 27.0, 36.0, 32.0, 37.0, 45.0, 69.0, 65.0, 95.0, 104.0, 92.0, 49.0, 56.0, 37.0, 25.0, 26.0, 21.0, 20.0, 18.0, 11.0, 7.0, 8.0, 5.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.063678741455078e-05, -2.963189035654068e-05, -2.862699329853058e-05, -2.7622096240520477e-05, -2.6617199182510376e-05, -2.5612302124500275e-05, -2.4607405066490173e-05, -2.3602508008480072e-05, -2.259761095046997e-05, -2.159271389245987e-05, -2.0587816834449768e-05, -1.9582919776439667e-05, -1.8578022718429565e-05, -1.7573125660419464e-05, -1.6568228602409363e-05, -1.556333154439926e-05, -1.455843448638916e-05, -1.3553537428379059e-05, -1.2548640370368958e-05, -1.1543743312358856e-05, -1.0538846254348755e-05, -9.533949196338654e-06, -8.529052138328552e-06, -7.524155080318451e-06, -6.51925802230835e-06, -5.514360964298248e-06, -4.509463906288147e-06, -3.5045668482780457e-06, -2.4996697902679443e-06, -1.494772732257843e-06, -4.898756742477417e-07, 5.150213837623596e-07, 1.519918441772461e-06, 2.5248154997825623e-06, 3.5297125577926636e-06, 4.534609615802765e-06, 5.539506673812866e-06, 6.5444037318229675e-06, 7.549300789833069e-06, 8.55419784784317e-06, 9.559094905853271e-06, 1.0563991963863373e-05, 1.1568889021873474e-05, 1.2573786079883575e-05, 1.3578683137893677e-05, 1.4583580195903778e-05, 1.558847725391388e-05, 1.659337431192398e-05, 1.7598271369934082e-05, 1.8603168427944183e-05, 1.9608065485954285e-05, 2.0612962543964386e-05, 2.1617859601974487e-05, 2.262275665998459e-05, 2.362765371799469e-05, 2.463255077600479e-05, 2.5637447834014893e-05, 2.6642344892024994e-05, 2.7647241950035095e-05, 2.8652139008045197e-05, 2.9657036066055298e-05, 3.06619331240654e-05, 3.16668301820755e-05, 3.26717272400856e-05, 3.36766242980957e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 9.0, 12.0, 16.0, 22.0, 29.0, 41.0, 58.0, 86.0, 143.0, 210.0, 382.0, 606.0, 1264.0, 2558.0, 6161.0, 18053.0, 105455.0, 822949.0, 66492.0, 14232.0, 5092.0, 2188.0, 1039.0, 549.0, 321.0, 202.0, 104.0, 83.0, 49.0, 36.0, 27.0, 20.0, 19.0, 12.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.072265625, -0.07022428512573242, -0.06818294525146484, -0.06614160537719727, -0.06410026550292969, -0.06205892562866211, -0.06001758575439453, -0.05797624588012695, -0.055934906005859375, -0.0538935661315918, -0.05185222625732422, -0.04981088638305664, -0.04776954650878906, -0.045728206634521484, -0.043686866760253906, -0.04164552688598633, -0.03960418701171875, -0.03756284713745117, -0.035521507263183594, -0.033480167388916016, -0.03143882751464844, -0.02939748764038086, -0.02735614776611328, -0.025314807891845703, -0.023273468017578125, -0.021232128143310547, -0.01919078826904297, -0.01714944839477539, -0.015108108520507812, -0.013066768646240234, -0.011025428771972656, -0.008984088897705078, -0.0069427490234375, -0.004901409149169922, -0.0028600692749023438, -0.0008187294006347656, 0.0012226104736328125, 0.0032639503479003906, 0.005305290222167969, 0.007346630096435547, 0.009387969970703125, 0.011429309844970703, 0.013470649719238281, 0.01551198959350586, 0.017553329467773438, 0.019594669342041016, 0.021636009216308594, 0.023677349090576172, 0.02571868896484375, 0.027760028839111328, 0.029801368713378906, 0.031842708587646484, 0.03388404846191406, 0.03592538833618164, 0.03796672821044922, 0.0400080680847168, 0.042049407958984375, 0.04409074783325195, 0.04613208770751953, 0.04817342758178711, 0.05021476745605469, 0.052256107330322266, 0.054297447204589844, 0.05633878707885742, 0.058380126953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 3.0, 5.0, 8.0, 6.0, 11.0, 9.0, 11.0, 19.0, 21.0, 45.0, 59.0, 86.0, 113.0, 144.0, 132.0, 94.0, 54.0, 47.0, 27.0, 17.0, 15.0, 13.0, 10.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.057373046875, -0.05580854415893555, -0.054244041442871094, -0.05267953872680664, -0.05111503601074219, -0.049550533294677734, -0.04798603057861328, -0.04642152786254883, -0.044857025146484375, -0.04329252243041992, -0.04172801971435547, -0.040163516998291016, -0.03859901428222656, -0.03703451156616211, -0.035470008850097656, -0.0339055061340332, -0.03234100341796875, -0.030776500701904297, -0.029211997985839844, -0.02764749526977539, -0.026082992553710938, -0.024518489837646484, -0.02295398712158203, -0.021389484405517578, -0.019824981689453125, -0.018260478973388672, -0.01669597625732422, -0.015131473541259766, -0.013566970825195312, -0.01200246810913086, -0.010437965393066406, -0.008873462677001953, -0.0073089599609375, -0.005744457244873047, -0.004179954528808594, -0.0026154518127441406, -0.0010509490966796875, 0.0005135536193847656, 0.0020780563354492188, 0.003642559051513672, 0.005207061767578125, 0.006771564483642578, 0.008336067199707031, 0.009900569915771484, 0.011465072631835938, 0.01302957534790039, 0.014594078063964844, 0.016158580780029297, 0.01772308349609375, 0.019287586212158203, 0.020852088928222656, 0.02241659164428711, 0.023981094360351562, 0.025545597076416016, 0.02711009979248047, 0.028674602508544922, 0.030239105224609375, 0.03180360794067383, 0.03336811065673828, 0.034932613372802734, 0.03649711608886719, 0.03806161880493164, 0.039626121520996094, 0.04119062423706055, 0.042755126953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 3.0, 2.0, 6.0, 19.0, 24.0, 62.0, 95.0, 189.0, 238.0, 133.0, 82.0, 46.0, 33.0, 22.0, 14.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0570756196975708, -1.025195837020874, -0.9933161735534668, -0.9614364504814148, -0.9295567274093628, -0.8976770043373108, -0.8657972812652588, -0.833917498588562, -0.8020378351211548, -0.7701581120491028, -0.7382783889770508, -0.7063986659049988, -0.6745189428329468, -0.6426392197608948, -0.6107594966888428, -0.578879714012146, -0.546999990940094, -0.515120267868042, -0.48324054479599, -0.451360821723938, -0.419481098651886, -0.387601375579834, -0.3557216227054596, -0.3238418996334076, -0.2919621765613556, -0.2600824534893036, -0.2282027304172516, -0.1963229924440384, -0.1644432693719864, -0.1325635462999344, -0.10068380832672119, -0.06880408525466919, -0.03692430257797241, -0.005044575780630112, 0.02683515101671219, 0.05871488153934479, 0.09059460461139679, 0.12247432768344879, 0.154354065656662, 0.186233788728714, 0.218113511800766, 0.249993234872818, 0.28187295794487, 0.3137527108192444, 0.3456324338912964, 0.3775121569633484, 0.4093918800354004, 0.4412716031074524, 0.4731513261795044, 0.5050310492515564, 0.5369107723236084, 0.5687904953956604, 0.6006702184677124, 0.6325499415397644, 0.6644296646118164, 0.6963094472885132, 0.7281891107559204, 0.7600688338279724, 0.7919485569000244, 0.8238282799720764, 0.8557080030441284, 0.8875877261161804, 0.9194674491882324, 0.9513472318649292, 0.9832269549369812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 4.0, 4.0, 7.0, 13.0, 18.0, 15.0, 13.0, 21.0, 29.0, 26.0, 36.0, 21.0, 42.0, 35.0, 40.0, 52.0, 89.0, 84.0, 76.0, 43.0, 45.0, 42.0, 19.0, 26.0, 29.0, 23.0, 26.0, 24.0, 15.0, 14.0, 11.0, 12.0, 9.0, 8.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.529944658279419, -0.5129480361938477, -0.495951384305954, -0.4789547324180603, -0.4619580805301666, -0.44496142864227295, -0.42796480655670166, -0.410968154668808, -0.3939715027809143, -0.37697485089302063, -0.35997822880744934, -0.34298157691955566, -0.325984925031662, -0.3089882731437683, -0.291991651058197, -0.27499499917030334, -0.25799837708473206, -0.24100174009799957, -0.2240050882101059, -0.2070084512233734, -0.19001179933547974, -0.17301516234874725, -0.15601852536201477, -0.1390218734741211, -0.12202523648738861, -0.10502859205007553, -0.08803194761276245, -0.07103531062602997, -0.05403866618871689, -0.03704202175140381, -0.020045384764671326, -0.003048740327358246, 0.013947904109954834, 0.030944546684622765, 0.047941189259290695, 0.06493782997131348, 0.08193447440862656, 0.09893111884593964, 0.11592775583267212, 0.1329244077205658, 0.14992104470729828, 0.16691768169403076, 0.18391433358192444, 0.20091097056865692, 0.2179076075553894, 0.23490425944328308, 0.25190091133117676, 0.26889753341674805, 0.2858941853046417, 0.3028908371925354, 0.3198874592781067, 0.33688411116600037, 0.35388076305389404, 0.37087738513946533, 0.387874037027359, 0.4048706889152527, 0.421867311000824, 0.43886396288871765, 0.45586058497428894, 0.4728572368621826, 0.4898538887500763, 0.50685054063797, 0.5238471627235413, 0.5408437848091125, 0.5578404664993286]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 15.0, 20.0, 24.0, 35.0, 65.0, 89.0, 146.0, 228.0, 324.0, 595.0, 1092.0, 2219.0, 5478.0, 17832.0, 125618.0, 3035971.0, 935339.0, 51075.0, 10743.0, 3697.0, 1627.0, 821.0, 448.0, 243.0, 171.0, 97.0, 66.0, 45.0, 37.0, 29.0, 22.0, 9.0, 13.0, 7.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.056060791015625, -0.05417966842651367, -0.052298545837402344, -0.050417423248291016, -0.04853630065917969, -0.04665517807006836, -0.04477405548095703, -0.0428929328918457, -0.041011810302734375, -0.03913068771362305, -0.03724956512451172, -0.03536844253540039, -0.03348731994628906, -0.031606197357177734, -0.029725074768066406, -0.027843952178955078, -0.02596282958984375, -0.024081707000732422, -0.022200584411621094, -0.020319461822509766, -0.018438339233398438, -0.01655721664428711, -0.014676094055175781, -0.012794971466064453, -0.010913848876953125, -0.009032726287841797, -0.007151603698730469, -0.005270481109619141, -0.0033893585205078125, -0.0015082359313964844, 0.00037288665771484375, 0.002254009246826172, 0.0041351318359375, 0.006016254425048828, 0.007897377014160156, 0.009778499603271484, 0.011659622192382812, 0.01354074478149414, 0.015421867370605469, 0.017302989959716797, 0.019184112548828125, 0.021065235137939453, 0.02294635772705078, 0.02482748031616211, 0.026708602905273438, 0.028589725494384766, 0.030470848083496094, 0.03235197067260742, 0.03423309326171875, 0.03611421585083008, 0.037995338439941406, 0.039876461029052734, 0.04175758361816406, 0.04363870620727539, 0.04551982879638672, 0.04740095138549805, 0.049282073974609375, 0.0511631965637207, 0.05304431915283203, 0.05492544174194336, 0.05680656433105469, 0.058687686920166016, 0.060568809509277344, 0.06244993209838867, 0.0643310546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 10.0, 7.0, 5.0, 11.0, 8.0, 8.0, 15.0, 20.0, 21.0, 15.0, 29.0, 30.0, 47.0, 48.0, 53.0, 53.0, 42.0, 65.0, 59.0, 65.0, 56.0, 50.0, 48.0, 41.0, 32.0, 27.0, 30.0, 21.0, 14.0, 17.0, 14.0, 4.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0257720947265625, -0.02491140365600586, -0.02405071258544922, -0.023190021514892578, -0.022329330444335938, -0.021468639373779297, -0.020607948303222656, -0.019747257232666016, -0.018886566162109375, -0.018025875091552734, -0.017165184020996094, -0.016304492950439453, -0.015443801879882812, -0.014583110809326172, -0.013722419738769531, -0.01286172866821289, -0.01200103759765625, -0.01114034652709961, -0.010279655456542969, -0.009418964385986328, -0.008558273315429688, -0.007697582244873047, -0.006836891174316406, -0.005976200103759766, -0.005115509033203125, -0.004254817962646484, -0.0033941268920898438, -0.002533435821533203, -0.0016727447509765625, -0.0008120536804199219, 4.863739013671875e-05, 0.0009093284606933594, 0.00177001953125, 0.0026307106018066406, 0.0034914016723632812, 0.004352092742919922, 0.0052127838134765625, 0.006073474884033203, 0.006934165954589844, 0.007794857025146484, 0.008655548095703125, 0.009516239166259766, 0.010376930236816406, 0.011237621307373047, 0.012098312377929688, 0.012959003448486328, 0.013819694519042969, 0.01468038558959961, 0.01554107666015625, 0.01640176773071289, 0.01726245880126953, 0.018123149871826172, 0.018983840942382812, 0.019844532012939453, 0.020705223083496094, 0.021565914154052734, 0.022426605224609375, 0.023287296295166016, 0.024147987365722656, 0.025008678436279297, 0.025869369506835938, 0.026730060577392578, 0.02759075164794922, 0.02845144271850586, 0.0293121337890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 16.0, 14.0, 24.0, 35.0, 61.0, 75.0, 103.0, 173.0, 412.0, 1811.0, 3844371.0, 344936.0, 1274.0, 403.0, 146.0, 131.0, 80.0, 64.0, 51.0, 25.0, 25.0, 13.0, 18.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4453125, -0.42992401123046875, -0.4145355224609375, -0.39914703369140625, -0.383758544921875, -0.36837005615234375, -0.3529815673828125, -0.33759307861328125, -0.32220458984375, -0.30681610107421875, -0.2914276123046875, -0.27603912353515625, -0.260650634765625, -0.24526214599609375, -0.2298736572265625, -0.21448516845703125, -0.1990966796875, -0.18370819091796875, -0.1683197021484375, -0.15293121337890625, -0.137542724609375, -0.12215423583984375, -0.1067657470703125, -0.09137725830078125, -0.07598876953125, -0.06060028076171875, -0.0452117919921875, -0.02982330322265625, -0.014434814453125, 0.00095367431640625, 0.0163421630859375, 0.03173065185546875, 0.047119140625, 0.06250762939453125, 0.0778961181640625, 0.09328460693359375, 0.108673095703125, 0.12406158447265625, 0.1394500732421875, 0.15483856201171875, 0.17022705078125, 0.18561553955078125, 0.2010040283203125, 0.21639251708984375, 0.231781005859375, 0.24716949462890625, 0.2625579833984375, 0.27794647216796875, 0.2933349609375, 0.30872344970703125, 0.3241119384765625, 0.33950042724609375, 0.354888916015625, 0.37027740478515625, 0.3856658935546875, 0.40105438232421875, 0.41644287109375, 0.43183135986328125, 0.4472198486328125, 0.46260833740234375, 0.477996826171875, 0.49338531494140625, 0.5087738037109375, 0.5241622924804688, 0.53955078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 16.0, 23.0, 39.0, 107.0, 405.0, 2056.0, 1095.0, 189.0, 83.0, 28.0, 14.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.08781242370605469, -0.08224105834960938, -0.07666969299316406, -0.07109832763671875, -0.06552696228027344, -0.059955596923828125, -0.05438423156738281, -0.0488128662109375, -0.04324150085449219, -0.037670135498046875, -0.03209877014160156, -0.02652740478515625, -0.020956039428710938, -0.015384674072265625, -0.009813308715820312, -0.004241943359375, 0.0013294219970703125, 0.006900787353515625, 0.012472152709960938, 0.01804351806640625, 0.023614883422851562, 0.029186248779296875, 0.03475761413574219, 0.0403289794921875, 0.04590034484863281, 0.051471710205078125, 0.05704307556152344, 0.06261444091796875, 0.06818580627441406, 0.07375717163085938, 0.07932853698730469, 0.08489990234375, 0.09047126770019531, 0.09604263305664062, 0.10161399841308594, 0.10718536376953125, 0.11275672912597656, 0.11832809448242188, 0.12389945983886719, 0.1294708251953125, 0.1350421905517578, 0.14061355590820312, 0.14618492126464844, 0.15175628662109375, 0.15732765197753906, 0.16289901733398438, 0.1684703826904297, 0.174041748046875, 0.1796131134033203, 0.18518447875976562, 0.19075584411621094, 0.19632720947265625, 0.20189857482910156, 0.20746994018554688, 0.2130413055419922, 0.2186126708984375, 0.2241840362548828, 0.22975540161132812, 0.23532676696777344, 0.24089813232421875, 0.24646949768066406, 0.2520408630371094, 0.2576122283935547, 0.26318359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 11.0, 19.0, 33.0, 95.0, 197.0, 282.0, 197.0, 82.0, 39.0, 11.0, 13.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7471466064453125, -0.6986462473869324, -0.6501458883285522, -0.6016455292701721, -0.553145170211792, -0.5046448111534119, -0.45614445209503174, -0.4076440930366516, -0.3591437339782715, -0.31064337491989136, -0.26214301586151123, -0.2136426568031311, -0.16514229774475098, -0.11664193868637085, -0.06814157962799072, -0.019641220569610596, 0.02885913848876953, 0.07735949754714966, 0.12585985660552979, 0.1743602156639099, 0.22286057472229004, 0.27136093378067017, 0.3198612928390503, 0.3683616518974304, 0.41686201095581055, 0.4653623700141907, 0.5138627290725708, 0.5623630881309509, 0.610863447189331, 0.6593638062477112, 0.7078641653060913, 0.7563645243644714, 0.8048648834228516, 0.8533652424812317, 0.9018656015396118, 0.9503659605979919, 0.9988663196563721, 1.0473666191101074, 1.0958670377731323, 1.1443674564361572, 1.1928677558898926, 1.241368055343628, 1.2898684740066528, 1.3383688926696777, 1.386869192123413, 1.4353694915771484, 1.4838699102401733, 1.5323703289031982, 1.5808706283569336, 1.629370927810669, 1.6778713464736938, 1.7263717651367188, 1.774872064590454, 1.8233723640441895, 1.8718727827072144, 1.9203732013702393, 1.9688735008239746, 2.01737380027771, 2.0658740997314453, 2.1143746376037598, 2.162874937057495, 2.2113752365112305, 2.259875774383545, 2.3083760738372803, 2.3568763732910156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 6.0, 9.0, 13.0, 22.0, 25.0, 27.0, 35.0, 36.0, 43.0, 54.0, 54.0, 54.0, 54.0, 52.0, 58.0, 55.0, 43.0, 53.0, 45.0, 35.0, 42.0, 32.0, 30.0, 28.0, 18.0, 19.0, 11.0, 9.0, 5.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.45279455184936523, -0.4397910237312317, -0.42678749561309814, -0.4137839674949646, -0.40078043937683105, -0.3877769112586975, -0.37477338314056396, -0.3617698550224304, -0.3487663269042969, -0.33576279878616333, -0.3227592706680298, -0.30975574254989624, -0.2967522144317627, -0.28374868631362915, -0.2707451581954956, -0.25774163007736206, -0.24473808705806732, -0.23173455893993378, -0.21873103082180023, -0.2057275027036667, -0.19272397458553314, -0.1797204315662384, -0.16671690344810486, -0.1537133753299713, -0.14070984721183777, -0.12770631909370422, -0.11470279097557068, -0.10169926285743713, -0.08869573473930359, -0.07569219917058945, -0.0626886710524559, -0.04968514293432236, -0.03668162226676941, -0.023678094148635864, -0.01067456416785717, 0.002328965812921524, 0.015332493931055069, 0.028336025774478912, 0.04133955389261246, 0.054343082010746, 0.06734661012887955, 0.08035013824701309, 0.09335366636514664, 0.10635720193386078, 0.11936073005199432, 0.13236425817012787, 0.1453677862882614, 0.15837131440639496, 0.1713748425245285, 0.18437837064266205, 0.1973818987607956, 0.21038542687892914, 0.22338895499706268, 0.23639249801635742, 0.24939602613449097, 0.2623995542526245, 0.27540308237075806, 0.2884066104888916, 0.30141013860702515, 0.3144136667251587, 0.32741719484329224, 0.3404207229614258, 0.3534242510795593, 0.36642777919769287, 0.3794313073158264]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 2.0, 7.0, 14.0, 24.0, 30.0, 49.0, 55.0, 99.0, 133.0, 204.0, 386.0, 647.0, 1072.0, 1996.0, 3758.0, 8045.0, 17641.0, 44543.0, 130616.0, 358496.0, 309646.0, 104462.0, 37040.0, 15113.0, 6828.0, 3423.0, 1731.0, 962.0, 564.0, 342.0, 219.0, 147.0, 82.0, 59.0, 31.0, 20.0, 19.0, 14.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0479736328125, -0.04612159729003906, -0.044269561767578125, -0.04241752624511719, -0.04056549072265625, -0.03871345520019531, -0.036861419677734375, -0.03500938415527344, -0.0331573486328125, -0.03130531311035156, -0.029453277587890625, -0.027601242065429688, -0.02574920654296875, -0.023897171020507812, -0.022045135498046875, -0.020193099975585938, -0.018341064453125, -0.016489028930664062, -0.014636993408203125, -0.012784957885742188, -0.01093292236328125, -0.009080886840820312, -0.007228851318359375, -0.0053768157958984375, -0.0035247802734375, -0.0016727447509765625, 0.000179290771484375, 0.0020313262939453125, 0.00388336181640625, 0.0057353973388671875, 0.007587432861328125, 0.009439468383789062, 0.01129150390625, 0.013143539428710938, 0.014995574951171875, 0.016847610473632812, 0.01869964599609375, 0.020551681518554688, 0.022403717041015625, 0.024255752563476562, 0.0261077880859375, 0.027959823608398438, 0.029811859130859375, 0.03166389465332031, 0.03351593017578125, 0.03536796569824219, 0.037220001220703125, 0.03907203674316406, 0.040924072265625, 0.04277610778808594, 0.044628143310546875, 0.04648017883300781, 0.04833221435546875, 0.05018424987792969, 0.052036285400390625, 0.05388832092285156, 0.0557403564453125, 0.05759239196777344, 0.059444427490234375, 0.06129646301269531, 0.06314849853515625, 0.06500053405761719, 0.06685256958007812, 0.06870460510253906, 0.070556640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 6.0, 6.0, 9.0, 13.0, 11.0, 14.0, 18.0, 26.0, 30.0, 18.0, 34.0, 26.0, 38.0, 46.0, 39.0, 46.0, 46.0, 42.0, 48.0, 48.0, 46.0, 34.0, 41.0, 41.0, 32.0, 27.0, 25.0, 32.0, 20.0, 23.0, 22.0, 13.0, 9.0, 10.0, 13.0, 8.0, 6.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.0307769775390625, -0.029875516891479492, -0.028974056243896484, -0.028072595596313477, -0.02717113494873047, -0.02626967430114746, -0.025368213653564453, -0.024466753005981445, -0.023565292358398438, -0.02266383171081543, -0.021762371063232422, -0.020860910415649414, -0.019959449768066406, -0.0190579891204834, -0.01815652847290039, -0.017255067825317383, -0.016353607177734375, -0.015452146530151367, -0.01455068588256836, -0.013649225234985352, -0.012747764587402344, -0.011846303939819336, -0.010944843292236328, -0.01004338264465332, -0.009141921997070312, -0.008240461349487305, -0.007339000701904297, -0.006437540054321289, -0.005536079406738281, -0.0046346187591552734, -0.0037331581115722656, -0.002831697463989258, -0.00193023681640625, -0.0010287761688232422, -0.00012731552124023438, 0.0007741451263427734, 0.0016756057739257812, 0.002577066421508789, 0.003478527069091797, 0.004379987716674805, 0.0052814483642578125, 0.00618290901184082, 0.007084369659423828, 0.007985830307006836, 0.008887290954589844, 0.009788751602172852, 0.01069021224975586, 0.011591672897338867, 0.012493133544921875, 0.013394594192504883, 0.01429605484008789, 0.015197515487670898, 0.016098976135253906, 0.017000436782836914, 0.017901897430419922, 0.01880335807800293, 0.019704818725585938, 0.020606279373168945, 0.021507740020751953, 0.02240920066833496, 0.02331066131591797, 0.024212121963500977, 0.025113582611083984, 0.026015043258666992, 0.02691650390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 12.0, 10.0, 13.0, 25.0, 15.0, 44.0, 77.0, 92.0, 155.0, 271.0, 529.0, 1326.0, 4033.0, 19946.0, 264103.0, 709735.0, 38667.0, 6142.0, 1797.0, 682.0, 322.0, 199.0, 111.0, 80.0, 51.0, 31.0, 18.0, 20.0, 10.0, 11.0, 4.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.1749267578125, -0.1693115234375, -0.1636962890625, -0.1580810546875, -0.1524658203125, -0.1468505859375, -0.1412353515625, -0.1356201171875, -0.1300048828125, -0.1243896484375, -0.1187744140625, -0.1131591796875, -0.1075439453125, -0.1019287109375, -0.0963134765625, -0.0906982421875, -0.0850830078125, -0.0794677734375, -0.0738525390625, -0.0682373046875, -0.0626220703125, -0.0570068359375, -0.0513916015625, -0.0457763671875, -0.0401611328125, -0.0345458984375, -0.0289306640625, -0.0233154296875, -0.0177001953125, -0.0120849609375, -0.0064697265625, -0.0008544921875, 0.0047607421875, 0.0103759765625, 0.0159912109375, 0.0216064453125, 0.0272216796875, 0.0328369140625, 0.0384521484375, 0.0440673828125, 0.0496826171875, 0.0552978515625, 0.0609130859375, 0.0665283203125, 0.0721435546875, 0.0777587890625, 0.0833740234375, 0.0889892578125, 0.0946044921875, 0.1002197265625, 0.1058349609375, 0.1114501953125, 0.1170654296875, 0.1226806640625, 0.1282958984375, 0.1339111328125, 0.1395263671875, 0.1451416015625, 0.1507568359375, 0.1563720703125, 0.1619873046875, 0.1676025390625, 0.1732177734375, 0.1788330078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 9.0, 7.0, 9.0, 12.0, 8.0, 16.0, 21.0, 17.0, 38.0, 27.0, 31.0, 38.0, 40.0, 45.0, 58.0, 53.0, 50.0, 50.0, 60.0, 53.0, 52.0, 41.0, 47.0, 30.0, 35.0, 36.0, 26.0, 13.0, 23.0, 8.0, 10.0, 8.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.1214599609375, -0.117431640625, -0.1134033203125, -0.109375, -0.1053466796875, -0.101318359375, -0.0972900390625, -0.09326171875, -0.0892333984375, -0.085205078125, -0.0811767578125, -0.0771484375, -0.0731201171875, -0.069091796875, -0.0650634765625, -0.06103515625, -0.0570068359375, -0.052978515625, -0.0489501953125, -0.044921875, -0.0408935546875, -0.036865234375, -0.0328369140625, -0.02880859375, -0.0247802734375, -0.020751953125, -0.0167236328125, -0.0126953125, -0.0086669921875, -0.004638671875, -0.0006103515625, 0.00341796875, 0.0074462890625, 0.011474609375, 0.0155029296875, 0.01953125, 0.0235595703125, 0.027587890625, 0.0316162109375, 0.03564453125, 0.0396728515625, 0.043701171875, 0.0477294921875, 0.0517578125, 0.0557861328125, 0.059814453125, 0.0638427734375, 0.06787109375, 0.0718994140625, 0.075927734375, 0.0799560546875, 0.083984375, 0.0880126953125, 0.092041015625, 0.0960693359375, 0.10009765625, 0.1041259765625, 0.108154296875, 0.1121826171875, 0.1162109375, 0.1202392578125, 0.124267578125, 0.1282958984375, 0.13232421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 15.0, 13.0, 13.0, 20.0, 31.0, 46.0, 54.0, 74.0, 100.0, 141.0, 204.0, 277.0, 432.0, 676.0, 1053.0, 1835.0, 3616.0, 7707.0, 22153.0, 93530.0, 707454.0, 158195.0, 30903.0, 10035.0, 4236.0, 2158.0, 1177.0, 771.0, 509.0, 332.0, 229.0, 149.0, 97.0, 80.0, 55.0, 45.0, 37.0, 23.0, 17.0, 12.0, 6.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.052886962890625, -0.051215171813964844, -0.04954338073730469, -0.04787158966064453, -0.046199798583984375, -0.04452800750732422, -0.04285621643066406, -0.041184425354003906, -0.03951263427734375, -0.037840843200683594, -0.03616905212402344, -0.03449726104736328, -0.032825469970703125, -0.03115367889404297, -0.029481887817382812, -0.027810096740722656, -0.0261383056640625, -0.024466514587402344, -0.022794723510742188, -0.02112293243408203, -0.019451141357421875, -0.01777935028076172, -0.016107559204101562, -0.014435768127441406, -0.01276397705078125, -0.011092185974121094, -0.009420394897460938, -0.007748603820800781, -0.006076812744140625, -0.004405021667480469, -0.0027332305908203125, -0.0010614395141601562, 0.0006103515625, 0.0022821426391601562, 0.0039539337158203125, 0.005625724792480469, 0.007297515869140625, 0.008969306945800781, 0.010641098022460938, 0.012312889099121094, 0.01398468017578125, 0.015656471252441406, 0.017328262329101562, 0.01900005340576172, 0.020671844482421875, 0.02234363555908203, 0.024015426635742188, 0.025687217712402344, 0.0273590087890625, 0.029030799865722656, 0.030702590942382812, 0.03237438201904297, 0.034046173095703125, 0.03571796417236328, 0.03738975524902344, 0.039061546325683594, 0.04073333740234375, 0.042405128479003906, 0.04407691955566406, 0.04574871063232422, 0.047420501708984375, 0.04909229278564453, 0.05076408386230469, 0.052435874938964844, 0.054107666015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 8.0, 9.0, 13.0, 23.0, 40.0, 69.0, 64.0, 84.0, 128.0, 106.0, 104.0, 80.0, 83.0, 52.0, 38.0, 28.0, 19.0, 16.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.141164779663086e-05, -3.0310824513435364e-05, -2.9210001230239868e-05, -2.8109177947044373e-05, -2.7008354663848877e-05, -2.590753138065338e-05, -2.4806708097457886e-05, -2.370588481426239e-05, -2.2605061531066895e-05, -2.15042382478714e-05, -2.0403414964675903e-05, -1.9302591681480408e-05, -1.8201768398284912e-05, -1.7100945115089417e-05, -1.600012183189392e-05, -1.4899298548698425e-05, -1.379847526550293e-05, -1.2697651982307434e-05, -1.1596828699111938e-05, -1.0496005415916443e-05, -9.395182132720947e-06, -8.294358849525452e-06, -7.193535566329956e-06, -6.0927122831344604e-06, -4.991888999938965e-06, -3.891065716743469e-06, -2.7902424335479736e-06, -1.689419150352478e-06, -5.885958671569824e-07, 5.122274160385132e-07, 1.6130506992340088e-06, 2.7138739824295044e-06, 3.814697265625e-06, 4.915520548820496e-06, 6.016343832015991e-06, 7.117167115211487e-06, 8.217990398406982e-06, 9.318813681602478e-06, 1.0419636964797974e-05, 1.152046024799347e-05, 1.2621283531188965e-05, 1.372210681438446e-05, 1.4822930097579956e-05, 1.592375338077545e-05, 1.7024576663970947e-05, 1.8125399947166443e-05, 1.922622323036194e-05, 2.0327046513557434e-05, 2.142786979675293e-05, 2.2528693079948425e-05, 2.362951636314392e-05, 2.4730339646339417e-05, 2.5831162929534912e-05, 2.6931986212730408e-05, 2.8032809495925903e-05, 2.91336327791214e-05, 3.0234456062316895e-05, 3.133527934551239e-05, 3.2436102628707886e-05, 3.353692591190338e-05, 3.463774919509888e-05, 3.573857247829437e-05, 3.683939576148987e-05, 3.7940219044685364e-05, 3.904104232788086e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 8.0, 4.0, 6.0, 12.0, 13.0, 29.0, 30.0, 48.0, 68.0, 104.0, 139.0, 186.0, 311.0, 473.0, 738.0, 1210.0, 2048.0, 3734.0, 6963.0, 14996.0, 38855.0, 137434.0, 614032.0, 152886.0, 42113.0, 15718.0, 7274.0, 3684.0, 2013.0, 1222.0, 746.0, 469.0, 316.0, 197.0, 134.0, 94.0, 72.0, 47.0, 44.0, 20.0, 21.0, 17.0, 6.0, 4.0, 4.0, 3.0, 0.0, 4.0, 0.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039703369140625, -0.03840303421020508, -0.037102699279785156, -0.035802364349365234, -0.03450202941894531, -0.03320169448852539, -0.03190135955810547, -0.030601024627685547, -0.029300689697265625, -0.028000354766845703, -0.02670001983642578, -0.02539968490600586, -0.024099349975585938, -0.022799015045166016, -0.021498680114746094, -0.020198345184326172, -0.01889801025390625, -0.017597675323486328, -0.016297340393066406, -0.014997005462646484, -0.013696670532226562, -0.01239633560180664, -0.011096000671386719, -0.009795665740966797, -0.008495330810546875, -0.007194995880126953, -0.005894660949707031, -0.004594326019287109, -0.0032939910888671875, -0.0019936561584472656, -0.0006933212280273438, 0.0006070137023925781, 0.0019073486328125, 0.003207683563232422, 0.004508018493652344, 0.005808353424072266, 0.0071086883544921875, 0.00840902328491211, 0.009709358215332031, 0.011009693145751953, 0.012310028076171875, 0.013610363006591797, 0.014910697937011719, 0.01621103286743164, 0.017511367797851562, 0.018811702728271484, 0.020112037658691406, 0.021412372589111328, 0.02271270751953125, 0.024013042449951172, 0.025313377380371094, 0.026613712310791016, 0.027914047241210938, 0.02921438217163086, 0.03051471710205078, 0.0318150520324707, 0.033115386962890625, 0.03441572189331055, 0.03571605682373047, 0.03701639175415039, 0.03831672668457031, 0.039617061614990234, 0.040917396545410156, 0.04221773147583008, 0.04351806640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 6.0, 15.0, 27.0, 39.0, 39.0, 53.0, 65.0, 89.0, 109.0, 104.0, 98.0, 82.0, 41.0, 55.0, 42.0, 30.0, 19.0, 20.0, 10.0, 10.0, 8.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0499267578125, -0.04828977584838867, -0.046652793884277344, -0.045015811920166016, -0.04337882995605469, -0.04174184799194336, -0.04010486602783203, -0.0384678840637207, -0.036830902099609375, -0.03519392013549805, -0.03355693817138672, -0.03191995620727539, -0.030282974243164062, -0.028645992279052734, -0.027009010314941406, -0.025372028350830078, -0.02373504638671875, -0.022098064422607422, -0.020461082458496094, -0.018824100494384766, -0.017187118530273438, -0.01555013656616211, -0.013913154602050781, -0.012276172637939453, -0.010639190673828125, -0.009002208709716797, -0.007365226745605469, -0.005728244781494141, -0.0040912628173828125, -0.0024542808532714844, -0.0008172988891601562, 0.0008196830749511719, 0.0024566650390625, 0.004093647003173828, 0.005730628967285156, 0.007367610931396484, 0.009004592895507812, 0.01064157485961914, 0.012278556823730469, 0.013915538787841797, 0.015552520751953125, 0.017189502716064453, 0.01882648468017578, 0.02046346664428711, 0.022100448608398438, 0.023737430572509766, 0.025374412536621094, 0.027011394500732422, 0.02864837646484375, 0.030285358428955078, 0.031922340393066406, 0.033559322357177734, 0.03519630432128906, 0.03683328628540039, 0.03847026824951172, 0.04010725021362305, 0.041744232177734375, 0.0433812141418457, 0.04501819610595703, 0.04665517807006836, 0.04829216003417969, 0.049929141998291016, 0.051566123962402344, 0.05320310592651367, 0.054840087890625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 15.0, 15.0, 39.0, 88.0, 192.0, 342.0, 155.0, 82.0, 33.0, 18.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2531659603118896, -2.2084152698516846, -2.1636648178100586, -2.1189141273498535, -2.0741634368896484, -2.0294129848480225, -1.9846622943878174, -1.9399117231369019, -1.8951611518859863, -1.8504105806350708, -1.8056598901748657, -1.7609093189239502, -1.7161587476730347, -1.6714081764221191, -1.626657485961914, -1.5819069147109985, -1.5371562242507935, -1.492405652999878, -1.4476549625396729, -1.4029043912887573, -1.3581538200378418, -1.3134031295776367, -1.2686525583267212, -1.2239019870758057, -1.1791512966156006, -1.134400725364685, -1.08965003490448, -1.0448994636535645, -1.000148892402649, -0.9553982615470886, -0.9106476306915283, -0.8658970594406128, -0.8211463689804077, -0.7763957381248474, -0.7316451668739319, -0.6868945360183716, -0.642143964767456, -0.5973933339118958, -0.5526427030563354, -0.5078921318054199, -0.4631415009498596, -0.4183908998966217, -0.3736402988433838, -0.3288896679878235, -0.28413906693458557, -0.23938846588134766, -0.19463783502578735, -0.14988723397254944, -0.10513663291931152, -0.06038602441549301, -0.0156354159116745, 0.02911520004272461, 0.07386580109596252, 0.11861640214920044, 0.16336703300476074, 0.20811763405799866, 0.2528682351112366, 0.2976188361644745, 0.3423694372177124, 0.3871200680732727, 0.4318706691265106, 0.47662127017974854, 0.5213719010353088, 0.5661225318908691, 0.6108731031417847]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 9.0, 9.0, 9.0, 7.0, 5.0, 7.0, 12.0, 27.0, 10.0, 24.0, 27.0, 32.0, 25.0, 32.0, 52.0, 44.0, 65.0, 86.0, 86.0, 64.0, 51.0, 42.0, 42.0, 25.0, 37.0, 23.0, 21.0, 27.0, 17.0, 19.0, 11.0, 11.0, 6.0, 10.0, 7.0, 6.0, 3.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5554711818695068, -0.5392701029777527, -0.5230690240859985, -0.5068679451942444, -0.4906668961048126, -0.47446581721305847, -0.4582647681236267, -0.44206368923187256, -0.4258626103401184, -0.40966153144836426, -0.3934604525566101, -0.37725940346717834, -0.3610583245754242, -0.34485724568367004, -0.3286561965942383, -0.31245511770248413, -0.29625403881073, -0.28005295991897583, -0.2638518810272217, -0.24765083193778992, -0.23144975304603577, -0.21524867415428162, -0.19904761016368866, -0.1828465461730957, -0.16664546728134155, -0.1504443883895874, -0.13424332439899445, -0.11804225295782089, -0.10184118151664734, -0.08564011007547379, -0.06943903863430023, -0.05323796719312668, -0.037036895751953125, -0.02083582431077957, -0.004634752869606018, 0.011566318571567535, 0.02776739001274109, 0.04396846145391464, 0.060169532895088196, 0.07637060433626175, 0.0925716757774353, 0.10877274721860886, 0.12497381865978241, 0.14117488265037537, 0.15737596154212952, 0.17357704043388367, 0.18977810442447662, 0.20597916841506958, 0.22218024730682373, 0.23838132619857788, 0.25458240509033203, 0.2707834541797638, 0.28698453307151794, 0.3031856119632721, 0.31938666105270386, 0.335587739944458, 0.35178881883621216, 0.3679898977279663, 0.38419097661972046, 0.4003920257091522, 0.41659310460090637, 0.4327941834926605, 0.4489952325820923, 0.46519631147384644, 0.4813973903656006]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 11.0, 12.0, 18.0, 18.0, 16.0, 22.0, 39.0, 55.0, 105.0, 151.0, 230.0, 361.0, 560.0, 975.0, 1887.0, 3867.0, 9744.0, 40109.0, 716576.0, 3252771.0, 136388.0, 18476.0, 6031.0, 2560.0, 1328.0, 723.0, 406.0, 272.0, 165.0, 111.0, 85.0, 58.0, 34.0, 25.0, 20.0, 16.0, 12.0, 10.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07086181640625, -0.06826210021972656, -0.06566238403320312, -0.06306266784667969, -0.06046295166015625, -0.05786323547363281, -0.055263519287109375, -0.05266380310058594, -0.0500640869140625, -0.04746437072753906, -0.044864654541015625, -0.04226493835449219, -0.03966522216796875, -0.03706550598144531, -0.034465789794921875, -0.03186607360839844, -0.029266357421875, -0.026666641235351562, -0.024066925048828125, -0.021467208862304688, -0.01886749267578125, -0.016267776489257812, -0.013668060302734375, -0.011068344116210938, -0.0084686279296875, -0.0058689117431640625, -0.003269195556640625, -0.0006694793701171875, 0.00193023681640625, 0.0045299530029296875, 0.007129669189453125, 0.009729385375976562, 0.0123291015625, 0.014928817749023438, 0.017528533935546875, 0.020128250122070312, 0.02272796630859375, 0.025327682495117188, 0.027927398681640625, 0.030527114868164062, 0.0331268310546875, 0.03572654724121094, 0.038326263427734375, 0.04092597961425781, 0.04352569580078125, 0.04612541198730469, 0.048725128173828125, 0.05132484436035156, 0.053924560546875, 0.05652427673339844, 0.059123992919921875, 0.06172370910644531, 0.06432342529296875, 0.06692314147949219, 0.06952285766601562, 0.07212257385253906, 0.0747222900390625, 0.07732200622558594, 0.07992172241210938, 0.08252143859863281, 0.08512115478515625, 0.08772087097167969, 0.09032058715820312, 0.09292030334472656, 0.09552001953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 7.0, 11.0, 18.0, 10.0, 18.0, 21.0, 32.0, 29.0, 25.0, 48.0, 49.0, 41.0, 38.0, 42.0, 51.0, 53.0, 52.0, 44.0, 57.0, 54.0, 35.0, 41.0, 29.0, 31.0, 30.0, 22.0, 11.0, 24.0, 13.0, 5.0, 11.0, 8.0, 3.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0303192138671875, -0.029388904571533203, -0.028458595275878906, -0.02752828598022461, -0.026597976684570312, -0.025667667388916016, -0.02473735809326172, -0.023807048797607422, -0.022876739501953125, -0.021946430206298828, -0.02101612091064453, -0.020085811614990234, -0.019155502319335938, -0.01822519302368164, -0.017294883728027344, -0.016364574432373047, -0.01543426513671875, -0.014503955841064453, -0.013573646545410156, -0.01264333724975586, -0.011713027954101562, -0.010782718658447266, -0.009852409362792969, -0.008922100067138672, -0.007991790771484375, -0.007061481475830078, -0.006131172180175781, -0.005200862884521484, -0.0042705535888671875, -0.0033402442932128906, -0.0024099349975585938, -0.0014796257019042969, -0.00054931640625, 0.0003809928894042969, 0.0013113021850585938, 0.0022416114807128906, 0.0031719207763671875, 0.004102230072021484, 0.005032539367675781, 0.005962848663330078, 0.006893157958984375, 0.007823467254638672, 0.008753776550292969, 0.009684085845947266, 0.010614395141601562, 0.01154470443725586, 0.012475013732910156, 0.013405323028564453, 0.01433563232421875, 0.015265941619873047, 0.016196250915527344, 0.01712656021118164, 0.018056869506835938, 0.018987178802490234, 0.01991748809814453, 0.020847797393798828, 0.021778106689453125, 0.022708415985107422, 0.02363872528076172, 0.024569034576416016, 0.025499343872070312, 0.02642965316772461, 0.027359962463378906, 0.028290271759033203, 0.0292205810546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 15.0, 8.0, 15.0, 35.0, 66.0, 132.0, 278.0, 780.0, 2698.0, 28912.0, 4119550.0, 37658.0, 2944.0, 707.0, 257.0, 126.0, 45.0, 23.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330322265625, -0.3191375732421875, -0.307952880859375, -0.2967681884765625, -0.28558349609375, -0.2743988037109375, -0.263214111328125, -0.2520294189453125, -0.2408447265625, -0.2296600341796875, -0.218475341796875, -0.2072906494140625, -0.19610595703125, -0.1849212646484375, -0.173736572265625, -0.1625518798828125, -0.1513671875, -0.1401824951171875, -0.128997802734375, -0.1178131103515625, -0.10662841796875, -0.0954437255859375, -0.084259033203125, -0.0730743408203125, -0.0618896484375, -0.0507049560546875, -0.039520263671875, -0.0283355712890625, -0.01715087890625, -0.0059661865234375, 0.005218505859375, 0.0164031982421875, 0.027587890625, 0.0387725830078125, 0.049957275390625, 0.0611419677734375, 0.07232666015625, 0.0835113525390625, 0.094696044921875, 0.1058807373046875, 0.1170654296875, 0.1282501220703125, 0.139434814453125, 0.1506195068359375, 0.16180419921875, 0.1729888916015625, 0.184173583984375, 0.1953582763671875, 0.20654296875, 0.2177276611328125, 0.228912353515625, 0.2400970458984375, 0.25128173828125, 0.2624664306640625, 0.273651123046875, 0.2848358154296875, 0.2960205078125, 0.3072052001953125, 0.318389892578125, 0.3295745849609375, 0.34075927734375, 0.3519439697265625, 0.363128662109375, 0.3743133544921875, 0.385498046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 7.0, 6.0, 17.0, 24.0, 40.0, 114.0, 432.0, 2008.0, 1071.0, 210.0, 71.0, 30.0, 24.0, 14.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2808341979980469, -0.27358245849609375, -0.2663307189941406, -0.2590789794921875, -0.2518272399902344, -0.24457550048828125, -0.23732376098632812, -0.230072021484375, -0.22282028198242188, -0.21556854248046875, -0.20831680297851562, -0.2010650634765625, -0.19381332397460938, -0.18656158447265625, -0.17930984497070312, -0.17205810546875, -0.16480636596679688, -0.15755462646484375, -0.15030288696289062, -0.1430511474609375, -0.13579940795898438, -0.12854766845703125, -0.12129592895507812, -0.114044189453125, -0.10679244995117188, -0.09954071044921875, -0.09228897094726562, -0.0850372314453125, -0.07778549194335938, -0.07053375244140625, -0.06328201293945312, -0.0560302734375, -0.048778533935546875, -0.04152679443359375, -0.034275054931640625, -0.0270233154296875, -0.019771575927734375, -0.01251983642578125, -0.005268096923828125, 0.001983642578125, 0.009235382080078125, 0.01648712158203125, 0.023738861083984375, 0.0309906005859375, 0.038242340087890625, 0.04549407958984375, 0.052745819091796875, 0.05999755859375, 0.06724929809570312, 0.07450103759765625, 0.08175277709960938, 0.0890045166015625, 0.09625625610351562, 0.10350799560546875, 0.11075973510742188, 0.118011474609375, 0.12526321411132812, 0.13251495361328125, 0.13976669311523438, 0.1470184326171875, 0.15427017211914062, 0.16152191162109375, 0.16877365112304688, 0.176025390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 14.0, 18.0, 43.0, 101.0, 187.0, 281.0, 205.0, 86.0, 31.0, 16.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.298693895339966, -2.2515151500701904, -2.204336643218994, -2.1571578979492188, -2.1099791526794434, -2.062800407409668, -2.0156216621398926, -1.9684431552886963, -1.921264410018921, -1.8740856647491455, -1.8269070386886597, -1.7797284126281738, -1.7325496673583984, -1.685370922088623, -1.6381922960281372, -1.5910136699676514, -1.543834924697876, -1.4966561794281006, -1.4494775533676147, -1.402298927307129, -1.3551201820373535, -1.3079414367675781, -1.2607628107070923, -1.2135841846466064, -1.166405439376831, -1.1192266941070557, -1.0720480680465698, -1.024869441986084, -0.9776906967163086, -0.930512011051178, -0.8833333253860474, -0.8361546397209167, -0.7889760732650757, -0.7417973875999451, -0.6946187019348145, -0.6474400162696838, -0.6002613306045532, -0.5530826449394226, -0.505903959274292, -0.4587252736091614, -0.41154658794403076, -0.36436790227890015, -0.31718921661376953, -0.2700105309486389, -0.2228318452835083, -0.17565315961837769, -0.12847447395324707, -0.08129578828811646, -0.03411710262298584, 0.013061583042144775, 0.06024026870727539, 0.107418954372406, 0.15459764003753662, 0.20177632570266724, 0.24895501136779785, 0.29613369703292847, 0.3433123826980591, 0.3904910683631897, 0.4376697540283203, 0.4848484396934509, 0.5320271253585815, 0.5792058110237122, 0.6263844966888428, 0.6735631823539734, 0.720741868019104]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 3.0, 7.0, 9.0, 14.0, 11.0, 8.0, 15.0, 17.0, 25.0, 26.0, 29.0, 42.0, 33.0, 35.0, 45.0, 31.0, 40.0, 40.0, 49.0, 40.0, 33.0, 51.0, 32.0, 36.0, 43.0, 37.0, 26.0, 25.0, 32.0, 20.0, 17.0, 17.0, 15.0, 10.0, 14.0, 11.0, 5.0, 12.0, 5.0, 1.0, 7.0, 4.0, 3.0, 0.0, 8.0, 1.0, 1.0, 5.0], "bins": [-0.4417431950569153, -0.42889025807380676, -0.41603735089302063, -0.4031844139099121, -0.390331506729126, -0.37747856974601746, -0.36462563276290894, -0.3517727255821228, -0.3389197885990143, -0.32606685161590576, -0.31321394443511963, -0.3003610074520111, -0.2875080704689026, -0.27465516328811646, -0.26180222630500793, -0.2489493042230606, -0.23609638214111328, -0.22324346005916595, -0.21039053797721863, -0.1975376009941101, -0.18468467891216278, -0.17183175683021545, -0.15897881984710693, -0.1461258977651596, -0.13327297568321228, -0.12042005360126495, -0.10756712406873703, -0.0947141945362091, -0.08186127245426178, -0.06900835037231445, -0.05615542083978653, -0.043302491307258606, -0.03044956922531128, -0.017596643418073654, -0.004743717610836029, 0.008109208196401596, 0.02096213400363922, 0.03381505608558655, 0.04666798561811447, 0.059520915150642395, 0.07237383723258972, 0.08522675931453705, 0.09807968884706497, 0.1109326183795929, 0.12378554046154022, 0.13663846254348755, 0.14949139952659607, 0.1623443216085434, 0.17519724369049072, 0.18805016577243805, 0.20090308785438538, 0.2137560248374939, 0.22660894691944122, 0.23946186900138855, 0.25231480598449707, 0.2651677131652832, 0.2780206501483917, 0.29087358713150024, 0.3037264943122864, 0.3165794312953949, 0.3294323682785034, 0.34228527545928955, 0.35513821244239807, 0.3679911494255066, 0.3808440566062927]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 11.0, 3.0, 20.0, 18.0, 25.0, 45.0, 69.0, 90.0, 150.0, 223.0, 335.0, 453.0, 769.0, 1400.0, 2415.0, 4149.0, 8011.0, 16150.0, 34809.0, 81997.0, 207319.0, 354188.0, 193605.0, 76337.0, 33219.0, 15436.0, 7555.0, 4049.0, 2211.0, 1343.0, 765.0, 467.0, 306.0, 209.0, 107.0, 89.0, 70.0, 42.0, 22.0, 18.0, 14.0, 9.0, 6.0, 10.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.053802490234375, -0.05224132537841797, -0.05068016052246094, -0.049118995666503906, -0.047557830810546875, -0.045996665954589844, -0.04443550109863281, -0.04287433624267578, -0.04131317138671875, -0.03975200653076172, -0.03819084167480469, -0.036629676818847656, -0.035068511962890625, -0.033507347106933594, -0.03194618225097656, -0.03038501739501953, -0.0288238525390625, -0.02726268768310547, -0.025701522827148438, -0.024140357971191406, -0.022579193115234375, -0.021018028259277344, -0.019456863403320312, -0.01789569854736328, -0.01633453369140625, -0.014773368835449219, -0.013212203979492188, -0.011651039123535156, -0.010089874267578125, -0.008528709411621094, -0.0069675445556640625, -0.005406379699707031, -0.00384521484375, -0.0022840499877929688, -0.0007228851318359375, 0.0008382797241210938, 0.002399444580078125, 0.003960609436035156, 0.0055217742919921875, 0.007082939147949219, 0.00864410400390625, 0.010205268859863281, 0.011766433715820312, 0.013327598571777344, 0.014888763427734375, 0.016449928283691406, 0.018011093139648438, 0.01957225799560547, 0.0211334228515625, 0.02269458770751953, 0.024255752563476562, 0.025816917419433594, 0.027378082275390625, 0.028939247131347656, 0.030500411987304688, 0.03206157684326172, 0.03362274169921875, 0.03518390655517578, 0.03674507141113281, 0.038306236267089844, 0.039867401123046875, 0.041428565979003906, 0.04298973083496094, 0.04455089569091797, 0.046112060546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 15.0, 19.0, 19.0, 17.0, 21.0, 27.0, 35.0, 32.0, 49.0, 52.0, 52.0, 48.0, 61.0, 44.0, 74.0, 51.0, 57.0, 56.0, 40.0, 32.0, 34.0, 29.0, 24.0, 21.0, 13.0, 10.0, 12.0, 10.0, 4.0, 5.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.039154052734375, -0.037824153900146484, -0.03649425506591797, -0.03516435623168945, -0.03383445739746094, -0.03250455856323242, -0.031174659729003906, -0.02984476089477539, -0.028514862060546875, -0.02718496322631836, -0.025855064392089844, -0.024525165557861328, -0.023195266723632812, -0.021865367889404297, -0.02053546905517578, -0.019205570220947266, -0.01787567138671875, -0.016545772552490234, -0.015215873718261719, -0.013885974884033203, -0.012556076049804688, -0.011226177215576172, -0.009896278381347656, -0.00856637954711914, -0.007236480712890625, -0.005906581878662109, -0.004576683044433594, -0.003246784210205078, -0.0019168853759765625, -0.0005869865417480469, 0.0007429122924804688, 0.0020728111267089844, 0.0034027099609375, 0.004732608795166016, 0.006062507629394531, 0.007392406463623047, 0.008722305297851562, 0.010052204132080078, 0.011382102966308594, 0.01271200180053711, 0.014041900634765625, 0.01537179946899414, 0.016701698303222656, 0.018031597137451172, 0.019361495971679688, 0.020691394805908203, 0.02202129364013672, 0.023351192474365234, 0.02468109130859375, 0.026010990142822266, 0.02734088897705078, 0.028670787811279297, 0.030000686645507812, 0.03133058547973633, 0.032660484313964844, 0.03399038314819336, 0.035320281982421875, 0.03665018081665039, 0.037980079650878906, 0.03930997848510742, 0.04063987731933594, 0.04196977615356445, 0.04329967498779297, 0.044629573822021484, 0.04595947265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 9.0, 4.0, 8.0, 13.0, 10.0, 18.0, 18.0, 32.0, 47.0, 57.0, 67.0, 108.0, 128.0, 189.0, 274.0, 502.0, 981.0, 2035.0, 5403.0, 19473.0, 105571.0, 733235.0, 144438.0, 24367.0, 6522.0, 2351.0, 1063.0, 522.0, 317.0, 239.0, 144.0, 114.0, 73.0, 47.0, 39.0, 39.0, 21.0, 25.0, 14.0, 13.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1192626953125, -0.11536216735839844, -0.11146163940429688, -0.10756111145019531, -0.10366058349609375, -0.09976005554199219, -0.09585952758789062, -0.09195899963378906, -0.0880584716796875, -0.08415794372558594, -0.08025741577148438, -0.07635688781738281, -0.07245635986328125, -0.06855583190917969, -0.06465530395507812, -0.06075477600097656, -0.056854248046875, -0.05295372009277344, -0.049053192138671875, -0.04515266418457031, -0.04125213623046875, -0.03735160827636719, -0.033451080322265625, -0.029550552368164062, -0.0256500244140625, -0.021749496459960938, -0.017848968505859375, -0.013948440551757812, -0.01004791259765625, -0.0061473846435546875, -0.002246856689453125, 0.0016536712646484375, 0.00555419921875, 0.009454727172851562, 0.013355255126953125, 0.017255783081054688, 0.02115631103515625, 0.025056838989257812, 0.028957366943359375, 0.03285789489746094, 0.0367584228515625, 0.04065895080566406, 0.044559478759765625, 0.04846000671386719, 0.05236053466796875, 0.05626106262207031, 0.060161590576171875, 0.06406211853027344, 0.067962646484375, 0.07186317443847656, 0.07576370239257812, 0.07966423034667969, 0.08356475830078125, 0.08746528625488281, 0.09136581420898438, 0.09526634216308594, 0.0991668701171875, 0.10306739807128906, 0.10696792602539062, 0.11086845397949219, 0.11476898193359375, 0.11866950988769531, 0.12257003784179688, 0.12647056579589844, 0.13037109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 7.0, 5.0, 7.0, 11.0, 10.0, 17.0, 9.0, 13.0, 20.0, 15.0, 19.0, 37.0, 41.0, 44.0, 52.0, 54.0, 49.0, 60.0, 62.0, 68.0, 60.0, 50.0, 39.0, 44.0, 27.0, 34.0, 22.0, 15.0, 21.0, 8.0, 17.0, 9.0, 8.0, 8.0, 8.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1744384765625, -0.16887664794921875, -0.1633148193359375, -0.15775299072265625, -0.152191162109375, -0.14662933349609375, -0.1410675048828125, -0.13550567626953125, -0.12994384765625, -0.12438201904296875, -0.1188201904296875, -0.11325836181640625, -0.107696533203125, -0.10213470458984375, -0.0965728759765625, -0.09101104736328125, -0.08544921875, -0.07988739013671875, -0.0743255615234375, -0.06876373291015625, -0.063201904296875, -0.05764007568359375, -0.0520782470703125, -0.04651641845703125, -0.04095458984375, -0.03539276123046875, -0.0298309326171875, -0.02426910400390625, -0.018707275390625, -0.01314544677734375, -0.0075836181640625, -0.00202178955078125, 0.0035400390625, 0.00910186767578125, 0.0146636962890625, 0.02022552490234375, 0.025787353515625, 0.03134918212890625, 0.0369110107421875, 0.04247283935546875, 0.04803466796875, 0.05359649658203125, 0.0591583251953125, 0.06472015380859375, 0.070281982421875, 0.07584381103515625, 0.0814056396484375, 0.08696746826171875, 0.092529296875, 0.09809112548828125, 0.1036529541015625, 0.10921478271484375, 0.114776611328125, 0.12033843994140625, 0.1259002685546875, 0.13146209716796875, 0.13702392578125, 0.14258575439453125, 0.1481475830078125, 0.15370941162109375, 0.159271240234375, 0.16483306884765625, 0.1703948974609375, 0.17595672607421875, 0.1815185546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 1.0, 16.0, 10.0, 16.0, 28.0, 47.0, 47.0, 59.0, 105.0, 137.0, 227.0, 321.0, 546.0, 1006.0, 1967.0, 4247.0, 11594.0, 41842.0, 599422.0, 329191.0, 38240.0, 10973.0, 4161.0, 1823.0, 958.0, 529.0, 333.0, 202.0, 132.0, 100.0, 75.0, 51.0, 36.0, 26.0, 24.0, 16.0, 12.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06787109375, -0.06593036651611328, -0.06398963928222656, -0.062048912048339844, -0.060108184814453125, -0.058167457580566406, -0.05622673034667969, -0.05428600311279297, -0.05234527587890625, -0.05040454864501953, -0.04846382141113281, -0.046523094177246094, -0.044582366943359375, -0.042641639709472656, -0.04070091247558594, -0.03876018524169922, -0.0368194580078125, -0.03487873077392578, -0.03293800354003906, -0.030997276306152344, -0.029056549072265625, -0.027115821838378906, -0.025175094604492188, -0.02323436737060547, -0.02129364013671875, -0.01935291290283203, -0.017412185668945312, -0.015471458435058594, -0.013530731201171875, -0.011590003967285156, -0.009649276733398438, -0.007708549499511719, -0.005767822265625, -0.0038270950317382812, -0.0018863677978515625, 5.435943603515625e-05, 0.001995086669921875, 0.003935813903808594, 0.0058765411376953125, 0.007817268371582031, 0.00975799560546875, 0.011698722839355469, 0.013639450073242188, 0.015580177307128906, 0.017520904541015625, 0.019461631774902344, 0.021402359008789062, 0.02334308624267578, 0.0252838134765625, 0.02722454071044922, 0.029165267944335938, 0.031105995178222656, 0.033046722412109375, 0.034987449645996094, 0.03692817687988281, 0.03886890411376953, 0.04080963134765625, 0.04275035858154297, 0.04469108581542969, 0.046631813049316406, 0.048572540283203125, 0.050513267517089844, 0.05245399475097656, 0.05439472198486328, 0.05633544921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 10.0, 7.0, 8.0, 13.0, 18.0, 19.0, 28.0, 34.0, 37.0, 55.0, 86.0, 97.0, 106.0, 89.0, 58.0, 73.0, 58.0, 45.0, 28.0, 23.0, 20.0, 25.0, 10.0, 6.0, 10.0, 6.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8967857360839844e-05, -2.8157606720924377e-05, -2.734735608100891e-05, -2.6537105441093445e-05, -2.572685480117798e-05, -2.4916604161262512e-05, -2.4106353521347046e-05, -2.329610288143158e-05, -2.2485852241516113e-05, -2.1675601601600647e-05, -2.086535096168518e-05, -2.0055100321769714e-05, -1.9244849681854248e-05, -1.8434599041938782e-05, -1.7624348402023315e-05, -1.681409776210785e-05, -1.6003847122192383e-05, -1.5193596482276917e-05, -1.438334584236145e-05, -1.3573095202445984e-05, -1.2762844562530518e-05, -1.1952593922615051e-05, -1.1142343282699585e-05, -1.0332092642784119e-05, -9.521842002868652e-06, -8.711591362953186e-06, -7.90134072303772e-06, -7.091090083122253e-06, -6.280839443206787e-06, -5.470588803291321e-06, -4.6603381633758545e-06, -3.850087523460388e-06, -3.039836883544922e-06, -2.2295862436294556e-06, -1.4193356037139893e-06, -6.09084963798523e-07, 2.0116567611694336e-07, 1.0114163160324097e-06, 1.821666955947876e-06, 2.6319175958633423e-06, 3.4421682357788086e-06, 4.252418875694275e-06, 5.062669515609741e-06, 5.8729201555252075e-06, 6.683170795440674e-06, 7.49342143535614e-06, 8.303672075271606e-06, 9.113922715187073e-06, 9.924173355102539e-06, 1.0734423995018005e-05, 1.1544674634933472e-05, 1.2354925274848938e-05, 1.3165175914764404e-05, 1.397542655467987e-05, 1.4785677194595337e-05, 1.5595927834510803e-05, 1.640617847442627e-05, 1.7216429114341736e-05, 1.8026679754257202e-05, 1.883693039417267e-05, 1.9647181034088135e-05, 2.04574316740036e-05, 2.1267682313919067e-05, 2.2077932953834534e-05, 2.288818359375e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 7.0, 9.0, 7.0, 13.0, 15.0, 14.0, 28.0, 40.0, 56.0, 101.0, 158.0, 231.0, 460.0, 865.0, 2056.0, 5419.0, 18091.0, 97708.0, 813505.0, 84319.0, 16444.0, 5062.0, 1990.0, 857.0, 455.0, 243.0, 123.0, 81.0, 49.0, 27.0, 31.0, 28.0, 12.0, 14.0, 7.0, 5.0, 7.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07171630859375, -0.06943702697753906, -0.06715774536132812, -0.06487846374511719, -0.06259918212890625, -0.06031990051269531, -0.058040618896484375, -0.05576133728027344, -0.0534820556640625, -0.05120277404785156, -0.048923492431640625, -0.04664421081542969, -0.04436492919921875, -0.04208564758300781, -0.039806365966796875, -0.03752708435058594, -0.035247802734375, -0.03296852111816406, -0.030689239501953125, -0.028409957885742188, -0.02613067626953125, -0.023851394653320312, -0.021572113037109375, -0.019292831420898438, -0.0170135498046875, -0.014734268188476562, -0.012454986572265625, -0.010175704956054688, -0.00789642333984375, -0.0056171417236328125, -0.003337860107421875, -0.0010585784912109375, 0.001220703125, 0.0034999847412109375, 0.005779266357421875, 0.008058547973632812, 0.01033782958984375, 0.012617111206054688, 0.014896392822265625, 0.017175674438476562, 0.0194549560546875, 0.021734237670898438, 0.024013519287109375, 0.026292800903320312, 0.02857208251953125, 0.030851364135742188, 0.033130645751953125, 0.03540992736816406, 0.037689208984375, 0.03996849060058594, 0.042247772216796875, 0.04452705383300781, 0.04680633544921875, 0.04908561706542969, 0.051364898681640625, 0.05364418029785156, 0.0559234619140625, 0.05820274353027344, 0.060482025146484375, 0.06276130676269531, 0.06504058837890625, 0.06731986999511719, 0.06959915161132812, 0.07187843322753906, 0.07415771484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 15.0, 17.0, 19.0, 22.0, 38.0, 29.0, 60.0, 69.0, 130.0, 174.0, 120.0, 91.0, 33.0, 37.0, 32.0, 19.0, 16.0, 15.0, 16.0, 5.0, 6.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045440673828125, -0.04342031478881836, -0.04139995574951172, -0.03937959671020508, -0.03735923767089844, -0.0353388786315918, -0.033318519592285156, -0.031298160552978516, -0.029277801513671875, -0.027257442474365234, -0.025237083435058594, -0.023216724395751953, -0.021196365356445312, -0.019176006317138672, -0.01715564727783203, -0.01513528823852539, -0.01311492919921875, -0.01109457015991211, -0.009074211120605469, -0.007053852081298828, -0.0050334930419921875, -0.003013134002685547, -0.0009927749633789062, 0.0010275840759277344, 0.003047943115234375, 0.005068302154541016, 0.007088661193847656, 0.009109020233154297, 0.011129379272460938, 0.013149738311767578, 0.015170097351074219, 0.01719045639038086, 0.0192108154296875, 0.02123117446899414, 0.02325153350830078, 0.025271892547607422, 0.027292251586914062, 0.029312610626220703, 0.031332969665527344, 0.033353328704833984, 0.035373687744140625, 0.037394046783447266, 0.039414405822753906, 0.04143476486206055, 0.04345512390136719, 0.04547548294067383, 0.04749584197998047, 0.04951620101928711, 0.05153656005859375, 0.05355691909790039, 0.05557727813720703, 0.05759763717651367, 0.05961799621582031, 0.06163835525512695, 0.0636587142944336, 0.06567907333374023, 0.06769943237304688, 0.06971979141235352, 0.07174015045166016, 0.0737605094909668, 0.07578086853027344, 0.07780122756958008, 0.07982158660888672, 0.08184194564819336, 0.0838623046875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 6.0, 7.0, 13.0, 10.0, 30.0, 53.0, 74.0, 98.0, 218.0, 253.0, 107.0, 56.0, 33.0, 21.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6746373176574707, -1.6383001804351807, -1.6019630432128906, -1.5656259059906006, -1.5292887687683105, -1.492951512336731, -1.456614375114441, -1.4202772378921509, -1.3839401006698608, -1.3476029634475708, -1.3112658262252808, -1.2749286890029907, -1.2385914325714111, -1.202254295349121, -1.165917158126831, -1.129580020904541, -1.093242883682251, -1.056905746459961, -1.020568609237671, -0.9842314124107361, -0.947894275188446, -0.911557137966156, -0.8752199411392212, -0.8388828039169312, -0.8025456666946411, -0.7662085294723511, -0.729871392250061, -0.6935341954231262, -0.6571970582008362, -0.6208599209785461, -0.5845227241516113, -0.5481855869293213, -0.5118483304977417, -0.47551119327545166, -0.43917402625083923, -0.4028368592262268, -0.36649972200393677, -0.33016258478164673, -0.2938254177570343, -0.2574882507324219, -0.22115111351013184, -0.1848139613866806, -0.14847680926322937, -0.11213965713977814, -0.0758025050163269, -0.03946535289287567, -0.0031282007694244385, 0.03320896625518799, 0.06954610347747803, 0.10588325560092926, 0.1422204077243805, 0.17855755984783173, 0.21489471197128296, 0.251231849193573, 0.2875690162181854, 0.32390618324279785, 0.3602433204650879, 0.39658045768737793, 0.43291762471199036, 0.4692547917366028, 0.5055919289588928, 0.5419290661811829, 0.5782662630081177, 0.6146034002304077, 0.6509405374526978]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 3.0, 10.0, 11.0, 16.0, 18.0, 15.0, 29.0, 26.0, 21.0, 31.0, 33.0, 48.0, 48.0, 77.0, 145.0, 94.0, 64.0, 47.0, 38.0, 37.0, 28.0, 27.0, 15.0, 23.0, 13.0, 16.0, 16.0, 11.0, 6.0, 10.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.05391526222229, -1.0260175466537476, -0.9981198310852051, -0.9702221155166626, -0.9423243403434753, -0.9144266247749329, -0.8865289092063904, -0.8586311936378479, -0.8307334184646606, -0.8028357028961182, -0.7749379873275757, -0.7470402717590332, -0.719142496585846, -0.6912447810173035, -0.663347065448761, -0.6354493498802185, -0.607551634311676, -0.5796539187431335, -0.5517562031745911, -0.5238584280014038, -0.49596071243286133, -0.46806299686431885, -0.44016528129577637, -0.4122675657272339, -0.384369820356369, -0.35647210478782654, -0.32857435941696167, -0.3006766438484192, -0.2727789282798767, -0.24488118290901184, -0.21698346734046936, -0.18908573687076569, -0.161188006401062, -0.13329027593135834, -0.10539255291223526, -0.07749482989311218, -0.04959709942340851, -0.021699368953704834, 0.0061983466148376465, 0.03409607708454132, 0.061993807554244995, 0.08989153802394867, 0.11778926104307175, 0.14568698406219482, 0.1735847145318985, 0.20148244500160217, 0.22938016057014465, 0.2572779059410095, 0.285175621509552, 0.3130733370780945, 0.34097108244895935, 0.36886879801750183, 0.3967665433883667, 0.4246642589569092, 0.45256197452545166, 0.48045969009399414, 0.5083574056625366, 0.5362551212310791, 0.5641528367996216, 0.5920505523681641, 0.6199483275413513, 0.6478460431098938, 0.6757437586784363, 0.7036414742469788, 0.731539249420166]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 12.0, 14.0, 21.0, 21.0, 29.0, 39.0, 61.0, 92.0, 119.0, 188.0, 378.0, 631.0, 1122.0, 2246.0, 5522.0, 21402.0, 348205.0, 3584278.0, 203936.0, 16594.0, 4750.0, 2072.0, 980.0, 548.0, 348.0, 221.0, 134.0, 90.0, 64.0, 40.0, 22.0, 22.0, 22.0, 12.0, 12.0, 7.0, 6.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.1143331527709961, -0.11080741882324219, -0.10728168487548828, -0.10375595092773438, -0.10023021697998047, -0.09670448303222656, -0.09317874908447266, -0.08965301513671875, -0.08612728118896484, -0.08260154724121094, -0.07907581329345703, -0.07555007934570312, -0.07202434539794922, -0.06849861145019531, -0.0649728775024414, -0.0614471435546875, -0.057921409606933594, -0.05439567565917969, -0.05086994171142578, -0.047344207763671875, -0.04381847381591797, -0.04029273986816406, -0.036767005920410156, -0.03324127197265625, -0.029715538024902344, -0.026189804077148438, -0.02266407012939453, -0.019138336181640625, -0.015612602233886719, -0.012086868286132812, -0.008561134338378906, -0.005035400390625, -0.0015096664428710938, 0.0020160675048828125, 0.005541801452636719, 0.009067535400390625, 0.012593269348144531, 0.016119003295898438, 0.019644737243652344, 0.02317047119140625, 0.026696205139160156, 0.030221939086914062, 0.03374767303466797, 0.037273406982421875, 0.04079914093017578, 0.04432487487792969, 0.047850608825683594, 0.0513763427734375, 0.054902076721191406, 0.05842781066894531, 0.06195354461669922, 0.06547927856445312, 0.06900501251220703, 0.07253074645996094, 0.07605648040771484, 0.07958221435546875, 0.08310794830322266, 0.08663368225097656, 0.09015941619873047, 0.09368515014648438, 0.09721088409423828, 0.10073661804199219, 0.1042623519897461, 0.1077880859375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 15.0, 21.0, 25.0, 26.0, 27.0, 31.0, 41.0, 68.0, 59.0, 64.0, 53.0, 63.0, 74.0, 64.0, 50.0, 62.0, 46.0, 40.0, 38.0, 24.0, 27.0, 13.0, 17.0, 7.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048828125, -0.047373294830322266, -0.04591846466064453, -0.0444636344909668, -0.04300880432128906, -0.04155397415161133, -0.040099143981933594, -0.03864431381225586, -0.037189483642578125, -0.03573465347290039, -0.034279823303222656, -0.03282499313354492, -0.03137016296386719, -0.029915332794189453, -0.02846050262451172, -0.027005672454833984, -0.02555084228515625, -0.024096012115478516, -0.02264118194580078, -0.021186351776123047, -0.019731521606445312, -0.018276691436767578, -0.016821861267089844, -0.01536703109741211, -0.013912200927734375, -0.01245737075805664, -0.011002540588378906, -0.009547710418701172, -0.008092880249023438, -0.006638050079345703, -0.005183219909667969, -0.0037283897399902344, -0.0022735595703125, -0.0008187294006347656, 0.0006361007690429688, 0.002090930938720703, 0.0035457611083984375, 0.005000591278076172, 0.006455421447753906, 0.00791025161743164, 0.009365081787109375, 0.01081991195678711, 0.012274742126464844, 0.013729572296142578, 0.015184402465820312, 0.016639232635498047, 0.01809406280517578, 0.019548892974853516, 0.02100372314453125, 0.022458553314208984, 0.02391338348388672, 0.025368213653564453, 0.026823043823242188, 0.028277873992919922, 0.029732704162597656, 0.03118753433227539, 0.032642364501953125, 0.03409719467163086, 0.035552024841308594, 0.03700685501098633, 0.03846168518066406, 0.0399165153503418, 0.04137134552001953, 0.042826175689697266, 0.044281005859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 23.0, 37.0, 81.0, 171.0, 352.0, 618.0, 9957.0, 4180469.0, 1669.0, 447.0, 246.0, 121.0, 44.0, 19.0, 12.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1442718505859375, -1.108856201171875, -1.0734405517578125, -1.03802490234375, -1.0026092529296875, -0.967193603515625, -0.9317779541015625, -0.8963623046875, -0.8609466552734375, -0.825531005859375, -0.7901153564453125, -0.75469970703125, -0.7192840576171875, -0.683868408203125, -0.6484527587890625, -0.613037109375, -0.5776214599609375, -0.542205810546875, -0.5067901611328125, -0.47137451171875, -0.4359588623046875, -0.400543212890625, -0.3651275634765625, -0.3297119140625, -0.2942962646484375, -0.258880615234375, -0.2234649658203125, -0.18804931640625, -0.1526336669921875, -0.117218017578125, -0.0818023681640625, -0.04638671875, -0.0109710693359375, 0.024444580078125, 0.0598602294921875, 0.09527587890625, 0.1306915283203125, 0.166107177734375, 0.2015228271484375, 0.2369384765625, 0.2723541259765625, 0.307769775390625, 0.3431854248046875, 0.37860107421875, 0.4140167236328125, 0.449432373046875, 0.4848480224609375, 0.520263671875, 0.5556793212890625, 0.591094970703125, 0.6265106201171875, 0.66192626953125, 0.6973419189453125, 0.732757568359375, 0.7681732177734375, 0.8035888671875, 0.8390045166015625, 0.874420166015625, 0.9098358154296875, 0.94525146484375, 0.9806671142578125, 1.016082763671875, 1.0514984130859375, 1.0869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 17.0, 40.0, 180.0, 1595.0, 1898.0, 246.0, 64.0, 21.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7666015625, -0.7521457672119141, -0.7376899719238281, -0.7232341766357422, -0.7087783813476562, -0.6943225860595703, -0.6798667907714844, -0.6654109954833984, -0.6509552001953125, -0.6364994049072266, -0.6220436096191406, -0.6075878143310547, -0.5931320190429688, -0.5786762237548828, -0.5642204284667969, -0.5497646331787109, -0.535308837890625, -0.5208530426025391, -0.5063972473144531, -0.4919414520263672, -0.47748565673828125, -0.4630298614501953, -0.4485740661621094, -0.43411827087402344, -0.4196624755859375, -0.40520668029785156, -0.3907508850097656, -0.3762950897216797, -0.36183929443359375, -0.3473834991455078, -0.3329277038574219, -0.31847190856933594, -0.30401611328125, -0.28956031799316406, -0.2751045227050781, -0.2606487274169922, -0.24619293212890625, -0.2317371368408203, -0.21728134155273438, -0.20282554626464844, -0.1883697509765625, -0.17391395568847656, -0.15945816040039062, -0.1450023651123047, -0.13054656982421875, -0.11609077453613281, -0.10163497924804688, -0.08717918395996094, -0.072723388671875, -0.05826759338378906, -0.043811798095703125, -0.029356002807617188, -0.01490020751953125, -0.0004444122314453125, 0.014011383056640625, 0.028467178344726562, 0.0429229736328125, 0.05737876892089844, 0.07183456420898438, 0.08629035949707031, 0.10074615478515625, 0.11520195007324219, 0.12965774536132812, 0.14411354064941406, 0.1585693359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 2.0, 1.0, 8.0, 7.0, 15.0, 19.0, 21.0, 40.0, 94.0, 163.0, 286.0, 193.0, 86.0, 33.0, 18.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4946515560150146, -3.4040281772613525, -3.3134047985076904, -3.2227814197540283, -3.132158041000366, -3.041534900665283, -2.950911521911621, -2.860288143157959, -2.769664764404297, -2.6790413856506348, -2.5884180068969727, -2.4977946281433105, -2.4071712493896484, -2.3165478706359863, -2.225924491882324, -2.135301351547241, -2.044677734375, -1.954054355621338, -1.8634309768676758, -1.7728075981140137, -1.6821843385696411, -1.591560959815979, -1.500937581062317, -1.4103143215179443, -1.3196909427642822, -1.2290675640106201, -1.138444185256958, -1.047820806503296, -0.9571975469589233, -0.8665741682052612, -0.7759507894515991, -0.6853274703025818, -0.5947041511535645, -0.5040807723999023, -0.413457453250885, -0.3228340744972229, -0.23221072554588318, -0.14158737659454346, -0.05096399784088135, 0.039659321308135986, 0.1302827000617981, 0.22090604901313782, 0.31152939796447754, 0.40215277671813965, 0.49277612566947937, 0.5833994746208191, 0.6740228533744812, 0.7646461725234985, 0.8552695512771606, 0.9458929300308228, 1.0365163087844849, 1.1271395683288574, 1.2177629470825195, 1.3083863258361816, 1.3990097045898438, 1.4896330833435059, 1.580256462097168, 1.67087984085083, 1.7615032196044922, 1.8521265983581543, 1.9427498579025269, 2.0333733558654785, 2.1239967346191406, 2.2146198749542236, 2.3052432537078857]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 8.0, 7.0, 4.0, 9.0, 15.0, 14.0, 30.0, 24.0, 21.0, 34.0, 54.0, 46.0, 46.0, 64.0, 62.0, 56.0, 60.0, 63.0, 48.0, 51.0, 32.0, 51.0, 32.0, 36.0, 21.0, 26.0, 18.0, 11.0, 10.0, 6.0, 8.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0613040924072266, -1.0201447010040283, -0.9789851903915405, -0.9378257393836975, -0.8966662883758545, -0.8555068969726562, -0.8143474459648132, -0.7731879949569702, -0.7320285439491272, -0.6908690929412842, -0.6497096419334412, -0.6085501909255981, -0.5673907995223999, -0.5262312889099121, -0.48507189750671387, -0.44391244649887085, -0.40275299549102783, -0.3615935444831848, -0.3204340934753418, -0.27927467226982117, -0.23811522126197815, -0.19695577025413513, -0.1557963341474533, -0.11463689804077148, -0.07347744703292847, -0.032318003475666046, 0.008841440081596375, 0.050000883638858795, 0.09116032719612122, 0.13231977820396423, 0.17347921431064606, 0.21463865041732788, 0.25579798221588135, 0.29695743322372437, 0.3381168842315674, 0.379276305437088, 0.42043575644493103, 0.46159520745277405, 0.5027546286582947, 0.5439140796661377, 0.5850735306739807, 0.6262329816818237, 0.6673924326896667, 0.7085518836975098, 0.749711275100708, 0.7908707857131958, 0.832030177116394, 0.8731896281242371, 0.9143490791320801, 0.9555085301399231, 0.9966679811477661, 1.0378273725509644, 1.0789868831634521, 1.1201462745666504, 1.1613057851791382, 1.2024651765823364, 1.2436246871948242, 1.2847840785980225, 1.3259435892105103, 1.3671029806137085, 1.4082624912261963, 1.4494218826293945, 1.4905813932418823, 1.5317407846450806, 1.5729001760482788]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 12.0, 25.0, 11.0, 26.0, 37.0, 67.0, 90.0, 122.0, 155.0, 230.0, 329.0, 451.0, 692.0, 1018.0, 1738.0, 2803.0, 5004.0, 9868.0, 21528.0, 55197.0, 186040.0, 486226.0, 179293.0, 54076.0, 21162.0, 9689.0, 4997.0, 2786.0, 1608.0, 1023.0, 693.0, 445.0, 344.0, 212.0, 155.0, 111.0, 77.0, 68.0, 40.0, 18.0, 20.0, 15.0, 16.0, 10.0, 7.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10028076171875, -0.09687995910644531, -0.09347915649414062, -0.09007835388183594, -0.08667755126953125, -0.08327674865722656, -0.07987594604492188, -0.07647514343261719, -0.0730743408203125, -0.06967353820800781, -0.06627273559570312, -0.06287193298339844, -0.05947113037109375, -0.05607032775878906, -0.052669525146484375, -0.04926872253417969, -0.045867919921875, -0.04246711730957031, -0.039066314697265625, -0.03566551208496094, -0.03226470947265625, -0.028863906860351562, -0.025463104248046875, -0.022062301635742188, -0.0186614990234375, -0.015260696411132812, -0.011859893798828125, -0.008459091186523438, -0.00505828857421875, -0.0016574859619140625, 0.001743316650390625, 0.0051441192626953125, 0.008544921875, 0.011945724487304688, 0.015346527099609375, 0.018747329711914062, 0.02214813232421875, 0.025548934936523438, 0.028949737548828125, 0.03235054016113281, 0.0357513427734375, 0.03915214538574219, 0.042552947998046875, 0.04595375061035156, 0.04935455322265625, 0.05275535583496094, 0.056156158447265625, 0.05955696105957031, 0.062957763671875, 0.06635856628417969, 0.06975936889648438, 0.07316017150878906, 0.07656097412109375, 0.07996177673339844, 0.08336257934570312, 0.08676338195800781, 0.0901641845703125, 0.09356498718261719, 0.09696578979492188, 0.10036659240722656, 0.10376739501953125, 0.10716819763183594, 0.11056900024414062, 0.11396980285644531, 0.11737060546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 5.0, 5.0, 13.0, 8.0, 9.0, 13.0, 13.0, 21.0, 16.0, 32.0, 26.0, 30.0, 26.0, 47.0, 42.0, 58.0, 47.0, 46.0, 60.0, 53.0, 57.0, 44.0, 47.0, 38.0, 38.0, 38.0, 26.0, 15.0, 20.0, 10.0, 21.0, 11.0, 8.0, 11.0, 9.0, 8.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06280517578125, -0.06068229675292969, -0.058559417724609375, -0.05643653869628906, -0.05431365966796875, -0.05219078063964844, -0.050067901611328125, -0.04794502258300781, -0.0458221435546875, -0.04369926452636719, -0.041576385498046875, -0.03945350646972656, -0.03733062744140625, -0.03520774841308594, -0.033084869384765625, -0.030961990356445312, -0.028839111328125, -0.026716232299804688, -0.024593353271484375, -0.022470474243164062, -0.02034759521484375, -0.018224716186523438, -0.016101837158203125, -0.013978958129882812, -0.0118560791015625, -0.009733200073242188, -0.007610321044921875, -0.0054874420166015625, -0.00336456298828125, -0.0012416839599609375, 0.000881195068359375, 0.0030040740966796875, 0.005126953125, 0.0072498321533203125, 0.009372711181640625, 0.011495590209960938, 0.01361846923828125, 0.015741348266601562, 0.017864227294921875, 0.019987106323242188, 0.0221099853515625, 0.024232864379882812, 0.026355743408203125, 0.028478622436523438, 0.03060150146484375, 0.03272438049316406, 0.034847259521484375, 0.03697013854980469, 0.039093017578125, 0.04121589660644531, 0.043338775634765625, 0.04546165466308594, 0.04758453369140625, 0.04970741271972656, 0.051830291748046875, 0.05395317077636719, 0.0560760498046875, 0.05819892883300781, 0.060321807861328125, 0.06244468688964844, 0.06456756591796875, 0.06669044494628906, 0.06881332397460938, 0.07093620300292969, 0.07305908203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 6.0, 2.0, 9.0, 7.0, 13.0, 17.0, 22.0, 25.0, 56.0, 74.0, 98.0, 170.0, 312.0, 554.0, 1373.0, 4868.0, 49796.0, 955268.0, 29729.0, 3753.0, 1130.0, 478.0, 266.0, 181.0, 99.0, 66.0, 50.0, 31.0, 24.0, 10.0, 14.0, 16.0, 5.0, 6.0, 1.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.496337890625, -0.4800224304199219, -0.46370697021484375, -0.4473915100097656, -0.4310760498046875, -0.4147605895996094, -0.39844512939453125, -0.3821296691894531, -0.365814208984375, -0.3494987487792969, -0.33318328857421875, -0.3168678283691406, -0.3005523681640625, -0.2842369079589844, -0.26792144775390625, -0.2516059875488281, -0.23529052734375, -0.21897506713867188, -0.20265960693359375, -0.18634414672851562, -0.1700286865234375, -0.15371322631835938, -0.13739776611328125, -0.12108230590820312, -0.104766845703125, -0.08845138549804688, -0.07213592529296875, -0.055820465087890625, -0.0395050048828125, -0.023189544677734375, -0.00687408447265625, 0.009441375732421875, 0.0257568359375, 0.042072296142578125, 0.05838775634765625, 0.07470321655273438, 0.0910186767578125, 0.10733413696289062, 0.12364959716796875, 0.13996505737304688, 0.156280517578125, 0.17259597778320312, 0.18891143798828125, 0.20522689819335938, 0.2215423583984375, 0.23785781860351562, 0.25417327880859375, 0.2704887390136719, 0.28680419921875, 0.3031196594238281, 0.31943511962890625, 0.3357505798339844, 0.3520660400390625, 0.3683815002441406, 0.38469696044921875, 0.4010124206542969, 0.417327880859375, 0.4336433410644531, 0.44995880126953125, 0.4662742614746094, 0.4825897216796875, 0.4989051818847656, 0.5152206420898438, 0.5315361022949219, 0.5478515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 5.0, 10.0, 8.0, 18.0, 22.0, 24.0, 28.0, 40.0, 56.0, 64.0, 63.0, 98.0, 84.0, 92.0, 72.0, 60.0, 56.0, 49.0, 26.0, 26.0, 23.0, 18.0, 13.0, 3.0, 11.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4537162780761719, -0.43795013427734375, -0.4221839904785156, -0.4064178466796875, -0.3906517028808594, -0.37488555908203125, -0.3591194152832031, -0.343353271484375, -0.3275871276855469, -0.31182098388671875, -0.2960548400878906, -0.2802886962890625, -0.2645225524902344, -0.24875640869140625, -0.23299026489257812, -0.21722412109375, -0.20145797729492188, -0.18569183349609375, -0.16992568969726562, -0.1541595458984375, -0.13839340209960938, -0.12262725830078125, -0.10686111450195312, -0.091094970703125, -0.07532882690429688, -0.05956268310546875, -0.043796539306640625, -0.0280303955078125, -0.012264251708984375, 0.00350189208984375, 0.019268035888671875, 0.0350341796875, 0.050800323486328125, 0.06656646728515625, 0.08233261108398438, 0.0980987548828125, 0.11386489868164062, 0.12963104248046875, 0.14539718627929688, 0.161163330078125, 0.17692947387695312, 0.19269561767578125, 0.20846176147460938, 0.2242279052734375, 0.23999404907226562, 0.25576019287109375, 0.2715263366699219, 0.28729248046875, 0.3030586242675781, 0.31882476806640625, 0.3345909118652344, 0.3503570556640625, 0.3661231994628906, 0.38188934326171875, 0.3976554870605469, 0.413421630859375, 0.4291877746582031, 0.44495391845703125, 0.4607200622558594, 0.4764862060546875, 0.4922523498535156, 0.5080184936523438, 0.5237846374511719, 0.53955078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 20.0, 18.0, 32.0, 73.0, 119.0, 271.0, 574.0, 1520.0, 4497.0, 22546.0, 899880.0, 105017.0, 9657.0, 2537.0, 930.0, 398.0, 200.0, 102.0, 63.0, 34.0, 23.0, 9.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15123748779296875, -0.1459808349609375, -0.14072418212890625, -0.135467529296875, -0.13021087646484375, -0.1249542236328125, -0.11969757080078125, -0.11444091796875, -0.10918426513671875, -0.1039276123046875, -0.09867095947265625, -0.093414306640625, -0.08815765380859375, -0.0829010009765625, -0.07764434814453125, -0.0723876953125, -0.06713104248046875, -0.0618743896484375, -0.05661773681640625, -0.051361083984375, -0.04610443115234375, -0.0408477783203125, -0.03559112548828125, -0.03033447265625, -0.02507781982421875, -0.0198211669921875, -0.01456451416015625, -0.009307861328125, -0.00405120849609375, 0.0012054443359375, 0.00646209716796875, 0.01171875, 0.01697540283203125, 0.0222320556640625, 0.02748870849609375, 0.032745361328125, 0.03800201416015625, 0.0432586669921875, 0.04851531982421875, 0.05377197265625, 0.05902862548828125, 0.0642852783203125, 0.06954193115234375, 0.074798583984375, 0.08005523681640625, 0.0853118896484375, 0.09056854248046875, 0.0958251953125, 0.10108184814453125, 0.1063385009765625, 0.11159515380859375, 0.116851806640625, 0.12210845947265625, 0.1273651123046875, 0.13262176513671875, 0.13787841796875, 0.14313507080078125, 0.1483917236328125, 0.15364837646484375, 0.158905029296875, 0.16416168212890625, 0.1694183349609375, 0.17467498779296875, 0.179931640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 15.0, 18.0, 21.0, 25.0, 32.0, 53.0, 107.0, 129.0, 153.0, 120.0, 88.0, 58.0, 41.0, 28.0, 23.0, 15.0, 12.0, 12.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68952751159668e-05, -3.550667315721512e-05, -3.411807119846344e-05, -3.272946923971176e-05, -3.134086728096008e-05, -2.9952265322208405e-05, -2.8563663363456726e-05, -2.7175061404705048e-05, -2.578645944595337e-05, -2.439785748720169e-05, -2.3009255528450012e-05, -2.1620653569698334e-05, -2.0232051610946655e-05, -1.8843449652194977e-05, -1.74548476934433e-05, -1.606624573469162e-05, -1.4677643775939941e-05, -1.3289041817188263e-05, -1.1900439858436584e-05, -1.0511837899684906e-05, -9.123235940933228e-06, -7.734633982181549e-06, -6.346032023429871e-06, -4.957430064678192e-06, -3.5688281059265137e-06, -2.180226147174835e-06, -7.916241884231567e-07, 5.969777703285217e-07, 1.9855797290802e-06, 3.3741816878318787e-06, 4.762783646583557e-06, 6.151385605335236e-06, 7.539987564086914e-06, 8.928589522838593e-06, 1.0317191481590271e-05, 1.170579344034195e-05, 1.3094395399093628e-05, 1.4482997357845306e-05, 1.5871599316596985e-05, 1.7260201275348663e-05, 1.8648803234100342e-05, 2.003740519285202e-05, 2.14260071516037e-05, 2.2814609110355377e-05, 2.4203211069107056e-05, 2.5591813027858734e-05, 2.6980414986610413e-05, 2.836901694536209e-05, 2.975761890411377e-05, 3.114622086286545e-05, 3.2534822821617126e-05, 3.3923424780368805e-05, 3.5312026739120483e-05, 3.670062869787216e-05, 3.808923065662384e-05, 3.947783261537552e-05, 4.08664345741272e-05, 4.2255036532878876e-05, 4.3643638491630554e-05, 4.503224045038223e-05, 4.642084240913391e-05, 4.780944436788559e-05, 4.919804632663727e-05, 5.0586648285388947e-05, 5.1975250244140625e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 10.0, 5.0, 12.0, 16.0, 22.0, 29.0, 49.0, 82.0, 155.0, 315.0, 659.0, 1737.0, 6466.0, 56793.0, 931168.0, 42566.0, 5593.0, 1601.0, 616.0, 245.0, 137.0, 95.0, 68.0, 27.0, 27.0, 13.0, 11.0, 5.0, 5.0, 9.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14697265625, -0.14229965209960938, -0.13762664794921875, -0.13295364379882812, -0.1282806396484375, -0.12360763549804688, -0.11893463134765625, -0.11426162719726562, -0.109588623046875, -0.10491561889648438, -0.10024261474609375, -0.09556961059570312, -0.0908966064453125, -0.08622360229492188, -0.08155059814453125, -0.07687759399414062, -0.07220458984375, -0.06753158569335938, -0.06285858154296875, -0.058185577392578125, -0.0535125732421875, -0.048839569091796875, -0.04416656494140625, -0.039493560791015625, -0.034820556640625, -0.030147552490234375, -0.02547454833984375, -0.020801544189453125, -0.0161285400390625, -0.011455535888671875, -0.00678253173828125, -0.002109527587890625, 0.0025634765625, 0.007236480712890625, 0.01190948486328125, 0.016582489013671875, 0.0212554931640625, 0.025928497314453125, 0.03060150146484375, 0.035274505615234375, 0.039947509765625, 0.044620513916015625, 0.04929351806640625, 0.053966522216796875, 0.0586395263671875, 0.06331253051757812, 0.06798553466796875, 0.07265853881835938, 0.07733154296875, 0.08200454711914062, 0.08667755126953125, 0.09135055541992188, 0.0960235595703125, 0.10069656372070312, 0.10536956787109375, 0.11004257202148438, 0.114715576171875, 0.11938858032226562, 0.12406158447265625, 0.12873458862304688, 0.1334075927734375, 0.13808059692382812, 0.14275360107421875, 0.14742660522460938, 0.152099609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 12.0, 7.0, 19.0, 16.0, 38.0, 42.0, 73.0, 115.0, 153.0, 159.0, 106.0, 67.0, 52.0, 29.0, 24.0, 24.0, 12.0, 7.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10614013671875, -0.10260581970214844, -0.09907150268554688, -0.09553718566894531, -0.09200286865234375, -0.08846855163574219, -0.08493423461914062, -0.08139991760253906, -0.0778656005859375, -0.07433128356933594, -0.07079696655273438, -0.06726264953613281, -0.06372833251953125, -0.06019401550292969, -0.056659698486328125, -0.05312538146972656, -0.049591064453125, -0.04605674743652344, -0.042522430419921875, -0.03898811340332031, -0.03545379638671875, -0.03191947937011719, -0.028385162353515625, -0.024850845336914062, -0.0213165283203125, -0.017782211303710938, -0.014247894287109375, -0.010713577270507812, -0.00717926025390625, -0.0036449432373046875, -0.000110626220703125, 0.0034236907958984375, 0.0069580078125, 0.010492324829101562, 0.014026641845703125, 0.017560958862304688, 0.02109527587890625, 0.024629592895507812, 0.028163909912109375, 0.03169822692871094, 0.0352325439453125, 0.03876686096191406, 0.042301177978515625, 0.04583549499511719, 0.04936981201171875, 0.05290412902832031, 0.056438446044921875, 0.05997276306152344, 0.063507080078125, 0.06704139709472656, 0.07057571411132812, 0.07411003112792969, 0.07764434814453125, 0.08117866516113281, 0.08471298217773438, 0.08824729919433594, 0.0917816162109375, 0.09531593322753906, 0.09885025024414062, 0.10238456726074219, 0.10591888427734375, 0.10945320129394531, 0.11298751831054688, 0.11652183532714844, 0.12005615234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 22.0, 50.0, 140.0, 549.0, 165.0, 45.0, 20.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.825005531311035, -6.671842575073242, -6.518679141998291, -6.365516185760498, -6.212352752685547, -6.059189796447754, -5.906026363372803, -5.75286340713501, -5.599699974060059, -5.446537017822266, -5.2933735847473145, -5.1402106285095215, -4.98704719543457, -4.833884239196777, -4.680720806121826, -4.527557849884033, -4.374394416809082, -4.221231460571289, -4.068068027496338, -3.914904832839966, -3.7617416381835938, -3.6085784435272217, -3.4554152488708496, -3.3022522926330566, -3.1490893363952637, -2.9959261417388916, -2.8427629470825195, -2.6895997524261475, -2.5364365577697754, -2.3832733631134033, -2.2301101684570312, -2.0769472122192383, -1.923783540725708, -1.770620346069336, -1.6174571514129639, -1.4642939567565918, -1.3111307621002197, -1.1579675674438477, -1.0048044919967651, -0.8516412973403931, -0.698478102684021, -0.5453149080276489, -0.39215174317359924, -0.23898857831954956, -0.08582538366317749, 0.06733781099319458, 0.22050094604492188, 0.37366414070129395, 0.526827335357666, 0.6799905300140381, 0.8331537246704102, 0.9863168597221375, 1.1394801139831543, 1.2926433086395264, 1.4458063840866089, 1.598969578742981, 1.752132773399353, 1.905295968055725, 2.0584590435028076, 2.2116222381591797, 2.3647854328155518, 2.517948627471924, 2.671111822128296, 2.824275016784668, 2.97743821144104]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 11.0, 9.0, 16.0, 17.0, 17.0, 24.0, 27.0, 31.0, 24.0, 40.0, 33.0, 49.0, 117.0, 214.0, 64.0, 28.0, 31.0, 25.0, 30.0, 27.0, 21.0, 18.0, 15.0, 15.0, 13.0, 9.0, 16.0, 8.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.399120330810547, -2.3268136978149414, -2.254506826400757, -2.1821999549865723, -2.109893321990967, -2.0375866889953613, -1.9652798175811768, -1.8929730653762817, -1.8206663131713867, -1.7483595609664917, -1.6760528087615967, -1.6037460565567017, -1.5314393043518066, -1.4591325521469116, -1.3868257999420166, -1.3145190477371216, -1.2422122955322266, -1.1699055433273315, -1.0975987911224365, -1.0252920389175415, -0.9529852867126465, -0.8806785345077515, -0.8083717823028564, -0.7360650300979614, -0.6637582778930664, -0.5914515256881714, -0.5191447734832764, -0.44683802127838135, -0.37453126907348633, -0.3022245168685913, -0.2299177646636963, -0.15761101245880127, -0.08530449867248535, -0.012997746467590332, 0.05930900573730469, 0.1316157579421997, 0.20392251014709473, 0.27622926235198975, 0.34853601455688477, 0.4208427667617798, 0.4931495189666748, 0.5654562711715698, 0.6377630233764648, 0.7100697755813599, 0.7823765277862549, 0.8546832799911499, 0.9269900321960449, 0.9992967844009399, 1.071603536605835, 1.14391028881073, 1.216217041015625, 1.28852379322052, 1.360830545425415, 1.43313729763031, 1.505444049835205, 1.5777508020401, 1.6500575542449951, 1.7223643064498901, 1.7946710586547852, 1.8669778108596802, 1.9392845630645752, 2.0115914344787598, 2.0838980674743652, 2.1562047004699707, 2.2285115718841553]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 6.0, 4.0, 17.0, 12.0, 26.0, 40.0, 53.0, 59.0, 82.0, 130.0, 180.0, 257.0, 413.0, 627.0, 996.0, 1722.0, 2918.0, 5516.0, 12986.0, 38604.0, 170862.0, 963096.0, 2280599.0, 555697.0, 108445.0, 29483.0, 10265.0, 4664.0, 2480.0, 1413.0, 919.0, 551.0, 337.0, 255.0, 173.0, 111.0, 87.0, 48.0, 40.0, 25.0, 29.0, 17.0, 8.0, 9.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0904541015625, -0.08726310729980469, -0.08407211303710938, -0.08088111877441406, -0.07769012451171875, -0.07449913024902344, -0.07130813598632812, -0.06811714172363281, -0.0649261474609375, -0.06173515319824219, -0.058544158935546875, -0.05535316467285156, -0.05216217041015625, -0.04897117614746094, -0.045780181884765625, -0.04258918762207031, -0.039398193359375, -0.03620719909667969, -0.033016204833984375, -0.029825210571289062, -0.02663421630859375, -0.023443222045898438, -0.020252227783203125, -0.017061233520507812, -0.0138702392578125, -0.010679244995117188, -0.007488250732421875, -0.0042972564697265625, -0.00110626220703125, 0.0020847320556640625, 0.005275726318359375, 0.008466720581054688, 0.01165771484375, 0.014848709106445312, 0.018039703369140625, 0.021230697631835938, 0.02442169189453125, 0.027612686157226562, 0.030803680419921875, 0.03399467468261719, 0.0371856689453125, 0.04037666320800781, 0.043567657470703125, 0.04675865173339844, 0.04994964599609375, 0.05314064025878906, 0.056331634521484375, 0.05952262878417969, 0.062713623046875, 0.06590461730957031, 0.06909561157226562, 0.07228660583496094, 0.07547760009765625, 0.07866859436035156, 0.08185958862304688, 0.08505058288574219, 0.0882415771484375, 0.09143257141113281, 0.09462356567382812, 0.09781455993652344, 0.10100555419921875, 0.10419654846191406, 0.10738754272460938, 0.11057853698730469, 0.11376953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 11.0, 4.0, 9.0, 8.0, 10.0, 15.0, 24.0, 26.0, 32.0, 41.0, 30.0, 60.0, 57.0, 53.0, 51.0, 67.0, 69.0, 69.0, 61.0, 38.0, 48.0, 39.0, 32.0, 20.0, 27.0, 17.0, 15.0, 14.0, 8.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08648681640625, -0.0839090347290039, -0.08133125305175781, -0.07875347137451172, -0.07617568969726562, -0.07359790802001953, -0.07102012634277344, -0.06844234466552734, -0.06586456298828125, -0.06328678131103516, -0.06070899963378906, -0.05813121795654297, -0.055553436279296875, -0.05297565460205078, -0.05039787292480469, -0.047820091247558594, -0.0452423095703125, -0.042664527893066406, -0.04008674621582031, -0.03750896453857422, -0.034931182861328125, -0.03235340118408203, -0.029775619506835938, -0.027197837829589844, -0.02462005615234375, -0.022042274475097656, -0.019464492797851562, -0.01688671112060547, -0.014308929443359375, -0.011731147766113281, -0.009153366088867188, -0.006575584411621094, -0.003997802734375, -0.0014200210571289062, 0.0011577606201171875, 0.0037355422973632812, 0.006313323974609375, 0.008891105651855469, 0.011468887329101562, 0.014046669006347656, 0.01662445068359375, 0.019202232360839844, 0.021780014038085938, 0.02435779571533203, 0.026935577392578125, 0.02951335906982422, 0.03209114074707031, 0.034668922424316406, 0.0372467041015625, 0.039824485778808594, 0.04240226745605469, 0.04498004913330078, 0.047557830810546875, 0.05013561248779297, 0.05271339416503906, 0.055291175842285156, 0.05786895751953125, 0.060446739196777344, 0.06302452087402344, 0.06560230255126953, 0.06818008422851562, 0.07075786590576172, 0.07333564758300781, 0.0759134292602539, 0.0784912109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 10.0, 6.0, 10.0, 13.0, 28.0, 42.0, 61.0, 96.0, 229.0, 587.0, 2466.0, 3820410.0, 367379.0, 1961.0, 483.0, 222.0, 110.0, 71.0, 31.0, 23.0, 15.0, 9.0, 11.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.264129638671875, -1.22454833984375, -1.184967041015625, -1.1453857421875, -1.105804443359375, -1.06622314453125, -1.026641845703125, -0.987060546875, -0.947479248046875, -0.90789794921875, -0.868316650390625, -0.8287353515625, -0.789154052734375, -0.74957275390625, -0.709991455078125, -0.67041015625, -0.630828857421875, -0.59124755859375, -0.551666259765625, -0.5120849609375, -0.472503662109375, -0.43292236328125, -0.393341064453125, -0.353759765625, -0.314178466796875, -0.27459716796875, -0.235015869140625, -0.1954345703125, -0.155853271484375, -0.11627197265625, -0.076690673828125, -0.037109375, 0.002471923828125, 0.04205322265625, 0.081634521484375, 0.1212158203125, 0.160797119140625, 0.20037841796875, 0.239959716796875, 0.279541015625, 0.319122314453125, 0.35870361328125, 0.398284912109375, 0.4378662109375, 0.477447509765625, 0.51702880859375, 0.556610107421875, 0.59619140625, 0.635772705078125, 0.67535400390625, 0.714935302734375, 0.7545166015625, 0.794097900390625, 0.83367919921875, 0.873260498046875, 0.912841796875, 0.952423095703125, 0.99200439453125, 1.031585693359375, 1.0711669921875, 1.110748291015625, 1.15032958984375, 1.189910888671875, 1.2294921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 33.0, 109.0, 433.0, 2218.0, 968.0, 226.0, 64.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.001953125, -0.973114013671875, -0.94427490234375, -0.915435791015625, -0.8865966796875, -0.857757568359375, -0.82891845703125, -0.800079345703125, -0.771240234375, -0.742401123046875, -0.71356201171875, -0.684722900390625, -0.6558837890625, -0.627044677734375, -0.59820556640625, -0.569366455078125, -0.54052734375, -0.511688232421875, -0.48284912109375, -0.454010009765625, -0.4251708984375, -0.396331787109375, -0.36749267578125, -0.338653564453125, -0.309814453125, -0.280975341796875, -0.25213623046875, -0.223297119140625, -0.1944580078125, -0.165618896484375, -0.13677978515625, -0.107940673828125, -0.0791015625, -0.050262451171875, -0.02142333984375, 0.007415771484375, 0.0362548828125, 0.065093994140625, 0.09393310546875, 0.122772216796875, 0.151611328125, 0.180450439453125, 0.20928955078125, 0.238128662109375, 0.2669677734375, 0.295806884765625, 0.32464599609375, 0.353485107421875, 0.38232421875, 0.411163330078125, 0.44000244140625, 0.468841552734375, 0.4976806640625, 0.526519775390625, 0.55535888671875, 0.584197998046875, 0.613037109375, 0.641876220703125, 0.67071533203125, 0.699554443359375, 0.7283935546875, 0.757232666015625, 0.78607177734375, 0.814910888671875, 0.84375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 8.0, 8.0, 25.0, 20.0, 36.0, 78.0, 134.0, 206.0, 182.0, 122.0, 71.0, 39.0, 19.0, 8.0, 11.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.041259765625, -3.939580202102661, -3.837900400161743, -3.7362208366394043, -3.6345412731170654, -3.5328617095947266, -3.4311819076538086, -3.3295023441314697, -3.227822780609131, -3.126143217086792, -3.024463415145874, -2.922783851623535, -2.8211042881011963, -2.7194247245788574, -2.6177449226379395, -2.5160653591156006, -2.4143855571746826, -2.3127059936523438, -2.211026191711426, -2.109346628189087, -2.007667064666748, -1.9059873819351196, -1.8043076992034912, -1.7026281356811523, -1.600948452949524, -1.4992687702178955, -1.3975892066955566, -1.2959095239639282, -1.1942298412322998, -1.092550277709961, -0.9908705949783325, -0.8891909718513489, -0.7875111103057861, -0.6858314871788025, -0.5841518640518188, -0.48247218132019043, -0.3807925581932068, -0.27911293506622314, -0.17743325233459473, -0.07575362920761108, 0.02592599391937256, 0.1276056319475174, 0.22928526997566223, 0.33096492290496826, 0.4326445460319519, 0.5343241691589355, 0.636003851890564, 0.7376834750175476, 0.8393630981445312, 0.9410427212715149, 1.0427223443984985, 1.144402027130127, 1.2460815906524658, 1.3477612733840942, 1.4494409561157227, 1.5511205196380615, 1.65280020236969, 1.7544798851013184, 1.8561594486236572, 1.9578391313552856, 2.059518814086914, 2.161198377609253, 2.262877941131592, 2.3645577430725098, 2.4662373065948486]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 8.0, 9.0, 11.0, 33.0, 33.0, 37.0, 50.0, 63.0, 56.0, 79.0, 91.0, 94.0, 70.0, 49.0, 46.0, 38.0, 53.0, 34.0, 30.0, 19.0, 20.0, 13.0, 16.0, 12.0, 9.0, 9.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.935934066772461, -1.8644180297851562, -1.792901873588562, -1.7213858366012573, -1.649869680404663, -1.5783536434173584, -1.5068376064300537, -1.435321569442749, -1.3638054132461548, -1.29228937625885, -1.2207732200622559, -1.1492571830749512, -1.0777411460876465, -1.0062249898910522, -0.9347089529037476, -0.8631928563117981, -0.7916767597198486, -0.7201606631278992, -0.6486445665359497, -0.577128529548645, -0.5056124329566956, -0.4340963363647461, -0.362580269575119, -0.29106420278549194, -0.21954810619354248, -0.1480320245027542, -0.07651594281196594, -0.004999861121177673, 0.0665162205696106, 0.13803231716156006, 0.20954838395118713, 0.2810644507408142, 0.35258054733276367, 0.42409664392471313, 0.4956127107143402, 0.5671287775039673, 0.6386448740959167, 0.7101609706878662, 0.7816770076751709, 0.8531931042671204, 0.9247092008590698, 0.9962252974510193, 1.0677413940429688, 1.1392574310302734, 1.2107734680175781, 1.2822896242141724, 1.353805661201477, 1.4253218173980713, 1.496837854385376, 1.5683538913726807, 1.639870047569275, 1.7113860845565796, 1.7829022407531738, 1.8544182777404785, 1.9259343147277832, 1.997450351715088, 2.0689663887023926, 2.1404824256896973, 2.211998462677002, 2.2835147380828857, 2.3550307750701904, 2.426546812057495, 2.4980628490448, 2.5695788860321045, 2.6410951614379883]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 14.0, 11.0, 23.0, 46.0, 64.0, 115.0, 193.0, 415.0, 893.0, 2108.0, 6254.0, 25017.0, 202503.0, 745525.0, 49359.0, 10341.0, 3252.0, 1233.0, 558.0, 275.0, 142.0, 93.0, 38.0, 28.0, 14.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26259803771972656, -0.2546882629394531, -0.2467784881591797, -0.23886871337890625, -0.2309589385986328, -0.22304916381835938, -0.21513938903808594, -0.2072296142578125, -0.19931983947753906, -0.19141006469726562, -0.1835002899169922, -0.17559051513671875, -0.1676807403564453, -0.15977096557617188, -0.15186119079589844, -0.143951416015625, -0.13604164123535156, -0.12813186645507812, -0.12022209167480469, -0.11231231689453125, -0.10440254211425781, -0.09649276733398438, -0.08858299255371094, -0.0806732177734375, -0.07276344299316406, -0.06485366821289062, -0.05694389343261719, -0.04903411865234375, -0.04112434387207031, -0.033214569091796875, -0.025304794311523438, -0.01739501953125, -0.009485244750976562, -0.001575469970703125, 0.0063343048095703125, 0.01424407958984375, 0.022153854370117188, 0.030063629150390625, 0.03797340393066406, 0.0458831787109375, 0.05379295349121094, 0.061702728271484375, 0.06961250305175781, 0.07752227783203125, 0.08543205261230469, 0.09334182739257812, 0.10125160217285156, 0.109161376953125, 0.11707115173339844, 0.12498092651367188, 0.1328907012939453, 0.14080047607421875, 0.1487102508544922, 0.15662002563476562, 0.16452980041503906, 0.1724395751953125, 0.18034934997558594, 0.18825912475585938, 0.1961688995361328, 0.20407867431640625, 0.2119884490966797, 0.21989822387695312, 0.22780799865722656, 0.2357177734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 11.0, 9.0, 17.0, 26.0, 24.0, 31.0, 22.0, 50.0, 61.0, 53.0, 67.0, 63.0, 75.0, 78.0, 47.0, 44.0, 54.0, 52.0, 31.0, 37.0, 37.0, 20.0, 14.0, 15.0, 6.0, 14.0, 3.0, 8.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1383056640625, -0.1346292495727539, -0.1309528350830078, -0.12727642059326172, -0.12360000610351562, -0.11992359161376953, -0.11624717712402344, -0.11257076263427734, -0.10889434814453125, -0.10521793365478516, -0.10154151916503906, -0.09786510467529297, -0.09418869018554688, -0.09051227569580078, -0.08683586120605469, -0.0831594467163086, -0.0794830322265625, -0.0758066177368164, -0.07213020324707031, -0.06845378875732422, -0.06477737426757812, -0.06110095977783203, -0.05742454528808594, -0.053748130798339844, -0.05007171630859375, -0.046395301818847656, -0.04271888732910156, -0.03904247283935547, -0.035366058349609375, -0.03168964385986328, -0.028013229370117188, -0.024336814880371094, -0.020660400390625, -0.016983985900878906, -0.013307571411132812, -0.009631156921386719, -0.005954742431640625, -0.0022783279418945312, 0.0013980865478515625, 0.005074501037597656, 0.00875091552734375, 0.012427330017089844, 0.016103744506835938, 0.01978015899658203, 0.023456573486328125, 0.02713298797607422, 0.030809402465820312, 0.034485816955566406, 0.0381622314453125, 0.041838645935058594, 0.04551506042480469, 0.04919147491455078, 0.052867889404296875, 0.05654430389404297, 0.06022071838378906, 0.06389713287353516, 0.06757354736328125, 0.07124996185302734, 0.07492637634277344, 0.07860279083251953, 0.08227920532226562, 0.08595561981201172, 0.08963203430175781, 0.0933084487915039, 0.09698486328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 4.0, 4.0, 9.0, 11.0, 33.0, 31.0, 27.0, 51.0, 86.0, 142.0, 326.0, 699.0, 2285.0, 11775.0, 837331.0, 183672.0, 8813.0, 1902.0, 602.0, 294.0, 145.0, 93.0, 61.0, 32.0, 31.0, 23.0, 16.0, 9.0, 7.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.28577423095703125, -0.2751617431640625, -0.26454925537109375, -0.253936767578125, -0.24332427978515625, -0.2327117919921875, -0.22209930419921875, -0.21148681640625, -0.20087432861328125, -0.1902618408203125, -0.17964935302734375, -0.169036865234375, -0.15842437744140625, -0.1478118896484375, -0.13719940185546875, -0.1265869140625, -0.11597442626953125, -0.1053619384765625, -0.09474945068359375, -0.084136962890625, -0.07352447509765625, -0.0629119873046875, -0.05229949951171875, -0.04168701171875, -0.03107452392578125, -0.0204620361328125, -0.00984954833984375, 0.000762939453125, 0.01137542724609375, 0.0219879150390625, 0.03260040283203125, 0.043212890625, 0.05382537841796875, 0.0644378662109375, 0.07505035400390625, 0.085662841796875, 0.09627532958984375, 0.1068878173828125, 0.11750030517578125, 0.12811279296875, 0.13872528076171875, 0.1493377685546875, 0.15995025634765625, 0.170562744140625, 0.18117523193359375, 0.1917877197265625, 0.20240020751953125, 0.2130126953125, 0.22362518310546875, 0.2342376708984375, 0.24485015869140625, 0.255462646484375, 0.26607513427734375, 0.2766876220703125, 0.28730010986328125, 0.29791259765625, 0.30852508544921875, 0.3191375732421875, 0.32975006103515625, 0.340362548828125, 0.35097503662109375, 0.3615875244140625, 0.37220001220703125, 0.3828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 5.0, 4.0, 6.0, 5.0, 12.0, 9.0, 15.0, 20.0, 24.0, 25.0, 33.0, 34.0, 61.0, 67.0, 89.0, 91.0, 73.0, 84.0, 57.0, 57.0, 33.0, 35.0, 27.0, 24.0, 21.0, 15.0, 11.0, 10.0, 13.0, 8.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.413818359375, -0.40030670166015625, -0.3867950439453125, -0.37328338623046875, -0.359771728515625, -0.34626007080078125, -0.3327484130859375, -0.31923675537109375, -0.30572509765625, -0.29221343994140625, -0.2787017822265625, -0.26519012451171875, -0.251678466796875, -0.23816680908203125, -0.2246551513671875, -0.21114349365234375, -0.1976318359375, -0.18412017822265625, -0.1706085205078125, -0.15709686279296875, -0.143585205078125, -0.13007354736328125, -0.1165618896484375, -0.10305023193359375, -0.08953857421875, -0.07602691650390625, -0.0625152587890625, -0.04900360107421875, -0.035491943359375, -0.02198028564453125, -0.0084686279296875, 0.00504302978515625, 0.0185546875, 0.03206634521484375, 0.0455780029296875, 0.05908966064453125, 0.072601318359375, 0.08611297607421875, 0.0996246337890625, 0.11313629150390625, 0.12664794921875, 0.14015960693359375, 0.1536712646484375, 0.16718292236328125, 0.180694580078125, 0.19420623779296875, 0.2077178955078125, 0.22122955322265625, 0.2347412109375, 0.24825286865234375, 0.2617645263671875, 0.27527618408203125, 0.288787841796875, 0.30229949951171875, 0.3158111572265625, 0.32932281494140625, 0.34283447265625, 0.35634613037109375, 0.3698577880859375, 0.38336944580078125, 0.396881103515625, 0.41039276123046875, 0.4239044189453125, 0.43741607666015625, 0.450927734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 1.0, 3.0, 7.0, 5.0, 4.0, 9.0, 8.0, 18.0, 17.0, 25.0, 46.0, 52.0, 86.0, 170.0, 341.0, 802.0, 2879.0, 23319.0, 995646.0, 20802.0, 2728.0, 802.0, 343.0, 180.0, 97.0, 53.0, 35.0, 25.0, 17.0, 15.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06268310546875, -0.059622764587402344, -0.05656242370605469, -0.05350208282470703, -0.050441741943359375, -0.04738140106201172, -0.04432106018066406, -0.041260719299316406, -0.03820037841796875, -0.035140037536621094, -0.03207969665527344, -0.02901935577392578, -0.025959014892578125, -0.02289867401123047, -0.019838333129882812, -0.016777992248535156, -0.0137176513671875, -0.010657310485839844, -0.0075969696044921875, -0.004536628723144531, -0.001476287841796875, 0.0015840530395507812, 0.0046443939208984375, 0.007704734802246094, 0.01076507568359375, 0.013825416564941406, 0.016885757446289062, 0.01994609832763672, 0.023006439208984375, 0.02606678009033203, 0.029127120971679688, 0.032187461853027344, 0.035247802734375, 0.038308143615722656, 0.04136848449707031, 0.04442882537841797, 0.047489166259765625, 0.05054950714111328, 0.05360984802246094, 0.056670188903808594, 0.05973052978515625, 0.0627908706665039, 0.06585121154785156, 0.06891155242919922, 0.07197189331054688, 0.07503223419189453, 0.07809257507324219, 0.08115291595458984, 0.0842132568359375, 0.08727359771728516, 0.09033393859863281, 0.09339427947998047, 0.09645462036132812, 0.09951496124267578, 0.10257530212402344, 0.1056356430053711, 0.10869598388671875, 0.1117563247680664, 0.11481666564941406, 0.11787700653076172, 0.12093734741210938, 0.12399768829345703, 0.1270580291748047, 0.13011837005615234, 0.1331787109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 5.0, 9.0, 6.0, 18.0, 8.0, 14.0, 14.0, 23.0, 24.0, 29.0, 36.0, 38.0, 50.0, 61.0, 49.0, 60.0, 56.0, 67.0, 61.0, 64.0, 56.0, 32.0, 33.0, 21.0, 20.0, 20.0, 14.0, 18.0, 16.0, 9.0, 12.0, 3.0, 11.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.537799835205078e-05, -1.4892779290676117e-05, -1.4407560229301453e-05, -1.3922341167926788e-05, -1.3437122106552124e-05, -1.295190304517746e-05, -1.2466683983802795e-05, -1.1981464922428131e-05, -1.1496245861053467e-05, -1.1011026799678802e-05, -1.0525807738304138e-05, -1.0040588676929474e-05, -9.55536961555481e-06, -9.070150554180145e-06, -8.584931492805481e-06, -8.099712431430817e-06, -7.614493370056152e-06, -7.129274308681488e-06, -6.644055247306824e-06, -6.1588361859321594e-06, -5.673617124557495e-06, -5.188398063182831e-06, -4.7031790018081665e-06, -4.217959940433502e-06, -3.732740879058838e-06, -3.2475218176841736e-06, -2.7623027563095093e-06, -2.277083694934845e-06, -1.7918646335601807e-06, -1.3066455721855164e-06, -8.21426510810852e-07, -3.3620744943618774e-07, 1.4901161193847656e-07, 6.342306733131409e-07, 1.1194497346878052e-06, 1.6046687960624695e-06, 2.089887857437134e-06, 2.575106918811798e-06, 3.0603259801864624e-06, 3.5455450415611267e-06, 4.030764102935791e-06, 4.515983164310455e-06, 5.00120222568512e-06, 5.486421287059784e-06, 5.971640348434448e-06, 6.4568594098091125e-06, 6.942078471183777e-06, 7.427297532558441e-06, 7.912516593933105e-06, 8.39773565530777e-06, 8.882954716682434e-06, 9.368173778057098e-06, 9.853392839431763e-06, 1.0338611900806427e-05, 1.0823830962181091e-05, 1.1309050023555756e-05, 1.179426908493042e-05, 1.2279488146305084e-05, 1.2764707207679749e-05, 1.3249926269054413e-05, 1.3735145330429077e-05, 1.4220364391803741e-05, 1.4705583453178406e-05, 1.519080251455307e-05, 1.5676021575927734e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 10.0, 15.0, 18.0, 22.0, 56.0, 85.0, 147.0, 286.0, 506.0, 1249.0, 3157.0, 11638.0, 317289.0, 696681.0, 11765.0, 3135.0, 1248.0, 587.0, 271.0, 159.0, 72.0, 48.0, 32.0, 22.0, 17.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0880126953125, -0.08563423156738281, -0.08325576782226562, -0.08087730407714844, -0.07849884033203125, -0.07612037658691406, -0.07374191284179688, -0.07136344909667969, -0.0689849853515625, -0.06660652160644531, -0.06422805786132812, -0.06184959411621094, -0.05947113037109375, -0.05709266662597656, -0.054714202880859375, -0.05233573913574219, -0.049957275390625, -0.04757881164550781, -0.045200347900390625, -0.04282188415527344, -0.04044342041015625, -0.03806495666503906, -0.035686492919921875, -0.03330802917480469, -0.0309295654296875, -0.028551101684570312, -0.026172637939453125, -0.023794174194335938, -0.02141571044921875, -0.019037246704101562, -0.016658782958984375, -0.014280319213867188, -0.01190185546875, -0.009523391723632812, -0.007144927978515625, -0.0047664642333984375, -0.00238800048828125, -9.5367431640625e-06, 0.002368927001953125, 0.0047473907470703125, 0.0071258544921875, 0.009504318237304688, 0.011882781982421875, 0.014261245727539062, 0.01663970947265625, 0.019018173217773438, 0.021396636962890625, 0.023775100708007812, 0.026153564453125, 0.028532028198242188, 0.030910491943359375, 0.03328895568847656, 0.03566741943359375, 0.03804588317871094, 0.040424346923828125, 0.04280281066894531, 0.0451812744140625, 0.04755973815917969, 0.049938201904296875, 0.05231666564941406, 0.05469512939453125, 0.05707359313964844, 0.059452056884765625, 0.06183052062988281, 0.064208984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 10.0, 22.0, 34.0, 53.0, 137.0, 425.0, 175.0, 66.0, 38.0, 15.0, 9.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1197509765625, -0.11656665802001953, -0.11338233947753906, -0.1101980209350586, -0.10701370239257812, -0.10382938385009766, -0.10064506530761719, -0.09746074676513672, -0.09427642822265625, -0.09109210968017578, -0.08790779113769531, -0.08472347259521484, -0.08153915405273438, -0.0783548355102539, -0.07517051696777344, -0.07198619842529297, -0.0688018798828125, -0.06561756134033203, -0.06243324279785156, -0.059248924255371094, -0.056064605712890625, -0.052880287170410156, -0.04969596862792969, -0.04651165008544922, -0.04332733154296875, -0.04014301300048828, -0.03695869445800781, -0.033774375915527344, -0.030590057373046875, -0.027405738830566406, -0.024221420288085938, -0.02103710174560547, -0.017852783203125, -0.014668464660644531, -0.011484146118164062, -0.008299827575683594, -0.005115509033203125, -0.0019311904907226562, 0.0012531280517578125, 0.004437446594238281, 0.00762176513671875, 0.010806083679199219, 0.013990402221679688, 0.017174720764160156, 0.020359039306640625, 0.023543357849121094, 0.026727676391601562, 0.02991199493408203, 0.0330963134765625, 0.03628063201904297, 0.03946495056152344, 0.042649269104003906, 0.045833587646484375, 0.049017906188964844, 0.05220222473144531, 0.05538654327392578, 0.05857086181640625, 0.06175518035888672, 0.06493949890136719, 0.06812381744384766, 0.07130813598632812, 0.0744924545288086, 0.07767677307128906, 0.08086109161376953, 0.08404541015625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 16.0, 32.0, 66.0, 338.0, 403.0, 63.0, 35.0, 24.0, 11.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.347710132598877, -1.2685073614120483, -1.1893044710159302, -1.1101016998291016, -1.0308988094329834, -0.9516960382461548, -0.8724932670593262, -0.7932904362678528, -0.7140876054763794, -0.634884774684906, -0.5556819438934326, -0.476479172706604, -0.3972763419151306, -0.3180735111236572, -0.23887071013450623, -0.15966790914535522, -0.08046507835388184, -0.0012622624635696411, 0.07794055342674255, 0.15714336931705475, 0.23634618520736694, 0.31554901599884033, 0.39475181698799133, 0.47395461797714233, 0.5531574487686157, 0.6323602795600891, 0.7115631103515625, 0.7907658815383911, 0.8699687123298645, 0.9491715431213379, 1.0283743143081665, 1.1075770854949951, 1.1867802143096924, 1.265982985496521, 1.3451858758926392, 1.4243886470794678, 1.503591537475586, 1.5827943086624146, 1.6619970798492432, 1.7411999702453613, 1.82040274143219, 1.8996055126190186, 1.9788084030151367, 2.058011293411255, 2.137213945388794, 2.216416835784912, 2.2956197261810303, 2.3748223781585693, 2.4540252685546875, 2.5332281589508057, 2.6124308109283447, 2.691633701324463, 2.770836591720581, 2.850039482116699, 2.9292421340942383, 3.0084450244903564, 3.0876479148864746, 3.1668508052825928, 3.246053457260132, 3.32525634765625, 3.404459238052368, 3.4836621284484863, 3.5628647804260254, 3.6420676708221436, 3.7212703227996826]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 10.0, 7.0, 11.0, 11.0, 18.0, 21.0, 10.0, 21.0, 25.0, 24.0, 30.0, 29.0, 245.0, 241.0, 31.0, 32.0, 45.0, 27.0, 30.0, 14.0, 13.0, 18.0, 12.0, 8.0, 12.0, 4.0, 7.0, 5.0, 11.0, 8.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3713531494140625, -1.3284969329833984, -1.2856407165527344, -1.2427845001220703, -1.1999282836914062, -1.1570720672607422, -1.1142158508300781, -1.071359634399414, -1.02850341796875, -0.9856472015380859, -0.9427909851074219, -0.8999347686767578, -0.8570785522460938, -0.8142223358154297, -0.7713661789894104, -0.7285099625587463, -0.685653805732727, -0.642797589302063, -0.5999413728713989, -0.5570851564407349, -0.5142289400100708, -0.4713727533817291, -0.42851656675338745, -0.3856603503227234, -0.3428041338920593, -0.29994791746139526, -0.2570917010307312, -0.21423551440238953, -0.17137929797172546, -0.1285230815410614, -0.08566689491271973, -0.042810678482055664, 4.553794860839844e-05, 0.042901746928691864, 0.08575795590877533, 0.1286141574382782, 0.17147037386894226, 0.21432659029960632, 0.257182776927948, 0.30003899335861206, 0.3428952097892761, 0.3857514262199402, 0.42860764265060425, 0.4714638292789459, 0.5143200159072876, 0.5571762323379517, 0.6000324487686157, 0.6428886651992798, 0.6857448816299438, 0.7286010980606079, 0.771457314491272, 0.814313530921936, 0.8571697473526001, 0.9000259637832642, 0.9428821206092834, 0.9857383370399475, 1.0285944938659668, 1.0714507102966309, 1.114306926727295, 1.157163143157959, 1.200019359588623, 1.242875576019287, 1.2857317924499512, 1.3285880088806152, 1.3714442253112793]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 8.0, 12.0, 27.0, 18.0, 47.0, 54.0, 71.0, 327.0, 171.0, 77.0, 56.0, 42.0, 28.0, 27.0, 11.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2008056640625, -0.19520187377929688, -0.18959808349609375, -0.18399429321289062, -0.1783905029296875, -0.17278671264648438, -0.16718292236328125, -0.16157913208007812, -0.155975341796875, -0.15037155151367188, -0.14476776123046875, -0.13916397094726562, -0.1335601806640625, -0.12795639038085938, -0.12235260009765625, -0.11674880981445312, -0.11114501953125, -0.10554122924804688, -0.09993743896484375, -0.09433364868164062, -0.0887298583984375, -0.08312606811523438, -0.07752227783203125, -0.07191848754882812, -0.066314697265625, -0.060710906982421875, -0.05510711669921875, -0.049503326416015625, -0.0438995361328125, -0.038295745849609375, -0.03269195556640625, -0.027088165283203125, -0.021484375, -0.015880584716796875, -0.01027679443359375, -0.004673004150390625, 0.0009307861328125, 0.006534576416015625, 0.01213836669921875, 0.017742156982421875, 0.023345947265625, 0.028949737548828125, 0.03455352783203125, 0.040157318115234375, 0.0457611083984375, 0.051364898681640625, 0.05696868896484375, 0.06257247924804688, 0.06817626953125, 0.07378005981445312, 0.07938385009765625, 0.08498764038085938, 0.0905914306640625, 0.09619522094726562, 0.10179901123046875, 0.10740280151367188, 0.113006591796875, 0.11861038208007812, 0.12421417236328125, 0.12981796264648438, 0.1354217529296875, 0.14102554321289062, 0.14662933349609375, 0.15223312377929688, 0.1578369140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 21.0, 8.0, 11.0, 20.0, 31.0, 50.0, 40.0, 55.0, 99.0, 170.0, 346.0, 634.0, 1542.0, 4928.0, 63582.0, 8304330.0, 8569.0, 2194.0, 901.0, 406.0, 205.0, 146.0, 82.0, 48.0, 57.0, 35.0, 30.0, 14.0, 12.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841816782951355, -0.8171857595443726, -0.7925547361373901, -0.7679237127304077, -0.7432927489280701, -0.7186617255210876, -0.6940307021141052, -0.6693996787071228, -0.6447687149047852, -0.6201376914978027, -0.5955066680908203, -0.5708756446838379, -0.5462446808815002, -0.5216136574745178, -0.4969826340675354, -0.472351610660553, -0.44772058725357056, -0.42308956384658813, -0.3984585702419281, -0.3738275468349457, -0.34919655323028564, -0.3245655298233032, -0.2999345064163208, -0.2753034830093384, -0.25067248940467834, -0.22604148089885712, -0.2014104723930359, -0.17677944898605347, -0.15214844048023224, -0.127517431974411, -0.10288640856742859, -0.07825540006160736, -0.05362439155578613, -0.028993379324674606, -0.00436236709356308, 0.020268648862838745, 0.04489965736865997, 0.0695306658744812, 0.09416168928146362, 0.11879269778728485, 0.14342370629310608, 0.1680547147989273, 0.19268572330474854, 0.21731674671173096, 0.24194775521755219, 0.2665787637233734, 0.29120978713035583, 0.31584078073501587, 0.3404718041419983, 0.3651028275489807, 0.38973382115364075, 0.41436484456062317, 0.4389958381652832, 0.4636268615722656, 0.48825788497924805, 0.5128889083862305, 0.5375199317932129, 0.5621509552001953, 0.5867819786071777, 0.6114130020141602, 0.6360439658164978, 0.6606749892234802, 0.6853060126304626, 0.7099370360374451, 0.7345679998397827]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 10.0, 2.0, 7.0, 1.0, 4.0, 9.0, 4.0, 6.0, 2.0, 2.0, 9.0, 4.0, 4.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.8215011954307556, -0.7937370538711548, -0.765972912311554, -0.7382087707519531, -0.7104446887969971, -0.6826804876327515, -0.6549164056777954, -0.6271522641181946, -0.5993881225585938, -0.5716239809989929, -0.5438598394393921, -0.5160956978797913, -0.4883315861225128, -0.460567444562912, -0.43280333280563354, -0.4050391912460327, -0.3772750496864319, -0.34951090812683105, -0.3217467665672302, -0.2939826548099518, -0.26621851325035095, -0.23845437169075012, -0.21069024503231049, -0.18292611837387085, -0.15516197681427002, -0.1273978352546692, -0.09963370859622955, -0.07186957448720932, -0.04410544037818909, -0.016341298818588257, 0.01142282783985138, 0.039186954498291016, 0.06695115566253662, 0.09471528977155685, 0.12247942388057709, 0.15024355053901672, 0.17800769209861755, 0.20577183365821838, 0.23353596031665802, 0.26130008697509766, 0.2890642285346985, 0.3168283700942993, 0.34459251165390015, 0.3723566234111786, 0.4001207649707794, 0.42788490653038025, 0.4556490182876587, 0.4834131598472595, 0.5111773014068604, 0.5389414429664612, 0.566705584526062, 0.5944697260856628, 0.6222338676452637, 0.6499979496002197, 0.6777620911598206, 0.7055262327194214, 0.7332903742790222, 0.761054515838623, 0.7888186573982239, 0.8165827989578247, 0.8443468809127808, 0.8721110820770264, 0.8998751640319824, 0.9276393055915833, 0.9554034471511841]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 9.0, 3.0, 6.0, 11.0, 10.0, 29.0, 38.0, 44.0, 62.0, 96.0, 123.0, 201.0, 353.0, 549.0, 996.0, 1704.0, 3678.0, 8134.0, 22030.0, 75637.0, 242926.0, 117024.0, 30139.0, 10424.0, 4325.0, 2281.0, 1221.0, 720.0, 428.0, 310.0, 205.0, 135.0, 107.0, 75.0, 50.0, 45.0, 28.0, 27.0, 23.0, 18.0, 8.0, 4.0, 5.0, 10.0, 0.0, 3.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6826171875, -0.6579360961914062, -0.6332550048828125, -0.6085739135742188, -0.583892822265625, -0.5592117309570312, -0.5345306396484375, -0.5098495483398438, -0.48516845703125, -0.46048736572265625, -0.4358062744140625, -0.41112518310546875, -0.386444091796875, -0.36176300048828125, -0.3370819091796875, -0.31240081787109375, -0.2877197265625, -0.26303863525390625, -0.2383575439453125, -0.21367645263671875, -0.188995361328125, -0.16431427001953125, -0.1396331787109375, -0.11495208740234375, -0.09027099609375, -0.06558990478515625, -0.0409088134765625, -0.01622772216796875, 0.008453369140625, 0.03313446044921875, 0.0578155517578125, 0.08249664306640625, 0.107177734375, 0.13185882568359375, 0.1565399169921875, 0.18122100830078125, 0.205902099609375, 0.23058319091796875, 0.2552642822265625, 0.27994537353515625, 0.30462646484375, 0.32930755615234375, 0.3539886474609375, 0.37866973876953125, 0.403350830078125, 0.42803192138671875, 0.4527130126953125, 0.47739410400390625, 0.5020751953125, 0.5267562866210938, 0.5514373779296875, 0.5761184692382812, 0.600799560546875, 0.6254806518554688, 0.6501617431640625, 0.6748428344726562, 0.69952392578125, 0.7242050170898438, 0.7488861083984375, 0.7735671997070312, 0.798248291015625, 0.8229293823242188, 0.8476104736328125, 0.8722915649414062, 0.89697265625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 7.0, 14.0, 19.0, 25.0, 31.0, 41.0, 50.0, 63.0, 81.0, 88.0, 81.0, 86.0, 81.0, 68.0, 52.0, 35.0, 32.0, 26.0, 25.0, 19.0, 12.0, 11.0, 8.0, 4.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13363265991210938, -0.12957000732421875, -0.12550735473632812, -0.1214447021484375, -0.11738204956054688, -0.11331939697265625, -0.10925674438476562, -0.105194091796875, -0.10113143920898438, -0.09706878662109375, -0.09300613403320312, -0.0889434814453125, -0.08488082885742188, -0.08081817626953125, -0.07675552368164062, -0.07269287109375, -0.06863021850585938, -0.06456756591796875, -0.060504913330078125, -0.0564422607421875, -0.052379608154296875, -0.04831695556640625, -0.044254302978515625, -0.040191650390625, -0.036128997802734375, -0.03206634521484375, -0.028003692626953125, -0.0239410400390625, -0.019878387451171875, -0.01581573486328125, -0.011753082275390625, -0.0076904296875, -0.003627777099609375, 0.00043487548828125, 0.004497528076171875, 0.0085601806640625, 0.012622833251953125, 0.01668548583984375, 0.020748138427734375, 0.024810791015625, 0.028873443603515625, 0.03293609619140625, 0.036998748779296875, 0.0410614013671875, 0.045124053955078125, 0.04918670654296875, 0.053249359130859375, 0.05731201171875, 0.061374664306640625, 0.06543731689453125, 0.06949996948242188, 0.0735626220703125, 0.07762527465820312, 0.08168792724609375, 0.08575057983398438, 0.089813232421875, 0.09387588500976562, 0.09793853759765625, 0.10200119018554688, 0.1060638427734375, 0.11012649536132812, 0.11418914794921875, 0.11825180053710938, 0.122314453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 13.0, 10.0, 29.0, 38.0, 48.0, 74.0, 62.0, 62.0, 41.0, 28.0, 16.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8406106233596802, -0.8140976428985596, -0.7875846028327942, -0.7610716223716736, -0.7345585823059082, -0.7080456018447876, -0.681532621383667, -0.6550195813179016, -0.628506600856781, -0.6019936203956604, -0.575480580329895, -0.5489675998687744, -0.522454559803009, -0.4959415793418884, -0.46942856907844543, -0.44291555881500244, -0.41640254855155945, -0.38988953828811646, -0.36337652802467346, -0.33686351776123047, -0.31035053730010986, -0.28383752703666687, -0.2573245167732239, -0.23081152141094208, -0.20429851114749908, -0.1777855008840561, -0.1512725055217743, -0.1247594952583313, -0.0982464924454689, -0.0717334896326065, -0.04522047936916351, -0.018707484006881714, 0.007805526256561279, 0.034318529069423676, 0.06083153560757637, 0.08734454214572906, 0.11385754495859146, 0.14037054777145386, 0.16688355803489685, 0.19339655339717865, 0.21990956366062164, 0.24642257392406464, 0.27293556928634644, 0.29944857954978943, 0.3259615898132324, 0.352474570274353, 0.3789876103401184, 0.405500590801239, 0.432013601064682, 0.458526611328125, 0.485039621591568, 0.511552631855011, 0.5380656123161316, 0.564578652381897, 0.5910916328430176, 0.6176046133041382, 0.6441176533699036, 0.6706306338310242, 0.6971436738967896, 0.7236566543579102, 0.7501696944236755, 0.7766826748847961, 0.8031957149505615, 0.8297086954116821, 0.8562216758728027]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 8.0, 14.0, 34.0, 61.0, 92.0, 98.0, 53.0, 42.0, 14.0, 9.0, 8.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6522510051727295, -0.6285818815231323, -0.6049128174781799, -0.5812436938285828, -0.5575746297836304, -0.5339055061340332, -0.510236382484436, -0.48656731843948364, -0.46289822459220886, -0.4392291307449341, -0.4155600368976593, -0.3918909430503845, -0.36822181940078735, -0.34455275535583496, -0.3208836317062378, -0.297214537858963, -0.27354544401168823, -0.24987635016441345, -0.22620725631713867, -0.2025381475687027, -0.17886905372142792, -0.15519995987415314, -0.13153085112571716, -0.10786175727844238, -0.0841926634311676, -0.060523565858602524, -0.036854468286037445, -0.013185366988182068, 0.010483726859092712, 0.03415282070636749, 0.05782192945480347, 0.08149102330207825, 0.10516011714935303, 0.1288292109966278, 0.1524983048439026, 0.17616741359233856, 0.19983650743961334, 0.22350560128688812, 0.2471747100353241, 0.2708438038825989, 0.29451289772987366, 0.31818199157714844, 0.3418510854244232, 0.365520179271698, 0.38918930292129517, 0.41285836696624756, 0.4365274906158447, 0.4601965844631195, 0.4838656783103943, 0.5075348019599915, 0.5312038660049438, 0.554872989654541, 0.5785420536994934, 0.6022111773490906, 0.625880241394043, 0.6495493650436401, 0.6732184886932373, 0.6968876123428345, 0.7205566763877869, 0.744225800037384, 0.7678948640823364, 0.7915639877319336, 0.8152331113815308, 0.8389021754264832, 0.8625712394714355]}, "train/train_runtime": 5180.8925, "train/train_samples_per_second": 5.508, "train/train_steps_per_second": 0.086, "train/total_flos": 0.0, "train/train_loss": 4.375692403904526, "eval/loss": 4.211044788360596, "eval/wer": 2.02631892106307, "eval/runtime": 1133.2799, "eval/samples_per_second": 2.331, "eval/steps_per_second": 0.292, "_wandb": {"runtime": 6671}} \ No newline at end of file